% Bibliography entries bb205700 .. bb205799 (video classification/retrieval and
% audio-visual analysis). Each entry records its origin in the BIBSOURCE field,
% which standard styles ignore.
%
% Conventions used in this section:
%   - Venue and journal names (ICIP05, MultMed, US_Patent, ...) are unquoted string
%     macros. Their definitions are not part of this section; presumably they are
%     declared elsewhere in the database -- verify before using this section alone.
%   - Page ranges use "--"; a leading "III:" / "Vol I:" is the proceedings volume.
%   - Months use the standard three-letter month macros (jan .. dec), unquoted.
%   - Acronyms and proper nouns in titles are brace-protected so that styles which
%     sentence-case titles do not lowercase them.

@inproceedings{bb205700,
  AUTHOR    = "Gillespie, W.J. and Nguyen, D.T.",
  TITLE     = "Video Classification Using a Tree-Based {RBF} Network",
  BOOKTITLE = ICIP05,
  YEAR      = "2005",
  PAGES     = "III: 465--468",
  BIBSOURCE = "http://www.visionbib.com/bibliography/applicat822.html#TT200807"
}

@inproceedings{bb205701,
  AUTHOR    = "Tweed, D. and Fisher, R.B. and Bins, J. and List, T.",
  TITLE     = "Efficient Hidden Semi-{Markov} Model Inference for Structured Video Sequences",
  BOOKTITLE = PETS05,
  YEAR      = "2005",
  PAGES     = "247--254",
  BIBSOURCE = "http://www.visionbib.com/bibliography/applicat822.html#TT200808"
}

@inproceedings{bb205702,
  AUTHOR    = "Leung, R. and Taubman, D.S.",
  TITLE     = "Impact of Motion on the Random Access Efficiency of Scalable Compressed Video",
  BOOKTITLE = ICIP05,
  YEAR      = "2005",
  PAGES     = "III: 169--172",
  BIBSOURCE = "http://www.visionbib.com/bibliography/applicat822.html#TT200809"
}

@inproceedings{bb205703,
  AUTHOR    = "Divakaran, A. and Vetro, A. and Sun, H.F.",
  TITLE     = "Method for representing and comparing multimedia content according to rank",
  BOOKTITLE = US_Patent,
  YEAR      = "2008",
  BIBSOURCE = "http://www.visionbib.com/bibliography/applicat822.html#TT200810"
}

@inproceedings{bb205704,
  AUTHOR    = "Xie, L.X. and Chang, S.F. and Divakaran, A. and Sun, H.F.",
  TITLE     = "Mining Statistical Video Structures",
  BOOKTITLE = VideoMining03,
  YEAR      = "2003",
  PAGES     = "Chapter 10",
  BIBSOURCE = "http://www.visionbib.com/bibliography/applicat822.html#TT200811"
}

@inproceedings{bb205705,
  AUTHOR    = "Samson, V. and Bouthemy, P.",
  TITLE     = "Learning classes for video interpretation with a robust parallel clustering method",
  BOOKTITLE = ICPR04,
  YEAR      = "2004",
  PAGES     = "IV: 569--572",
  BIBSOURCE = "http://www.visionbib.com/bibliography/applicat822.html#TT200812"
}

@inproceedings{bb205706,
  AUTHOR    = "Satoh, S.",
  TITLE     = "Generalized Histogram: Empirical Optimization of Low Dimensional Features for Image Matching",
  BOOKTITLE = ECCV04,
  YEAR      = "2004",
  PAGES     = "Vol III: 210--223",
  BIBSOURCE = "http://www.visionbib.com/bibliography/applicat822.html#TT200813"
}

@inproceedings{bb205707,
  AUTHOR    = "Teraguchi, M. and Masumitsu, K. and Echigo, T. and Sekiguchi, S. and Etoh, M.",
  TITLE     = "Rapid generation of event-based indexes for personalized video digests",
  BOOKTITLE = ICPR02,
  YEAR      = "2002",
  PAGES     = "II: 1041--1044",
  BIBSOURCE = "http://www.visionbib.com/bibliography/applicat822.html#TT200814"
}

@inproceedings{bb205708,
  AUTHOR    = "Park, S. and Golshani, P.",
  TITLE     = "Video Composition and Retrieval",
  BOOKTITLE = ICME00,
  YEAR      = "2000",
  PAGES     = "TP11",
  BIBSOURCE = "http://www.visionbib.com/bibliography/applicat822.html#TT200815"
}

@inproceedings{bb205709,
  AUTHOR    = "Loui, A.C. and Savakis, A.E.",
  TITLE     = "Automatic image event segmentation and quality screening for albuming applications",
  BOOKTITLE = ICME00,
  YEAR      = "2000",
  PAGES     = "TP10",
  BIBSOURCE = "http://www.visionbib.com/bibliography/applicat822.html#TT200816"
}

@inproceedings{bb205710,
  AUTHOR    = "Kurokawa, M.",
  TITLE     = "Representation and Retrieval of Video Scene by Using Object Actions and Their Spatio-temporal Relationships",
  BOOKTITLE = ICIP99,
  YEAR      = "1999",
  PAGES     = "II:86--90",
  BIBSOURCE = "http://www.visionbib.com/bibliography/applicat822.html#TT200817"
}

@inproceedings{bb205711,
  AUTHOR    = "Vinod, V.V.",
  TITLE     = "Activity Based Video Shot Retrieval and Ranking",
  BOOKTITLE = ICPR98,
  YEAR      = "1998",
  PAGES     = "Vol I: 682--684",
  BIBSOURCE = "http://www.visionbib.com/bibliography/applicat822.html#TT200818"
}

@article{bb205712,
  AUTHOR    = "Swanberg, D. and Shu, C.F. and Jain, R.C.",
  TITLE     = "Knowledge-Guided Parsing in Video Databases",
  JOURNAL   = SPIE,
  VOLUME    = "1908",
  YEAR      = "1993",
  MONTH     = feb,
  PAGES     = "13--24",
  BIBSOURCE = "http://www.visionbib.com/bibliography/applicat822.html#TT200819"
}

@article{bb205713,
  AUTHOR    = "Saraceno, C. and Leonardi, R.",
  TITLE     = "Indexing audiovisual databases through joint audio and video processing",
  JOURNAL   = IJIST,
  VOLUME    = "9",
  YEAR      = "1999",
  NUMBER    = "5",
  PAGES     = "320--331",
  BIBSOURCE = "http://www.visionbib.com/bibliography/applicat823av1.html#TT200820"
}

@inproceedings{bb205714,
  AUTHOR    = "Saraceno, C. and Leonardi, R.",
  TITLE     = "Identification of Successive Correlated Camera Shots Using Audio and Video Information",
  BOOKTITLE = ICIP97,
  YEAR      = "1997",
  PAGES     = "III: 166--169",
  BIBSOURCE = "http://www.visionbib.com/bibliography/applicat823av1.html#TT200821"
}

@inproceedings{bb205715,
  AUTHOR    = "Saraceno, C. and Leonardi, R.",
  TITLE     = "Audio-visual processing for scene change detection",
  BOOKTITLE = CIAP97,
  YEAR      = "1997",
  PAGES     = "II: 124--131",
  BIBSOURCE = "http://www.visionbib.com/bibliography/applicat823av1.html#TT200822"
}

@article{bb205716,
  AUTHOR    = "Li, D.G. and Sethi, I.K. and Dimitrova, N. and McGee, T.",
  TITLE     = "Classification of general audio data for content-based retrieval",
  JOURNAL   = PRL,
  VOLUME    = "22",
  YEAR      = "2001",
  NUMBER    = "5",
  MONTH     = apr,
  PAGES     = "533--544",
  BIBSOURCE = "http://www.visionbib.com/bibliography/applicat823av1.html#TT200823"
}

@article{bb205717,
  AUTHOR    = "Tsekeridou, S. and Pitas, I.",
  TITLE     = "Content-based video parsing and indexing based on audio-visual interaction",
  JOURNAL   = CirSysVideo,
  VOLUME    = "11",
  YEAR      = "2001",
  NUMBER    = "4",
  MONTH     = apr,
  PAGES     = "522--535",
  BIBSOURCE = "http://www.visionbib.com/bibliography/applicat823av1.html#TT200824"
}

@inproceedings{bb205718,
  AUTHOR    = "Tsekeridou, S. and Pitas, I.",
  TITLE     = "Speaker dependent video indexing based on audio-visual interaction",
  BOOKTITLE = ICIP98,
  YEAR      = "1998",
  PAGES     = "I: 358--362",
  BIBSOURCE = "http://www.visionbib.com/bibliography/applicat823av1.html#TT200825"
}

@inproceedings{bb205719,
  AUTHOR    = "Tsekeridou, S. and Krinidis, S. and Pitas, I.",
  TITLE     = "Scene Change Detection Based on Audio-Visual Analysis and Interaction",
  BOOKTITLE = "WTRCV01",
  YEAR      = "2001",
  PAGES     = "214",
  BIBSOURCE = "http://www.visionbib.com/bibliography/applicat823av1.html#TT200826"
}

@article{bb205720,
  AUTHOR    = "Kyperountas, M. and Kotropoulos, C. and Pitas, I.",
  TITLE     = "Enhanced Eigen-Audioframes for Audiovisual Scene Change Detection",
  JOURNAL   = MultMed,
  VOLUME    = "9",
  YEAR      = "2007",
  NUMBER    = "4",
  PAGES     = "785--797",
  BIBSOURCE = "http://www.visionbib.com/bibliography/applicat823av1.html#TT200827"
}

@article{bb205721,
  AUTHOR    = "Gauvain, J.L. and Lamel, L. and Adda, G.",
  TITLE     = "Audio Partitioning and Transcription for Broadcast Data Indexation",
  JOURNAL   = MultToolApp,
  VOLUME    = "14",
  YEAR      = "2001",
  NUMBER    = "2",
  MONTH     = jun,
  PAGES     = "187--200",
  BIBSOURCE = "http://www.visionbib.com/bibliography/applicat823av1.html#TT200828"
}

@article{bb205722,
  AUTHOR    = "Amir, A. and Srinivasan, S. and Efrat, A.",
  TITLE     = "Search the Audio, Browse the Video: A Generic Paradigm for Video Collections",
  JOURNAL   = JASP,
  VOLUME    = "2003",
  YEAR      = "2003",
  NUMBER    = "2",
  MONTH     = feb,
  PAGES     = "209",
  BIBSOURCE = "http://www.visionbib.com/bibliography/applicat823av1.html#TT200829"
}

@article{bb205723,
  AUTHOR    = "Beal, M.J. and Jojic, N. and Attias, H.T.",
  TITLE     = "A graphical model for audiovisual object tracking",
  JOURNAL   = PAMI,
  VOLUME    = "25",
  YEAR      = "2003",
  NUMBER    = "7",
  MONTH     = jul,
  PAGES     = "828--836",
  BIBSOURCE = "http://www.visionbib.com/bibliography/applicat823av1.html#TT200830"
}

@inproceedings{bb205724,
  AUTHOR    = "Beal, M.J. and Attias, H.T. and Jojic, N.",
  TITLE     = "Audio-Video Sensor Fusion with Probabilistic Graphical Models",
  BOOKTITLE = ECCV02,
  YEAR      = "2002",
  PAGES     = "I: 736 ff.",
  BIBSOURCE = "http://www.visionbib.com/bibliography/applicat823av1.html#TT200831"
}

@inproceedings{bb205725,
  AUTHOR    = "Wu, P. and Li, Y. and Tretter, D.",
  TITLE     = "Scalable video summarization",
  BOOKTITLE = US_Patent,
  YEAR      = "2006",
  BIBSOURCE = "http://www.visionbib.com/bibliography/applicat823av1.html#TT200832"
}

@article{bb205726,
  AUTHOR    = "Gong, Y.H.",
  TITLE     = "Summarizing Audiovisual Contents of a Video Program",
  JOURNAL   = JASP,
  VOLUME    = "2003",
  YEAR      = "2003",
  NUMBER    = "2",
  MONTH     = feb,
  PAGES     = "160",
  BIBSOURCE = "http://www.visionbib.com/bibliography/applicat823av1.html#TT200833"
}

% NOTE(review): bb205727 and bb205728 share title, venue, year and BIBSOURCE anchor
% and differ only in author order -- they look like the same patent listed twice.
% Both keys are kept because either may be cited; confirm before merging.
@inproceedings{bb205727,
  AUTHOR    = "Gong, Y.H. and Liu, X.",
  TITLE     = "Method and system for segmentation, classification, and summarization of video images",
  BOOKTITLE = US_Patent,
  YEAR      = "2006",
  BIBSOURCE = "http://www.visionbib.com/bibliography/applicat823av1.html#TT200834"
}

@inproceedings{bb205728,
  AUTHOR    = "Liu, X. and Gong, Y.H.",
  TITLE     = "Method and system for segmentation, classification, and summarization of video images",
  BOOKTITLE = US_Patent,
  YEAR      = "2006",
  BIBSOURCE = "http://www.visionbib.com/bibliography/applicat823av1.html#TT200834"
}

@inproceedings{bb205729,
  AUTHOR    = "Gong, Y.H. and Liu, X.",
  TITLE     = "Creating audio-centric, image-centric, and integrated audio-visual summaries",
  BOOKTITLE = US_Patent,
  YEAR      = "2005",
  BIBSOURCE = "http://www.visionbib.com/bibliography/applicat823av1.html#TT200835"
}

@inproceedings{bb205730,
  AUTHOR    = "Gong, Y.H. and Liu, X.",
  TITLE     = "Video Summarization using Singular Value Decomposition",
  BOOKTITLE = CVPR00,
  YEAR      = "2000",
  PAGES     = "II: 174--180",
  BIBSOURCE = "http://www.visionbib.com/bibliography/applicat823av1.html#TT200836"
}

@inproceedings{bb205731,
  AUTHOR    = "Gong, Y.H. and Liu, X.",
  TITLE     = "Video Shot Segmentation and Classification",
  BOOKTITLE = ICPR00,
  YEAR      = "2000",
  PAGES     = "Vol I: 860--863",
  BIBSOURCE = "http://www.visionbib.com/bibliography/applicat823av1.html#TT200837"
}

@article{bb205732,
  AUTHOR    = "Wang, H.L. and Divakaran, A. and Vetro, A. and Chang, S.F. and Sun, H.F.",
  TITLE     = "Survey of compressed-domain features used in audio-visual indexing and analysis",
  JOURNAL   = JVCIR,
  VOLUME    = "14",
  YEAR      = "2003",
  NUMBER    = "2",
  MONTH     = jun,
  PAGES     = "150--183",
  BIBSOURCE = "http://www.visionbib.com/bibliography/applicat823av1.html#TT200838"
}

@article{bb205733,
  AUTHOR    = "Naphade, M.R.",
  TITLE     = "On supervision and statistical learning for semantic multimedia analysis",
  JOURNAL   = JVCIR,
  VOLUME    = "15",
  YEAR      = "2004",
  NUMBER    = "3",
  MONTH     = sep,
  PAGES     = "348--369",
  BIBSOURCE = "http://www.visionbib.com/bibliography/applicat823av1.html#TT200839"
}

@article{bb205734,
  AUTHOR    = "Naphade, M.R. and Kozintsev, I.V. and Huang, T.S.",
  TITLE     = "A factor graph framework for semantic video indexing",
  JOURNAL   = CirSysVideo,
  VOLUME    = "12",
  YEAR      = "2002",
  NUMBER    = "1",
  MONTH     = jan,
  PAGES     = "40--52",
  BIBSOURCE = "http://www.visionbib.com/bibliography/applicat823av1.html#TT200840"
}

@inproceedings{bb205735,
  AUTHOR    = "Naphade, M.R. and Kozintsev, I.V. and Huang, T.S. and Ramchandran, K.",
  TITLE     = "A factor graph framework for semantic indexing and retrieval in video",
  BOOKTITLE = CBAIVL00,
  YEAR      = "2000",
  PAGES     = "35--39",
  BIBSOURCE = "http://www.visionbib.com/bibliography/applicat823av1.html#TT200841"
}

@inproceedings{bb205736,
  AUTHOR    = "Naphade, M.R. and Huang, T.S.",
  TITLE     = "Detecting Semantic Concepts Using Context and Audio/Visual Features",
  BOOKTITLE = EventVideo01,
  YEAR      = "2001",
  PAGES     = "92--98",
  BIBSOURCE = "http://www.visionbib.com/bibliography/applicat823av1.html#TT200842"
}

@inproceedings{bb205737,
  AUTHOR    = "Naphade, M.R. and Huang, T.S.",
  TITLE     = "Recognizing High-level Audio-visual Concepts Using Context",
  BOOKTITLE = ICIP01,
  YEAR      = "2001",
  PAGES     = "III: 46--49",
  BIBSOURCE = "http://www.visionbib.com/bibliography/applicat823av1.html#TT200843"
}

@inproceedings{bb205738,
  AUTHOR    = "Naphade, M.R. and Huang, T.S.",
  TITLE     = "Semantic Video Indexing Using a Probabilistic Framework",
  BOOKTITLE = ICPR00,
  YEAR      = "2000",
  PAGES     = "Vol III: 79--84",
  BIBSOURCE = "http://www.visionbib.com/bibliography/applicat823av1.html#TT200844"
}

@inproceedings{bb205739,
  AUTHOR    = "Naphade, M.R. and Huang, T.S.",
  TITLE     = "A Probabilistic Framework for Semantic Indexing and Retrieval in Video",
  BOOKTITLE = ICME00,
  YEAR      = "2000",
  PAGES     = "MP9",
  BIBSOURCE = "http://www.visionbib.com/bibliography/applicat823av1.html#TT200845"
}

@inproceedings{bb205740,
  AUTHOR    = "Naphade, M.R. and Huang, T.S.",
  TITLE     = "Inferring Semantic Concepts for Video Indexing and Retrieval",
  BOOKTITLE = ICIP00,
  YEAR      = "2000",
  PAGES     = "Vol III: 766--769",
  BIBSOURCE = "http://www.visionbib.com/bibliography/applicat823av1.html#TT200846"
}

@inproceedings{bb205741,
  AUTHOR    = "Naphade, M.R. and Kristjansson, T. and Frey, B.J. and Huang, T.S.",
  TITLE     = "Probabilistic multimedia objects (multijects): a novel approach to video indexing and retrieval in multimedia systems",
  BOOKTITLE = ICIP98,
  YEAR      = "1998",
  PAGES     = "III: 536--540",
  BIBSOURCE = "http://www.visionbib.com/bibliography/applicat823av1.html#TT200847"
}

@article{bb205742,
  AUTHOR    = "Xie, X. and Lu, L. and Jia, M. and Li, H. and Seide, F. and Ma, W.Y.",
  TITLE     = "Mobile Search With Multimodal Queries",
  JOURNAL   = PIEEE,
  VOLUME    = "96",
  YEAR      = "2008",
  NUMBER    = "4",
  MONTH     = apr,
  PAGES     = "589--601",
  BIBSOURCE = "http://www.visionbib.com/bibliography/applicat823av1.html#TT200848"
}

@article{bb205743,
  AUTHOR    = "Kiranyaz, S. and Gabbouj, M.",
  TITLE     = "Generic content-based audio indexing and retrieval framework",
  JOURNAL   = VISP,
  VOLUME    = "153",
  YEAR      = "2006",
  NUMBER    = "3",
  MONTH     = jun,
  PAGES     = "285--297",
  BIBSOURCE = "http://www.visionbib.com/bibliography/applicat823av1.html#TT200849"
}

@article{bb205744,
  AUTHOR    = "Monaci, G. and Jost, P. and Vandergheynst, P. and Mailhe, B. and Lesage, S. and Gribonval, R.",
  TITLE     = "Learning Multimodal Dictionaries",
  JOURNAL   = IP,
  VOLUME    = "16",
  YEAR      = "2007",
  NUMBER    = "9",
  MONTH     = sep,
  PAGES     = "2272--2283",
  BIBSOURCE = "http://www.visionbib.com/bibliography/applicat823av1.html#TT200850"
}

@inproceedings{bb205745,
  AUTHOR    = "Zhang, T.",
  TITLE     = "Using background audio change detection for segmenting video",
  BOOKTITLE = US_Patent,
  YEAR      = "2007",
  BIBSOURCE = "http://www.visionbib.com/bibliography/applicat823av1.html#TT200851"
}

@article{bb205746,
  AUTHOR    = "Kotti, M. and Ververidis, D. and Evangelopoulos, G. and Panagakis, I. and Kotropoulos, C. and Maragos, P. and Pitas, I.",
  TITLE     = "Audio-Assisted Movie Dialogue Detection",
  JOURNAL   = CirSysVideo,
  VOLUME    = "18",
  YEAR      = "2008",
  NUMBER    = "11",
  MONTH     = nov,
  PAGES     = "1618--1627",
  BIBSOURCE = "http://www.visionbib.com/bibliography/applicat823av1.html#TT200852"
}

@article{bb205747,
  AUTHOR    = "Cristani, M. and Bicego, M. and Murino, V.",
  TITLE     = "Audio-Visual Event Recognition in Surveillance Video Sequences",
  JOURNAL   = MultMed,
  VOLUME    = "9",
  YEAR      = "2007",
  NUMBER    = "2",
  MONTH     = feb,
  PAGES     = "257--267",
  BIBSOURCE = "http://www.visionbib.com/bibliography/applicat823av1.html#TT200853"
}

@inproceedings{bb205748,
  AUTHOR    = "Cristani, M. and Bicego, M. and Murino, V.",
  TITLE     = "Audio-Visual Foreground Extraction for Event Characterization",
  BOOKTITLE = SLAM06,
  YEAR      = "2006",
  PAGES     = "116",
  BIBSOURCE = "http://www.visionbib.com/bibliography/applicat823av1.html#TT200854"
}

@inproceedings{bb205749,
  AUTHOR    = "Cristani, M. and Bicego, M. and Murino, V.",
  TITLE     = "Audio-Video Integration for Background Modelling",
  BOOKTITLE = ECCV04,
  YEAR      = "2004",
  PAGES     = "Vol II: 202--213",
  BIBSOURCE = "http://www.visionbib.com/bibliography/applicat823av1.html#TT200855"
}

@article{bb205750,
  AUTHOR    = "Zeng, Z.H. and Tu, J.L. and Liu, M. and Huang, T.S. and Pianfetti, B. and Roth, D. and Levinson, S.",
  TITLE     = "Audio-Visual Affect Recognition",
  JOURNAL   = MultMed,
  VOLUME    = "9",
  YEAR      = "2007",
  NUMBER    = "2",
  MONTH     = feb,
  PAGES     = "424--428",
  BIBSOURCE = "http://www.visionbib.com/bibliography/applicat823av1.html#TT200856"
}

@article{bb205751,
  AUTHOR    = "Zeng, Z.H. and Tu, J.L. and Pianfetti, B.M. and Huang, T.S.",
  TITLE     = "Audio-Visual Affective Expression Recognition Through Multistream Fused {HMM}",
  JOURNAL   = MultMed,
  VOLUME    = "10",
  YEAR      = "2008",
  NUMBER    = "4",
  MONTH     = jun,
  PAGES     = "570--577",
  BIBSOURCE = "http://www.visionbib.com/bibliography/applicat823av1.html#TT200857"
}

@inproceedings{bb205752,
  AUTHOR    = "Zeng, Z.H. and Tu, J.L. and Pianfetti, B. and Liu, M. and Zhang, T. and Zhang, Z.Q. and Huang, T.S. and Levinson, S.",
  TITLE     = "Audio-Visual Affect Recognition through Multi-Stream Fused {HMM} for {HCI}",
  BOOKTITLE = CVPR05,
  YEAR      = "2005",
  PAGES     = "II: 967--972",
  BIBSOURCE = "http://www.visionbib.com/bibliography/applicat823av1.html#TT200858"
}

@article{bb205753,
  AUTHOR    = "Zhang, S.L. and Huang, Q.M. and Jiang, S. and Gao, W. and Tian, Q.",
  TITLE     = "Affective Visualization and Retrieval for Music Video",
  JOURNAL   = MultMed,
  VOLUME    = "12",
  YEAR      = "2010",
  NUMBER    = "6",
  PAGES     = "510--522",
  BIBSOURCE = "http://www.visionbib.com/bibliography/applicat823av1.html#TT200859"
}

@article{bb205754,
  AUTHOR    = "Zhang, S.L. and Tian, Q. and Hua, G. and Huang, Q.M. and Gao, W.",
  TITLE     = "Generating Descriptive Visual Words and Visual Phrases for Large-Scale Image Applications",
  JOURNAL   = IP,
  VOLUME    = "20",
  YEAR      = "2011",
  NUMBER    = "9",
  MONTH     = sep,
  PAGES     = "2664--2677",
  BIBSOURCE = "http://www.visionbib.com/bibliography/applicat823av1.html#TT200860"
}

@article{bb205755,
  AUTHOR    = "Zhang, S.L. and Tian, Q. and Huang, Q.M. and Gao, W. and Rui, Y.",
  TITLE     = "{USB}: Ultrashort Binary Descriptor for Fast Visual Matching and Retrieval",
  JOURNAL   = IP,
  VOLUME    = "23",
  YEAR      = "2014",
  NUMBER    = "8",
  MONTH     = aug,
  PAGES     = "3671--3683",
  BIBSOURCE = "http://www.visionbib.com/bibliography/applicat823av1.html#TT200861"
}

@article{bb205756,
  AUTHOR    = "Zhang, S.L. and Tian, Q. and Huang, Q.M. and Gao, W. and Rui, Y.",
  TITLE     = "Cascade Category-Aware Visual Search",
  JOURNAL   = IP,
  VOLUME    = "23",
  YEAR      = "2014",
  NUMBER    = "6",
  MONTH     = jun,
  PAGES     = "2514--2527",
  BIBSOURCE = "http://www.visionbib.com/bibliography/applicat823av1.html#TT200862"
}

@article{bb205757,
  AUTHOR    = "Irie, G. and Satou, T. and Kojima, A. and Yamasaki, T. and Aizawa, K.",
  TITLE     = "Affective Audio-Visual Words and Latent Topic Driving Model for Realizing Movie Affective Scene Classification",
  JOURNAL   = MultMed,
  VOLUME    = "12",
  YEAR      = "2010",
  NUMBER    = "6",
  PAGES     = "523--535",
  BIBSOURCE = "http://www.visionbib.com/bibliography/applicat823av1.html#TT200863"
}

% bb205758: page range unknown; the source carried only the placeholder "xx-yy",
% so the PAGES field is omitted rather than printed literally.
@article{bb205758,
  AUTHOR    = "Ibrahim, Z.A. and Ferrane, I. and Joly, P.",
  TITLE     = "A Similarity-Based Approach for Audiovisual Document Classification Using Temporal Relation Analysis",
  JOURNAL   = JIVP,
  VOLUME    = "2011",
  YEAR      = "2011",
  NUMBER    = "2011",
  BIBSOURCE = "http://www.visionbib.com/bibliography/applicat823av1.html#TT200864"
}

@inproceedings{bb205759,
  AUTHOR    = "Philippeau, J. and Pinquier, J. and Joly, P. and Carrive, J.",
  TITLE     = "Dynamic organization of audiovisual database using a user-defined similarity measure based on low-level features",
  BOOKTITLE = ICIP08,
  YEAR      = "2008",
  PAGES     = "33--36",
  BIBSOURCE = "http://www.visionbib.com/bibliography/applicat823av1.html#TT200865"
}

@inproceedings{bb205760,
  AUTHOR    = "Haidar, S. and Joly, P. and Chebaro, B.",
  TITLE     = "Style Similarity Measure for Video Documents Comparison",
  BOOKTITLE = CIVR05,
  YEAR      = "2005",
  PAGES     = "307--317",
  BIBSOURCE = "http://www.visionbib.com/bibliography/applicat823av1.html#TT200866"
}

@article{bb205761,
  AUTHOR    = "Huurnink, B. and Snoek, C.G.M. and de Rijke, M. and Smeulders, A.W.M.",
  TITLE     = "Content-Based Analysis Improves Audiovisual Archive Retrieval",
  JOURNAL   = MultMed,
  VOLUME    = "14",
  YEAR      = "2012",
  NUMBER    = "4",
  PAGES     = "1166--1178",
  BIBSOURCE = "http://www.visionbib.com/bibliography/applicat823av1.html#TT200867"
}

@inproceedings{bb205762,
  AUTHOR    = "Huurnink, B. and Snoek, C.G.M. and de Rijke, M. and Smeulders, A.W.M.",
  TITLE     = "Today's and tomorrow's retrieval practice in the audiovisual archive",
  BOOKTITLE = CIVR10,
  YEAR      = "2010",
  PAGES     = "18--25",
  BIBSOURCE = "http://www.visionbib.com/bibliography/applicat823av1.html#TT200868"
}

@inproceedings{bb205763,
  AUTHOR    = "Huurnink, B. and de Rijke, M.",
  TITLE     = "The value of stories for speech-based video search",
  BOOKTITLE = CIVR07,
  YEAR      = "2007",
  PAGES     = "266--271",
  BIBSOURCE = "http://www.visionbib.com/bibliography/applicat823av1.html#TT200869"
}

@article{bb205764,
  AUTHOR    = "Jhuo, I.H. and Ye, G.N. and Gao, S.H. and Liu, D. and Jiang, Y.G. and Lee, D.T. and Chang, S.F.",
  TITLE     = "Discovering joint audio-visual codewords for video event detection",
  JOURNAL   = MVA,
  VOLUME    = "25",
  YEAR      = "2014",
  NUMBER    = "1",
  MONTH     = jan,
  PAGES     = "33--47",
  BIBSOURCE = "http://www.visionbib.com/bibliography/applicat823av1.html#TT200870"
}

@inproceedings{bb205765,
  AUTHOR    = "Ye, G.N. and Jhuo, I.H. and Liu, D. and Jiang, Y.G. and Lee, D.T. and Chang, S.F.",
  TITLE     = "Joint audio-visual bi-modal codewords for video event detection",
  BOOKTITLE = ICMR12,
  YEAR      = "2012",
  PAGES     = "39",
  BIBSOURCE = "http://www.visionbib.com/bibliography/applicat823av1.html#TT200871"
}

@article{bb205766,
  AUTHOR    = "Feki, I. and Ben Ammar, A. and Alimi, A.M.",
  TITLE     = "Automatic environmental sound concepts discovery for video retrieval",
  JOURNAL   = MultInfoRetr,
  VOLUME    = "5",
  YEAR      = "2016",
  NUMBER    = "2",
  MONTH     = jun,
  PAGES     = "105--115",
  BIBSOURCE = "http://www.visionbib.com/bibliography/applicat823av1.html#TT200872"
}

@article{bb205767,
  AUTHOR    = "Khan, M.U.G. and Gotoh, Y.",
  TITLE     = "Generating natural language tags for video information management",
  JOURNAL   = MVA,
  VOLUME    = "28",
  YEAR      = "2017",
  NUMBER    = "3-4",
  MONTH     = may,
  PAGES     = "243--265",
  BIBSOURCE = "http://www.visionbib.com/bibliography/applicat823av1.html#TT200873"
}

@inproceedings{bb205768,
  AUTHOR    = "Khan, M.U.G. and Zhang, L. and Gotoh, Y.",
  TITLE     = "Generating coherent natural language annotations for video streams",
  BOOKTITLE = ICIP12,
  YEAR      = "2012",
  PAGES     = "2893--2896",
  BIBSOURCE = "http://www.visionbib.com/bibliography/applicat823av1.html#TT200874"
}

@inproceedings{bb205769,
  AUTHOR    = "Khan, M.U.G. and Zhang, L. and Gotoh, Y.",
  TITLE     = "Towards coherent natural language description of video streams",
  BOOKTITLE = SIG11,
  YEAR      = "2011",
  PAGES     = "664--671",
  BIBSOURCE = "http://www.visionbib.com/bibliography/applicat823av1.html#TT200875"
}

@inproceedings{bb205770,
  AUTHOR    = "Zhang, L. and Khan, M.U.G. and Gotoh, Y.",
  TITLE     = "Video scene classification based on natural language description",
  BOOKTITLE = ARTEMIS11,
  YEAR      = "2011",
  PAGES     = "942--949",
  BIBSOURCE = "http://www.visionbib.com/bibliography/applicat823av1.html#TT200876"
}

@inproceedings{bb205771,
  AUTHOR    = "Guo, X.N. and Zhong, W. and Ye, L. and Fang, L. and Heng, Y. and Zhang, Q.",
  TITLE     = "Global Affective Video Content Regression Based on Complementary Audio-visual Features",
  BOOKTITLE = MMMod20,
  YEAR      = "2020",
  PAGES     = "II:540--550",
  BIBSOURCE = "http://www.visionbib.com/bibliography/applicat823av1.html#TT200877"
}

@inproceedings{bb205772,
  AUTHOR    = "Peri, D. and Sah, S. and Ptucha, R.",
  TITLE     = "Show, Translate and Tell",
  BOOKTITLE = ICIP19,
  YEAR      = "2019",
  PAGES     = "295--299",
  BIBSOURCE = "http://www.visionbib.com/bibliography/applicat823av1.html#TT200878"
}

@inproceedings{bb205773,
  AUTHOR    = "Chen, K. and Zhang, C.X. and Fang, C. and Wang, Z.W. and Bui, T. and Nevatia, R.",
  TITLE     = "Visually Indicated Sound Generation by Perceptually Optimized Classification",
  BOOKTITLE = MultLearnApp18,
  YEAR      = "2018",
  PAGES     = "VI:560--574",
  BIBSOURCE = "http://www.visionbib.com/bibliography/applicat823av1.html#TT200879"
}

@inproceedings{bb205774,
  AUTHOR    = "Haurilet, M.L. and Tapaswi, M. and Al Halah, Z. and Stiefelhagen, R.",
  TITLE     = "Naming {TV} characters by watching and analyzing dialogs",
  BOOKTITLE = WACV16,
  YEAR      = "2016",
  PAGES     = "1--9",
  BIBSOURCE = "http://www.visionbib.com/bibliography/applicat823av1.html#TT200880"
}

@inproceedings{bb205775,
  AUTHOR    = "Numano, S. and Enami, N. and Ariki, Y.",
  TITLE     = "Task-Driven Saliency Detection on Music Video",
  BOOKTITLE = CV4AC14,
  YEAR      = "2014",
  PAGES     = "658--671",
  BIBSOURCE = "http://www.visionbib.com/bibliography/applicat823av1.html#TT200881"
}

@inproceedings{bb205776,
  AUTHOR    = "Scott, D. and Zhang, Z.X. and Albatal, R. and McGuinness, K. and Acar, E. and Hopfgartner, F. and Gurrin, C. and O'Connor, N.E. and Smeaton, A.F.",
  TITLE     = "Audio-Visual Classification Video Browser",
  BOOKTITLE = MMMod14,
  YEAR      = "2014",
  PAGES     = "II: 398--401",
  BIBSOURCE = "http://www.visionbib.com/bibliography/applicat823av1.html#TT200882"
}

@inproceedings{bb205777,
  AUTHOR    = "Lin, Y.T. and Tsai, T.H. and Hu, M.C. and Cheng, W.H. and Wu, J.L.",
  TITLE     = "Semantic Based Background Music Recommendation for Home Videos",
  BOOKTITLE = MMMod14,
  YEAR      = "2014",
  PAGES     = "II: 283--290",
  BIBSOURCE = "http://www.visionbib.com/bibliography/applicat823av1.html#TT200883"
}

@inproceedings{bb205778,
  AUTHOR    = "Shamma, D.A. and Kennedy, L. and Churchill, E.F.",
  TITLE     = "Watching and talking: media content as social nexus",
  BOOKTITLE = ICMR12,
  YEAR      = "2012",
  PAGES     = "12",
  BIBSOURCE = "http://www.visionbib.com/bibliography/applicat823av1.html#TT200884"
}

@inproceedings{bb205779,
  AUTHOR    = "Nowak, S. and Paduschek, R. and Kuhhirt, U.",
  TITLE     = "Photo summary: automated selection of representative photos from a digital collection",
  BOOKTITLE = ICMR11,
  YEAR      = "2011",
  PAGES     = "75",
  BIBSOURCE = "http://www.visionbib.com/bibliography/applicat823av1.html#TT200885"
}

@inproceedings{bb205780,
  AUTHOR    = "Paduschek, R. and Nowak, S. and Kuhhirt, U.",
  TITLE     = "Automated detection of errors and quality issues in audio-visual content",
  BOOKTITLE = ICMR11,
  YEAR      = "2011",
  PAGES     = "74",
  BIBSOURCE = "http://www.visionbib.com/bibliography/applicat823av1.html#TT200886"
}

@inproceedings{bb205781,
  AUTHOR    = "Vretos, N. and Nikolaidis, N. and Pitas, I.",
  TITLE     = "The use of Audio-Visual Description Profile in {3D} video content description",
  BOOKTITLE = "3DTV12",
  YEAR      = "2012",
  PAGES     = "1--4",
  BIBSOURCE = "http://www.visionbib.com/bibliography/applicat823av1.html#TT200887"
}

@inproceedings{bb205782,
  AUTHOR    = "Ta, A.P. and Ben, M. and Gravier, G.",
  TITLE     = "Improving Cluster Selection and Event Modeling in Unsupervised Mining for Automatic Audiovisual Video Structuring",
  BOOKTITLE = MMMod12,
  YEAR      = "2012",
  PAGES     = "529--540",
  BIBSOURCE = "http://www.visionbib.com/bibliography/applicat823av1.html#TT200888"
}

@inproceedings{bb205783,
  AUTHOR    = "Muhling, M. and Ewerth, R. and Freisleben, B.",
  TITLE     = "Improving Cross-Domain Concept Detection via Object-Based Features",
  BOOKTITLE = CAIP15,
  YEAR      = "2015",
  PAGES     = "II:359--370",
  BIBSOURCE = "http://www.visionbib.com/bibliography/applicat823av1.html#TT200889"
}

@inproceedings{bb205784,
  AUTHOR    = "Muhling, M. and Ewerth, R. and Freisleben, B.",
  TITLE     = "On the Spatial Extents of {SIFT} Descriptors for Visual Concept Detection",
  BOOKTITLE = CVS11,
  YEAR      = "2011",
  PAGES     = "71--80",
  BIBSOURCE = "http://www.visionbib.com/bibliography/applicat823av1.html#TT200890"
}

@inproceedings{bb205785,
  AUTHOR    = "Muhling, M. and Ewerth, R. and Zhou, J. and Freisleben, B.",
  TITLE     = "Multimodal Video Concept Detection via Bag of Auditory Words and Multiple Kernel Learning",
  BOOKTITLE = MMMod12,
  YEAR      = "2012",
  PAGES     = "40--50",
  BIBSOURCE = "http://www.visionbib.com/bibliography/applicat823av1.html#TT200891"
}

@inproceedings{bb205786,
  AUTHOR    = "Valio, F.B. and Pedrini, H. and Leite, N.J.",
  TITLE     = "Fast Rotation-Invariant Video Caption Detection Based on Visual Rhythm",
  BOOKTITLE = CIARP11,
  YEAR      = "2011",
  PAGES     = "157--164",
  BIBSOURCE = "http://www.visionbib.com/bibliography/applicat823av1.html#TT200892"
}

@inproceedings{bb205787,
  AUTHOR    = "Gianni, F. and Pinquier, J. and Irisa, E.K.",
  TITLE     = "{ACADI} showcase: Automatic character indexing in audiovisual document",
  BOOKTITLE = CIVR07,
  YEAR      = "2007",
  PAGES     = "109--112",
  BIBSOURCE = "http://www.visionbib.com/bibliography/applicat823av1.html#TT200893"
}

@inproceedings{bb205788,
  AUTHOR    = "Putthividhy, D. and Attias, H.T. and Nagarajan, S.S.",
  TITLE     = "Topic regression multi-modal Latent {Dirichlet} Allocation for image annotation",
  BOOKTITLE = CVPR10,
  YEAR      = "2010",
  PAGES     = "3408--3415",
  BIBSOURCE = "http://www.visionbib.com/bibliography/applicat823av1.html#TT200894"
}

@inproceedings{bb205789,
  AUTHOR    = "Jung, K.H. and Choi, S.H. and Kim, H.S. and Hur, N.H. and Kim, J.K.",
  TITLE     = "Caption insertion method for {3D} broadcasting service",
  BOOKTITLE = "3DTV10",
  YEAR      = "2010",
  PAGES     = "1--4",
  BIBSOURCE = "http://www.visionbib.com/bibliography/applicat823av1.html#TT200895"
}

% bb205790: page range unknown; the source carried only the placeholder "xx-yy",
% so the PAGES field is omitted rather than printed literally.
@inproceedings{bb205790,
  AUTHOR    = "Pramod, S.K. and Jawahar, C.V. and Zisserman, A.",
  TITLE     = "Subtitle-free Movie to Script Alignment",
  BOOKTITLE = BMVC09,
  YEAR      = "2009",
  BIBSOURCE = "http://www.visionbib.com/bibliography/applicat823av1.html#TT200896"
}

@inproceedings{bb205791,
  AUTHOR    = "Zeng, Z. and Liang, W. and Li, H.P. and Zhang, S.W.",
  TITLE     = "A Novel Video Classification Method Based on Hybrid Generative/Discriminative Models",
  BOOKTITLE = SSPR08,
  YEAR      = "2008",
  PAGES     = "705--713",
  BIBSOURCE = "http://www.visionbib.com/bibliography/applicat823av1.html#TT200897"
}

@inproceedings{bb205792,
  AUTHOR    = "Zhu, Y.Y. and Ming, Z. and Huang, Q.A.",
  TITLE     = "{SVM}-Based Audio Classification for Content-Based Multimedia Retrieval",
  BOOKTITLE = MCAM07,
  YEAR      = "2007",
  PAGES     = "474--482",
  BIBSOURCE = "http://www.visionbib.com/bibliography/applicat823av1.html#TT200898"
}

@inproceedings{bb205793,
  AUTHOR    = "Goldmann, L. and Samour, A. and Karaman, M. and Sikora, T.",
  TITLE     = "Extracting High Level Semantics by Means of Speech, Audio, and Image Primitives in Surveillance Applications",
  BOOKTITLE = ICIP06,
  YEAR      = "2006",
  PAGES     = "2397--2400",
  BIBSOURCE = "http://www.visionbib.com/bibliography/applicat823av1.html#TT200899"
}

% bb205794: page range unknown; the source carried only the placeholder "xx-yy",
% so the PAGES field is omitted rather than printed literally.
@inproceedings{bb205794,
  AUTHOR    = "Luo, J. and Caputo, B. and Zweig, A. and Bach, J.H. and Anemuller, J.",
  TITLE     = "Object Category Detection Using Audio-Visual Cues",
  BOOKTITLE = CVS08,
  YEAR      = "2008",
  BIBSOURCE = "http://www.visionbib.com/bibliography/applicat823av1.html#TT200900"
}

@inproceedings{bb205795,
  AUTHOR    = "Caputo, B. and Wallraven, C. and Nilsback, M.E.",
  TITLE     = "Object categorization via local kernels",
  BOOKTITLE = ICPR04,
  YEAR      = "2004",
  PAGES     = "II: 132--135",
  BIBSOURCE = "http://www.visionbib.com/bibliography/applicat823av1.html#TT200901"
}

@inproceedings{bb205796,
  AUTHOR    = "Schauer, C. and Gross, H.M.",
  TITLE     = "A Computational Model of Early Auditory-Visual Integration",
  BOOKTITLE = DAGM03,
  YEAR      = "2003",
  PAGES     = "362--369",
  BIBSOURCE = "http://www.visionbib.com/bibliography/applicat823av1.html#TT200902"
}

@inproceedings{bb205797,
  AUTHOR    = "Fu, T.Y. and Liu, X.X. and Liang, L.H. and Pi, X.B. and Nefian, A.V.",
  TITLE     = "A audio-visual speaker identification using coupled hidden {Markov} models",
  BOOKTITLE = ICIP03,
  YEAR      = "2003",
  PAGES     = "III: 29--32",
  BIBSOURCE = "http://www.visionbib.com/bibliography/applicat823av1.html#TT200903"
}

@inproceedings{bb205798,
  AUTHOR    = "Yemez, Y. and Kanak, A. and Erzin, E. and Tekalp, A.M.",
  TITLE     = "Multimodal speaker identification with audio-video processing",
  BOOKTITLE = ICIP03,
  YEAR      = "2003",
  PAGES     = "III: 5--8",
  BIBSOURCE = "http://www.visionbib.com/bibliography/applicat823av1.html#TT200904"
}

@inproceedings{bb205799,
  AUTHOR    = "Sugano, M. and Isaksson, R. and Nakajima, Y. and Yanagihara, H.",
  TITLE     = "Shot genre classification using compressed audio-visual features",
  BOOKTITLE = ICIP03,
  YEAR      = "2003",
  PAGES     = "II: 17--20",
  BIBSOURCE = "http://www.visionbib.com/bibliography/applicat823av1.html#TT200905"
}