@inproceedings{bb241500,
        AUTHOR = "Bai, H. L. and Wang, L. and Qin, G. and Zhang, J. W. and Tao, K. and Chang, X. F. and Dong, Y.",
        TITLE = "{TV} Program Segmentation using Multi-Modal Information Fusion",
        BOOKTITLE = ICMR11,
        YEAR = "2011",
        PAGES = "11",
        BIBSOURCE = "http://www.visionbib.com/bibliography/applicat822.html#TT236407"}

@inproceedings{bb241501,
        AUTHOR = "Xu, C. L. and Xiong, C. M. and Corso, J. J.",
        TITLE = "Streaming Hierarchical Video Segmentation",
        BOOKTITLE = ECCV12,
        VOLUME = "VI",
        YEAR = "2012",
        PAGES = "626--639",
        BIBSOURCE = "http://www.visionbib.com/bibliography/applicat822.html#TT236408"}

@inproceedings{bb241502,
        AUTHOR = "Kowdle, A. and Chen, T. H.",
        TITLE = "Learning to Segment a Video to Clips Based on Scene and Camera Motion",
        BOOKTITLE = ECCV12,
        VOLUME = "III",
        YEAR = "2012",
        PAGES = "272--286",
        BIBSOURCE = "http://www.visionbib.com/bibliography/applicat822.html#TT236409"}

@inproceedings{bb241503,
        AUTHOR = "Choi, Y. H. and Kang, S. W. and Choi, I.",
        TITLE = "{TV} program segmentation using text-visual analysis",
        BOOKTITLE = ICIP10,
        YEAR = "2010",
        PAGES = "1473--1476",
        BIBSOURCE = "http://www.visionbib.com/bibliography/applicat822.html#TT236410"}

@inproceedings{bb241504,
        AUTHOR = "Gao, Y. and Wang, T. and Li, J. G. and Du, Y. Z. and Hu, W. and Zhang, Y. M. and Ai, H. Z.",
        TITLE = "Cast indexing for videos by {NCuts} and page ranking",
        BOOKTITLE = CIVR07,
        YEAR = "2007",
        PAGES = "441--447",
        BIBSOURCE = "http://www.visionbib.com/bibliography/applicat822.html#TT236411"}

@inproceedings{bb241505,
        AUTHOR = "Ding, D. Y. and Zhang, B.",
        TITLE = "Probabilistic model supported rank aggregation for the semantic concept detection in video",
        BOOKTITLE = CIVR07,
        YEAR = "2007",
        PAGES = "587--594",
        BIBSOURCE = "http://www.visionbib.com/bibliography/applicat822.html#TT236412"}

@inproceedings{bb241506,
        AUTHOR = "Filip, J. and Haindl, M.",
        TITLE = "Fast and reliable {PCA}-based temporal segmentation of video sequences",
        BOOKTITLE = ICPR08,
        YEAR = "2008",
        PAGES = "1--4",
        BIBSOURCE = "http://www.visionbib.com/bibliography/applicat822.html#TT236413"}

@inproceedings{bb241507,
        AUTHOR = "Liu, S. Y. and Dong, G. and Yan, C. H. and Ong, S. H.",
        TITLE = "Video segmentation: Propagation, validation and aggregation of a preceding graph",
        BOOKTITLE = CVPR08,
        YEAR = "2008",
        PAGES = "1--7",
        BIBSOURCE = "http://www.visionbib.com/bibliography/applicat822.html#TT236414"}

@inproceedings{bb241508,
        AUTHOR = "Wu, W. X. and Li, J. G. and Wang, T. and Zhang, Y. M.",
        TITLE = "{Markov} chain local binary pattern and its application to video concept detection",
        BOOKTITLE = ICIP08,
        YEAR = "2008",
        PAGES = "2524--2527",
        BIBSOURCE = "http://www.visionbib.com/bibliography/applicat822.html#TT236415"}

@inproceedings{bb241509,
        AUTHOR = "Wang, P. P. and Wang, T. and Li, J. G. and Zhang, Y. M.",
        TITLE = "Information-Theoretic Content Selection for Automated Home Video Editing",
        BOOKTITLE = ICIP07,
        VOLUME = "IV",
        YEAR = "2007",
        PAGES = "537--540",
        BIBSOURCE = "http://www.visionbib.com/bibliography/applicat822.html#TT236416"}

@inproceedings{bb241510,
        AUTHOR = "Abdollahian, G. and Delp, E. J.",
        TITLE = "Finding Regions of Interest in Home Videos Based on Camera Motion",
        BOOKTITLE = ICIP07,
        VOLUME = "IV",
        YEAR = "2007",
        PAGES = "545--548",
        BIBSOURCE = "http://www.visionbib.com/bibliography/applicat822.html#TT236417"}

@inproceedings{bb241511,
        AUTHOR = "Geng, Y. L. and Xu, D. and Feng, S. H. and Yuan, J. Z.",
        TITLE = "A Robust and Hierarchical Approach for Camera Motion Classification",
        BOOKTITLE = SSPR06,
        YEAR = "2006",
        PAGES = "340--348",
        BIBSOURCE = "http://www.visionbib.com/bibliography/applicat822.html#TT236418"}

@inproceedings{bb241512,
        AUTHOR = "Cheung, S. C. S. and Nguyen, T. P.",
        TITLE = "Mining Arbitrary-Length Repeated Patterns in Television Broadcast",
        BOOKTITLE = ICIP05,
        VOLUME = "III",
        YEAR = "2005",
        PAGES = "181--184",
        BIBSOURCE = "http://www.visionbib.com/bibliography/applicat822.html#TT236419"}

@inproceedings{bb241513,
        AUTHOR = "Gillespie, W. J. and Nguyen, D. T.",
        TITLE = "Video Classification Using a Tree-Based {RBF} Network",
        BOOKTITLE = ICIP05,
        VOLUME = "III",
        YEAR = "2005",
        PAGES = "465--468",
        BIBSOURCE = "http://www.visionbib.com/bibliography/applicat822.html#TT236420"}

@inproceedings{bb241514,
        AUTHOR = "Tweed, D. and Fisher, R. B. and Bins, J. and List, T.",
        TITLE = "Efficient Hidden Semi-{Markov} Model Inference for Structured Video Sequences",
        BOOKTITLE = PETS05,
        YEAR = "2005",
        PAGES = "247--254",
        BIBSOURCE = "http://www.visionbib.com/bibliography/applicat822.html#TT236421"}

@inproceedings{bb241515,
        AUTHOR = "Leung, R. and Taubman, D. S.",
        TITLE = "Impact of Motion on the Random Access Efficiency of Scalable Compressed Video",
        BOOKTITLE = ICIP05,
        VOLUME = "III",
        YEAR = "2005",
        PAGES = "169--172",
        BIBSOURCE = "http://www.visionbib.com/bibliography/applicat822.html#TT236422"}

% Patent, not a conference paper: stored as a misc record with the
% US_Patent macro in HOWPUBLISHED instead of BOOKTITLE.
@misc{bb241516,
        AUTHOR = "Divakaran, A. and Vetro, A. and Sun, H. F.",
        TITLE = "Method for representing and comparing multimedia content according to rank",
        HOWPUBLISHED = US_Patent,
        YEAR = "2008",
        BIBSOURCE = "http://www.visionbib.com/bibliography/applicat822.html#TT236423"}

@inproceedings{bb241517,
        AUTHOR = "Xie, L. X. and Chang, S. F. and Divakaran, A. and Sun, H. F.",
        TITLE = "Mining Statistical Video Structures",
        BOOKTITLE = VideoMining03,
        YEAR = "2003",
        PAGES = "Chapter 10",
        BIBSOURCE = "http://www.visionbib.com/bibliography/applicat822.html#TT236424"}

@inproceedings{bb241518,
        AUTHOR = "Samson, V. and Bouthemy, P.",
        TITLE = "Learning classes for video interpretation with a robust parallel clustering method",
        BOOKTITLE = ICPR04,
        VOLUME = "IV",
        YEAR = "2004",
        PAGES = "569--572",
        BIBSOURCE = "http://www.visionbib.com/bibliography/applicat822.html#TT236425"}

@inproceedings{bb241519,
        AUTHOR = "Satoh, S.",
        TITLE = "Generalized Histogram: Empirical Optimization of Low Dimensional Features for Image Matching",
        BOOKTITLE = ECCV04,
        VOLUME = "III",
        YEAR = "2004",
        PAGES = "210--223",
        BIBSOURCE = "http://www.visionbib.com/bibliography/applicat822.html#TT236426"}

@inproceedings{bb241520,
  author    = {Park, S. and Golshani, P.},
  title     = {Video Composition and Retrieval},
  booktitle = ICME00,
  year      = 2000,
  pages     = {TP11},
  bibsource = {http://www.visionbib.com/bibliography/applicat822.html#TT236427}
}

@inproceedings{bb241521,
        AUTHOR = "Loui, A. C. and Savakis, A. E.",
        TITLE = "Automatic image event segmentation and quality screening for albuming applications",
        BOOKTITLE = ICME00,
        YEAR = "2000",
        PAGES = "TP10",
        BIBSOURCE = "http://www.visionbib.com/bibliography/applicat822.html#TT236428"}

@inproceedings{bb241522,
        AUTHOR = "Kurokawa, M.",
        TITLE = "Representation and Retrieval of Video Scene by Using Object Actions and Their Spatio-temporal Relationships",
        BOOKTITLE = ICIP99,
        VOLUME = "II",
        YEAR = "1999",
        PAGES = "86--90",
        BIBSOURCE = "http://www.visionbib.com/bibliography/applicat822.html#TT236429"}

@inproceedings{bb241523,
        AUTHOR = "Vinod, V. V.",
        TITLE = "Activity Based Video Shot Retrieval and Ranking",
        BOOKTITLE = ICPR98,
        VOLUME = "I",
        YEAR = "1998",
        PAGES = "682--684",
        BIBSOURCE = "http://www.visionbib.com/bibliography/applicat822.html#TT236430"}

@article{bb241524,
        AUTHOR = "Swanberg, D. and Shu, C. F. and Jain, R. C.",
        TITLE = "Knowledge-Guided Parsing in Video Databases",
        JOURNAL = SPIE,
        VOLUME = "1908",
        YEAR = "1993",
        MONTH = feb,
        PAGES = "13--24",
        BIBSOURCE = "http://www.visionbib.com/bibliography/applicat822.html#TT236431"}

@article{bb241525,
        AUTHOR = "Saraceno, C. and Leonardi, R.",
        TITLE = "Indexing audiovisual databases through joint audio and video processing",
        JOURNAL = IJIST,
        VOLUME = "9",
        YEAR = "1999",
        NUMBER = "5",
        PAGES = "320--331",
        BIBSOURCE = "http://www.visionbib.com/bibliography/applicat823av1.html#TT236432"}

@inproceedings{bb241526,
        AUTHOR = "Saraceno, C. and Leonardi, R.",
        TITLE = "Identification of Successive Correlated Camera Shots Using Audio and Video Information",
        BOOKTITLE = ICIP97,
        VOLUME = "III",
        YEAR = "1997",
        PAGES = "166--169",
        BIBSOURCE = "http://www.visionbib.com/bibliography/applicat823av1.html#TT236433"}

@inproceedings{bb241527,
        AUTHOR = "Saraceno, C. and Leonardi, R.",
        TITLE = "Audio-visual processing for scene change detection",
        BOOKTITLE = CIAP97,
        VOLUME = "II",
        YEAR = "1997",
        PAGES = "124--131",
        BIBSOURCE = "http://www.visionbib.com/bibliography/applicat823av1.html#TT236434"}

@article{bb241528,
        AUTHOR = "Li, D. G. and Sethi, I. K. and Dimitrova, N. and McGee, T.",
        TITLE = "Classification of general audio data for content-based retrieval",
        JOURNAL = PRL,
        VOLUME = "22",
        YEAR = "2001",
        NUMBER = "5",
        MONTH = apr,
        PAGES = "533--544",
        BIBSOURCE = "http://www.visionbib.com/bibliography/applicat823av1.html#TT236435"}

@article{bb241529,
        AUTHOR = "Tsekeridou, S. and Pitas, I.",
        TITLE = "Content-based video parsing and indexing based on audio-visual interaction",
        JOURNAL = CirSysVideo,
        VOLUME = "11",
        YEAR = "2001",
        NUMBER = "4",
        MONTH = apr,
        PAGES = "522--535",
        BIBSOURCE = "http://www.visionbib.com/bibliography/applicat823av1.html#TT236436"}

@inproceedings{bb241530,
        AUTHOR = "Tsekeridou, S. and Pitas, I.",
        TITLE = "Speaker dependent video indexing based on audio-visual interaction",
        BOOKTITLE = ICIP98,
        VOLUME = "I",
        YEAR = "1998",
        PAGES = "358--362",
        BIBSOURCE = "http://www.visionbib.com/bibliography/applicat823av1.html#TT236437"}

@inproceedings{bb241531,
  author    = {Tsekeridou, S. and Krinidis, S. and Pitas, I.},
  title     = {Scene Change Detection Based on Audio-Visual Analysis and Interaction},
  booktitle = {WTRCV01},
  year      = 2001,
  pages     = {214},
  bibsource = {http://www.visionbib.com/bibliography/applicat823av1.html#TT236438}
}

@article{bb241532,
        AUTHOR = "Kyperountas, M. and Kotropoulos, C. and Pitas, I.",
        TITLE = "Enhanced Eigen-Audioframes for Audiovisual Scene Change Detection",
        JOURNAL = MultMed,
        VOLUME = "9",
        YEAR = "2007",
        NUMBER = "4",
        PAGES = "785--797",
        BIBSOURCE = "http://www.visionbib.com/bibliography/applicat823av1.html#TT236439"}

@article{bb241533,
        AUTHOR = "Gauvain, J. L. and Lamel, L. and Adda, G.",
        TITLE = "Audio Partitioning and Transcription for Broadcast Data Indexation",
        JOURNAL = MultToolApp,
        VOLUME = "14",
        YEAR = "2001",
        NUMBER = "2",
        MONTH = jun,
        PAGES = "187--200",
        BIBSOURCE = "http://www.visionbib.com/bibliography/applicat823av1.html#TT236440"}

@article{bb241534,
        AUTHOR = "Amir, A. and Srinivasan, S. and Efrat, A.",
        TITLE = "Search the Audio, Browse the Video: A Generic Paradigm for Video Collections",
        JOURNAL = JASP,
        VOLUME = "2003",
        YEAR = "2003",
        NUMBER = "2",
        MONTH = feb,
        PAGES = "209",
        BIBSOURCE = "http://www.visionbib.com/bibliography/applicat823av1.html#TT236441"}

@article{bb241535,
        AUTHOR = "Beal, M. J. and Jojic, N. and Attias, H. T.",
        TITLE = "A graphical model for audiovisual object tracking",
        JOURNAL = PAMI,
        VOLUME = "25",
        YEAR = "2003",
        NUMBER = "7",
        MONTH = jul,
        PAGES = "828--836",
        BIBSOURCE = "http://www.visionbib.com/bibliography/applicat823av1.html#TT236442"}

@inproceedings{bb241536,
        AUTHOR = "Beal, M. J. and Attias, H. T. and Jojic, N.",
        TITLE = "Audio-Video Sensor Fusion with Probabilistic Graphical Models",
        BOOKTITLE = ECCV02,
        VOLUME = "I",
        YEAR = "2002",
        PAGES = "736+",
        BIBSOURCE = "http://www.visionbib.com/bibliography/applicat823av1.html#TT236443"}

% Patent, not a conference paper: stored as a misc record with the
% US_Patent macro in HOWPUBLISHED instead of BOOKTITLE.
@misc{bb241537,
        AUTHOR = "Wu, P. and Li, Y. and Tretter, D.",
        TITLE = "Scalable video summarization",
        HOWPUBLISHED = US_Patent,
        YEAR = "2006",
        BIBSOURCE = "http://www.visionbib.com/bibliography/applicat823av1.html#TT236444"}

@article{bb241538,
        AUTHOR = "Gong, Y. H.",
        TITLE = "Summarizing Audiovisual Contents of a Video Program",
        JOURNAL = JASP,
        VOLUME = "2003",
        YEAR = "2003",
        NUMBER = "2",
        MONTH = feb,
        PAGES = "160",
        BIBSOURCE = "http://www.visionbib.com/bibliography/applicat823av1.html#TT236445"}

% Patent, not a conference paper: stored as a misc record with the
% US_Patent macro in HOWPUBLISHED instead of BOOKTITLE.
% NOTE(review): bb241540 has the same title, year and BIBSOURCE anchor with
% the authors in the opposite order; likely one work under two keys.
@misc{bb241539,
        AUTHOR = "Gong, Y. H. and Liu, X.",
        TITLE = "Method and system for segmentation, classification, and summarization of video images",
        HOWPUBLISHED = US_Patent,
        YEAR = "2006",
        BIBSOURCE = "http://www.visionbib.com/bibliography/applicat823av1.html#TT236446"}

% Patent, not a conference paper: stored as a misc record with the
% US_Patent macro in HOWPUBLISHED instead of BOOKTITLE.
% NOTE(review): bb241539 has the same title, year and BIBSOURCE anchor with
% the authors in the opposite order; likely one work under two keys.
@misc{bb241540,
        AUTHOR = "Liu, X. and Gong, Y. H.",
        TITLE = "Method and system for segmentation, classification, and summarization of video images",
        HOWPUBLISHED = US_Patent,
        YEAR = "2006",
        BIBSOURCE = "http://www.visionbib.com/bibliography/applicat823av1.html#TT236446"}

% Patent, not a conference paper: stored as a misc record with the
% US_Patent macro in HOWPUBLISHED instead of BOOKTITLE.
@misc{bb241541,
        AUTHOR = "Gong, Y. H. and Liu, X.",
        TITLE = "Creating audio-centric, image-centric, and integrated audio-visual summaries",
        HOWPUBLISHED = US_Patent,
        YEAR = "2005",
        BIBSOURCE = "http://www.visionbib.com/bibliography/applicat823av1.html#TT236447"}

@inproceedings{bb241542,
        AUTHOR = "Gong, Y. H. and Liu, X.",
        TITLE = "Video Summarization using Singular Value Decomposition",
        BOOKTITLE = CVPR00,
        VOLUME = "II",
        YEAR = "2000",
        PAGES = "174--180",
        BIBSOURCE = "http://www.visionbib.com/bibliography/applicat823av1.html#TT236448"}

@inproceedings{bb241543,
        AUTHOR = "Gong, Y. H. and Liu, X.",
        TITLE = "Video Shot Segmentation and Classification",
        BOOKTITLE = ICPR00,
        VOLUME = "I",
        YEAR = "2000",
        PAGES = "860--863",
        BIBSOURCE = "http://www.visionbib.com/bibliography/applicat823av1.html#TT236449"}

@article{bb241544,
        AUTHOR = "Wang, H. L. and Divakaran, A. and Vetro, A. and Chang, S. F. and Sun, H. F.",
        TITLE = "Survey of compressed-domain features used in audio-visual indexing and analysis",
        JOURNAL = JVCIR,
        VOLUME = "14",
        YEAR = "2003",
        NUMBER = "2",
        MONTH = jun,
        PAGES = "150--183",
        BIBSOURCE = "http://www.visionbib.com/bibliography/applicat823av1.html#TT236450"}

@article{bb241545,
        AUTHOR = "Naphade, M. R.",
        TITLE = "On supervision and statistical learning for semantic multimedia analysis",
        JOURNAL = JVCIR,
        VOLUME = "15",
        YEAR = "2004",
        NUMBER = "3",
        MONTH = sep,
        PAGES = "348--369",
        BIBSOURCE = "http://www.visionbib.com/bibliography/applicat823av1.html#TT236451"}

@article{bb241546,
        AUTHOR = "Naphade, M. R. and Kozintsev, I. V. and Huang, T. S.",
        TITLE = "A factor graph framework for semantic video indexing",
        JOURNAL = CirSysVideo,
        VOLUME = "12",
        YEAR = "2002",
        NUMBER = "1",
        MONTH = jan,
        PAGES = "40--52",
        BIBSOURCE = "http://www.visionbib.com/bibliography/applicat823av1.html#TT236452"}

@inproceedings{bb241547,
        AUTHOR = "Naphade, M. R. and Kozintsev, I. V. and Huang, T. S. and Ramchandran, K.",
        TITLE = "A factor graph framework for semantic indexing and retrieval in video",
        BOOKTITLE = CBAIVL00,
        YEAR = "2000",
        PAGES = "35--39",
        BIBSOURCE = "http://www.visionbib.com/bibliography/applicat823av1.html#TT236453"}

@inproceedings{bb241548,
        AUTHOR = "Naphade, M. R. and Huang, T. S.",
        TITLE = "Detecting Semantic Concepts Using Context and Audio/Visual Features",
        BOOKTITLE = EventVideo01,
        YEAR = "2001",
        PAGES = "92--98",
        BIBSOURCE = "http://www.visionbib.com/bibliography/applicat823av1.html#TT236454"}

@inproceedings{bb241549,
        AUTHOR = "Naphade, M. R. and Huang, T. S.",
        TITLE = "Recognizing High-level Audio-visual Concepts Using Context",
        BOOKTITLE = ICIP01,
        VOLUME = "III",
        YEAR = "2001",
        PAGES = "46--49",
        BIBSOURCE = "http://www.visionbib.com/bibliography/applicat823av1.html#TT236455"}

@inproceedings{bb241550,
        AUTHOR = "Naphade, M. R. and Huang, T. S.",
        TITLE = "Semantic Video Indexing Using a Probabilistic Framework",
        BOOKTITLE = ICPR00,
        VOLUME = "III",
        YEAR = "2000",
        PAGES = "79--84",
        BIBSOURCE = "http://www.visionbib.com/bibliography/applicat823av1.html#TT236456"}

@inproceedings{bb241551,
        AUTHOR = "Naphade, M. R. and Huang, T. S.",
        TITLE = "A Probabilistic Framework for Semantic Indexing and Retrieval in Video",
        BOOKTITLE = ICME00,
        YEAR = "2000",
        PAGES = "MP9",
        BIBSOURCE = "http://www.visionbib.com/bibliography/applicat823av1.html#TT236457"}

@inproceedings{bb241552,
        AUTHOR = "Naphade, M. R. and Huang, T. S.",
        TITLE = "Inferring Semantic Concepts for Video Indexing and Retrieval",
        BOOKTITLE = ICIP00,
        VOLUME = "III",
        YEAR = "2000",
        PAGES = "766--769",
        BIBSOURCE = "http://www.visionbib.com/bibliography/applicat823av1.html#TT236458"}

@inproceedings{bb241553,
        AUTHOR = "Naphade, M. R. and Kristjansson, T. and Frey, B. J. and Huang, T. S.",
        TITLE = "Probabilistic multimedia objects (multijects): a novel approach to video indexing and retrieval in multimedia systems",
        BOOKTITLE = ICIP98,
        VOLUME = "III",
        YEAR = "1998",
        PAGES = "536--540",
        BIBSOURCE = "http://www.visionbib.com/bibliography/applicat823av1.html#TT236459"}

@article{bb241554,
        AUTHOR = "Xie, X. and Lu, L. and Jia, M. and Li, H. and Seide, F. and Ma, W. Y.",
        TITLE = "Mobile Search With Multimodal Queries",
        JOURNAL = PIEEE,
        VOLUME = "96",
        YEAR = "2008",
        NUMBER = "4",
        MONTH = apr,
        PAGES = "589--601",
        BIBSOURCE = "http://www.visionbib.com/bibliography/applicat823av1.html#TT236460"}

@article{bb241555,
        AUTHOR = "Kiranyaz, S. and Gabbouj, M.",
        TITLE = "Generic content-based audio indexing and retrieval framework",
        JOURNAL = VISP,
        VOLUME = "153",
        YEAR = "2006",
        NUMBER = "3",
        MONTH = jun,
        PAGES = "285--297",
        BIBSOURCE = "http://www.visionbib.com/bibliography/applicat823av1.html#TT236461"}

@article{bb241556,
        AUTHOR = "Monaci, G. and Jost, P. and Vandergheynst, P. and Mailhe, B. and Lesage, S. and Gribonval, R.",
        TITLE = "Learning Multimodal Dictionaries",
        JOURNAL = IP,
        VOLUME = "16",
        YEAR = "2007",
        NUMBER = "9",
        MONTH = sep,
        PAGES = "2272--2283",
        BIBSOURCE = "http://www.visionbib.com/bibliography/applicat823av1.html#TT236462"}

% Patent, not a conference paper: stored as a misc record with the
% US_Patent macro in HOWPUBLISHED instead of BOOKTITLE.
@misc{bb241557,
        AUTHOR = "Zhang, T.",
        TITLE = "Using background audio change detection for segmenting video",
        HOWPUBLISHED = US_Patent,
        YEAR = "2007",
        BIBSOURCE = "http://www.visionbib.com/bibliography/applicat823av1.html#TT236463"}

@article{bb241558,
        AUTHOR = "Kotti, M. and Ververidis, D. and Evangelopoulos, G. and Panagakis, I. and Kotropoulos, C. and Maragos, P. and Pitas, I.",
        TITLE = "Audio-Assisted Movie Dialogue Detection",
        JOURNAL = CirSysVideo,
        VOLUME = "18",
        YEAR = "2008",
        NUMBER = "11",
        MONTH = nov,
        PAGES = "1618--1627",
        BIBSOURCE = "http://www.visionbib.com/bibliography/applicat823av1.html#TT236464"}

@article{bb241559,
        AUTHOR = "Cristani, M. and Bicego, M. and Murino, V.",
        TITLE = "Audio-Visual Event Recognition in Surveillance Video Sequences",
        JOURNAL = MultMed,
        VOLUME = "9",
        YEAR = "2007",
        NUMBER = "2",
        MONTH = feb,
        PAGES = "257--267",
        BIBSOURCE = "http://www.visionbib.com/bibliography/applicat823av1.html#TT236465"}

@inproceedings{bb241560,
  author    = {Cristani, M. and Bicego, M. and Murino, V.},
  title     = {Audio-Visual Foreground Extraction for Event Characterization},
  booktitle = SLAM06,
  year      = 2006,
  pages     = {116},
  bibsource = {http://www.visionbib.com/bibliography/applicat823av1.html#TT236466}
}

@inproceedings{bb241561,
        AUTHOR = "Cristani, M. and Bicego, M. and Murino, V.",
        TITLE = "Audio-Video Integration for Background Modelling",
        BOOKTITLE = ECCV04,
        VOLUME = "II",
        YEAR = "2004",
        PAGES = "202--213",
        BIBSOURCE = "http://www.visionbib.com/bibliography/applicat823av1.html#TT236467"}

@article{bb241562,
        AUTHOR = "Zeng, Z. H. and Tu, J. L. and Liu, M. and Huang, T. S. and Pianfetti, B. and Roth, D. and Levinson, S.",
        TITLE = "Audio-Visual Affect Recognition",
        JOURNAL = MultMed,
        VOLUME = "9",
        YEAR = "2007",
        NUMBER = "2",
        MONTH = feb,
        PAGES = "424--428",
        BIBSOURCE = "http://www.visionbib.com/bibliography/applicat823av1.html#TT236468"}

@article{bb241563,
        AUTHOR = "Zeng, Z. H. and Tu, J. L. and Pianfetti, B. M. and Huang, T. S.",
        TITLE = "Audio-Visual Affective Expression Recognition Through Multistream Fused {HMM}",
        JOURNAL = MultMed,
        VOLUME = "10",
        YEAR = "2008",
        NUMBER = "4",
        MONTH = jun,
        PAGES = "570--577",
        BIBSOURCE = "http://www.visionbib.com/bibliography/applicat823av1.html#TT236469"}

@inproceedings{bb241564,
        AUTHOR = "Zeng, Z. H. and Tu, J. L. and Pianfetti, B. and Liu, M. and Zhang, T. and Zhang, Z. Q. and Huang, T. S. and Levinson, S.",
        TITLE = "Audio-Visual Affect Recognition through Multi-Stream Fused {HMM} for {HCI}",
        BOOKTITLE = CVPR05,
        VOLUME = "II",
        YEAR = "2005",
        PAGES = "967--972",
        BIBSOURCE = "http://www.visionbib.com/bibliography/applicat823av1.html#TT236470"}

@article{bb241565,
        AUTHOR = "Zhang, S. L. and Huang, Q. M. and Jiang, S. and Gao, W. and Tian, Q.",
        TITLE = "Affective Visualization and Retrieval for Music Video",
        JOURNAL = MultMed,
        VOLUME = "12",
        YEAR = "2010",
        NUMBER = "6",
        PAGES = "510--522",
        BIBSOURCE = "http://www.visionbib.com/bibliography/applicat823av1.html#TT236471"}

@article{bb241566,
        AUTHOR = "Zhang, S. L. and Tian, Q. and Hua, G. and Huang, Q. M. and Gao, W.",
        TITLE = "Generating Descriptive Visual Words and Visual Phrases for Large-Scale Image Applications",
        JOURNAL = IP,
        VOLUME = "20",
        YEAR = "2011",
        NUMBER = "9",
        MONTH = sep,
        PAGES = "2664--2677",
        BIBSOURCE = "http://www.visionbib.com/bibliography/applicat823av1.html#TT236472"}

@article{bb241567,
        AUTHOR = "Zhang, S. L. and Tian, Q. and Huang, Q. M. and Gao, W. and Rui, Y.",
        TITLE = "{USB}: Ultrashort Binary Descriptor for Fast Visual Matching and Retrieval",
        JOURNAL = IP,
        VOLUME = "23",
        YEAR = "2014",
        NUMBER = "8",
        MONTH = aug,
        PAGES = "3671--3683",
        BIBSOURCE = "http://www.visionbib.com/bibliography/applicat823av1.html#TT236473"}

@article{bb241568,
        AUTHOR = "Zhang, S. L. and Tian, Q. and Huang, Q. M. and Gao, W. and Rui, Y.",
        TITLE = "Cascade Category-Aware Visual Search",
        JOURNAL = IP,
        VOLUME = "23",
        YEAR = "2014",
        NUMBER = "6",
        MONTH = jun,
        PAGES = "2514--2527",
        BIBSOURCE = "http://www.visionbib.com/bibliography/applicat823av1.html#TT236474"}

@article{bb241569,
        AUTHOR = "Irie, G. and Satou, T. and Kojima, A. and Yamasaki, T. and Aizawa, K.",
        TITLE = "Affective Audio-Visual Words and Latent Topic Driving Model for Realizing Movie Affective Scene Classification",
        JOURNAL = MultMed,
        VOLUME = "12",
        YEAR = "2010",
        NUMBER = "6",
        PAGES = "523--535",
        BIBSOURCE = "http://www.visionbib.com/bibliography/applicat823av1.html#TT236475"}

% NOTE(review): the original record carried the placeholder PAGES = "xx-yy".
% It is dropped here so styles do not print it; add the real page range or
% article number once verified. NUMBER repeats the VOLUME value and may also
% be a placeholder -- confirm against the publisher record.
@article{bb241570,
        AUTHOR = "Ibrahim, Z. A. and Ferrane, I. and Joly, P.",
        TITLE = "A Similarity-Based Approach for Audiovisual Document Classification Using Temporal Relation Analysis",
        JOURNAL = JIVP,
        VOLUME = "2011",
        YEAR = "2011",
        NUMBER = "2011",
        BIBSOURCE = "http://www.visionbib.com/bibliography/applicat823av1.html#TT236476"}

@inproceedings{bb241571,
        AUTHOR = "Philippeau, J. and Pinquier, J. and Joly, P. and Carrive, J.",
        TITLE = "Dynamic organization of audiovisual database using a user-defined similarity measure based on low-level features",
        BOOKTITLE = ICIP08,
        YEAR = "2008",
        PAGES = "33--36",
        BIBSOURCE = "http://www.visionbib.com/bibliography/applicat823av1.html#TT236477"}

@inproceedings{bb241572,
        AUTHOR = "Haidar, S. and Joly, P. and Chebaro, B.",
        TITLE = "Style Similarity Measure for Video Documents Comparison",
        BOOKTITLE = CIVR05,
        YEAR = "2005",
        PAGES = "307--317",
        BIBSOURCE = "http://www.visionbib.com/bibliography/applicat823av1.html#TT236478"}

@article{bb241573,
        AUTHOR = "Huurnink, B. and Snoek, C. G. M. and de Rijke, M. and Smeulders, A. W. M.",
        TITLE = "Content-Based Analysis Improves Audiovisual Archive Retrieval",
        JOURNAL = MultMed,
        VOLUME = "14",
        YEAR = "2012",
        NUMBER = "4",
        PAGES = "1166--1178",
        BIBSOURCE = "http://www.visionbib.com/bibliography/applicat823av1.html#TT236479"}

@inproceedings{bb241574,
        AUTHOR = "Huurnink, B. and Snoek, C. G. M. and de Rijke, M. and Smeulders, A. W. M.",
        TITLE = "Today's and tomorrow's retrieval practice in the audiovisual archive",
        BOOKTITLE = CIVR10,
        YEAR = "2010",
        PAGES = "18--25",
        BIBSOURCE = "http://www.visionbib.com/bibliography/applicat823av1.html#TT236480"}

@inproceedings{bb241575,
        AUTHOR = "Huurnink, B. and de Rijke, M.",
        TITLE = "The value of stories for speech-based video search",
        BOOKTITLE = CIVR07,
        YEAR = "2007",
        PAGES = "266--271",
        BIBSOURCE = "http://www.visionbib.com/bibliography/applicat823av1.html#TT236481"}

@article{bb241576,
        AUTHOR = "Jhuo, I. H. and Ye, G. N. and Gao, S. H. and Liu, D. and Jiang, Y. G. and Lee, D. T. and Chang, S. F.",
        TITLE = "Discovering joint audio-visual codewords for video event detection",
        JOURNAL = MVA,
        VOLUME = "25",
        YEAR = "2014",
        NUMBER = "1",
        MONTH = jan,
        PAGES = "33--47",
        BIBSOURCE = "http://www.visionbib.com/bibliography/applicat823av1.html#TT236482"}

@inproceedings{bb241577,
        AUTHOR = "Ye, G. N. and Jhuo, I. H. and Liu, D. and Jiang, Y. G. and Lee, D. T. and Chang, S. F.",
        TITLE = "Joint audio-visual bi-modal codewords for video event detection",
        BOOKTITLE = ICMR12,
        YEAR = "2012",
        PAGES = "39",
        BIBSOURCE = "http://www.visionbib.com/bibliography/applicat823av1.html#TT236483"}

@article{bb241578,
        AUTHOR = "Feki, I. and Ben Ammar, A. and Alimi, A. M.",
        TITLE = "Automatic environmental sound concepts discovery for video retrieval",
        JOURNAL = MultInfoRetr,
        VOLUME = "5",
        YEAR = "2016",
        NUMBER = "2",
        MONTH = jun,
        PAGES = "105--115",
        BIBSOURCE = "http://www.visionbib.com/bibliography/applicat823av1.html#TT236484"}

@article{bb241579,
        AUTHOR = "Khan, M. U. G. and Gotoh, Y.",
        TITLE = "Generating natural language tags for video information management",
        JOURNAL = MVA,
        VOLUME = "28",
        YEAR = "2017",
        NUMBER = "3-4",
        MONTH = may,
        PAGES = "243--265",
        BIBSOURCE = "http://www.visionbib.com/bibliography/applicat823av1.html#TT236485"}

@inproceedings{bb241580,
        AUTHOR = "Khan, M. U. G. and Zhang, L. and Gotoh, Y.",
        TITLE = "Generating coherent natural language annotations for video streams",
        BOOKTITLE = ICIP12,
        YEAR = "2012",
        PAGES = "2893--2896",
        BIBSOURCE = "http://www.visionbib.com/bibliography/applicat823av1.html#TT236486"}

@inproceedings{bb241581,
        AUTHOR = "Khan, M. U. G. and Zhang, L. and Gotoh, Y.",
        TITLE = "Towards coherent natural language description of video streams",
        BOOKTITLE = SIG11,
        YEAR = "2011",
        PAGES = "664--671",
        BIBSOURCE = "http://www.visionbib.com/bibliography/applicat823av1.html#TT236487"}

@inproceedings{bb241582,
        AUTHOR = "Zhang, L. and Khan, M. U. G. and Gotoh, Y.",
        TITLE = "Video scene classification based on natural language description",
        BOOKTITLE = ARTEMIS11,
        YEAR = "2011",
        PAGES = "942--949",
        BIBSOURCE = "http://www.visionbib.com/bibliography/applicat823av1.html#TT236488"}

@inproceedings{bb241583,
        AUTHOR = "Guo, X. N. and Zhong, W. and Ye, L. and Fang, L. and Heng, Y. and Zhang, Q.",
        TITLE = "Global Affective Video Content Regression Based on Complementary Audio-visual Features",
        BOOKTITLE = MMMod20,
        VOLUME = "II",
        YEAR = "2020",
        PAGES = "540--550",
        BIBSOURCE = "http://www.visionbib.com/bibliography/applicat823av1.html#TT236489"}

@inproceedings{bb241584,
        AUTHOR = "Peri, D. and Sah, S. and Ptucha, R.",
        TITLE = "Show, Translate and Tell",
        BOOKTITLE = ICIP19,
        YEAR = "2019",
        PAGES = "295--299",
        BIBSOURCE = "http://www.visionbib.com/bibliography/applicat823av1.html#TT236490"}

@inproceedings{bb241585,
        AUTHOR = "Chen, K. and Zhang, C. X. and Fang, C. and Wang, Z. W. and Bui, T. and Nevatia, R.",
        TITLE = "Visually Indicated Sound Generation by Perceptually Optimized Classification",
        BOOKTITLE = MultLearnApp18,
        VOLUME = "VI",
        YEAR = "2018",
        PAGES = "560--574",
        BIBSOURCE = "http://www.visionbib.com/bibliography/applicat823av1.html#TT236491"}

@inproceedings{bb241586,
        AUTHOR = "Haurilet, M. L. and Tapaswi, M. and Al Halah, Z. and Stiefelhagen, R.",
        TITLE = "Naming {TV} characters by watching and analyzing dialogs",
        BOOKTITLE = WACV16,
        YEAR = "2016",
        PAGES = "1--9",
        BIBSOURCE = "http://www.visionbib.com/bibliography/applicat823av1.html#TT236492"}

@inproceedings{bb241587,
        AUTHOR = "Numano, S. and Enami, N. and Ariki, Y.",
        TITLE = "Task-Driven Saliency Detection on Music Video",
        BOOKTITLE = CV4AC14,
        YEAR = "2014",
        PAGES = "658--671",
        BIBSOURCE = "http://www.visionbib.com/bibliography/applicat823av1.html#TT236493"}

@inproceedings{bb241588,
        AUTHOR = "Scott, D. and Zhang, Z. X. and Albatal, R. and McGuinness, K. and Acar, E. and Hopfgartner, F. and Gurrin, C. and O'Connor, N. E. and Smeaton, A. F.",
        TITLE = "Audio-Visual Classification Video Browser",
        BOOKTITLE = MMMod14,
        YEAR = "2014",
        PAGES = "II: 398--401",
        BIBSOURCE = "http://www.visionbib.com/bibliography/applicat823av1.html#TT236494"}

@inproceedings{bb241589,
        AUTHOR = "Lin, Y. T. and Tsai, T. H. and Hu, M. C. and Cheng, W. H. and Wu, J. L.",
        TITLE = "Semantic Based Background Music Recommendation for Home Videos",
        BOOKTITLE = MMMod14,
        YEAR = "2014",
        PAGES = "II: 283--290",
        BIBSOURCE = "http://www.visionbib.com/bibliography/applicat823av1.html#TT236495"}

@inproceedings{bb241590,
        AUTHOR = "Shamma, D. A. and Kennedy, L. and Churchill, E. F.",
        TITLE = "Watching and talking: media content as social nexus",
        BOOKTITLE = ICMR12,
        YEAR = "2012",
        PAGES = "12",
        BIBSOURCE = "http://www.visionbib.com/bibliography/applicat823av1.html#TT236496"}

@inproceedings{bb241591,
        AUTHOR = "Nowak, S. and Paduschek, R. and K{\"u}hhirt, U.",
        TITLE = "Photo summary: automated selection of representative photos from a
digital collection",
        BOOKTITLE = ICMR11,
        YEAR = "2011",
        PAGES = "75",
        BIBSOURCE = "http://www.visionbib.com/bibliography/applicat823av1.html#TT236497"}

@inproceedings{bb241592,
        AUTHOR = "Paduschek, R. and Nowak, S. and K{\"u}hhirt, U.",
        TITLE = "Automated detection of errors and quality issues in audio-visual
content",
        BOOKTITLE = ICMR11,
        YEAR = "2011",
        PAGES = "74",
        BIBSOURCE = "http://www.visionbib.com/bibliography/applicat823av1.html#TT236498"}

@inproceedings{bb241593,
        AUTHOR = "Vretos, N. and Nikolaidis, N. and Pitas, I.",
        TITLE = "The use of Audio-Visual Description Profile in {3D} video content
description",
        BOOKTITLE = "3DTV12",
        YEAR = "2012",
        PAGES = "1--4",
        BIBSOURCE = "http://www.visionbib.com/bibliography/applicat823av1.html#TT236499"}

@inproceedings{bb241594,
        AUTHOR = "Ta, A. P. and Ben, M. and Gravier, G.",
        TITLE = "Improving Cluster Selection and Event Modeling in Unsupervised Mining
for Automatic Audiovisual Video Structuring",
        BOOKTITLE = MMMod12,
        YEAR = "2012",
        PAGES = "529--540",
        BIBSOURCE = "http://www.visionbib.com/bibliography/applicat823av1.html#TT236500"}

@inproceedings{bb241595,
        AUTHOR = "M{\"u}hling, M. and Ewerth, R. and Freisleben, B.",
        TITLE = "Improving Cross-Domain Concept Detection via Object-Based Features",
        BOOKTITLE = CAIP15,
        YEAR = "2015",
        PAGES = "II: 359--370",
        BIBSOURCE = "http://www.visionbib.com/bibliography/applicat823av1.html#TT236501"}

@inproceedings{bb241596,
        AUTHOR = "M{\"u}hling, M. and Ewerth, R. and Freisleben, B.",
        TITLE = "On the Spatial Extents of {SIFT} Descriptors for Visual Concept Detection",
        BOOKTITLE = CVS11,
        YEAR = "2011",
        PAGES = "71--80",
        BIBSOURCE = "http://www.visionbib.com/bibliography/applicat823av1.html#TT236502"}

@inproceedings{bb241597,
        AUTHOR = "M{\"u}hling, M. and Ewerth, R. and Zhou, J. and Freisleben, B.",
        TITLE = "Multimodal Video Concept Detection via Bag of Auditory Words and
Multiple Kernel Learning",
        BOOKTITLE = MMMod12,
        YEAR = "2012",
        PAGES = "40--50",
        BIBSOURCE = "http://www.visionbib.com/bibliography/applicat823av1.html#TT236503"}

@inproceedings{bb241598,
        AUTHOR = "Valio, F. B. and Pedrini, H. and Leite, N. J.",
        TITLE = "Fast Rotation-Invariant Video Caption Detection Based on Visual Rhythm",
        BOOKTITLE = CIARP11,
        YEAR = "2011",
        PAGES = "157--164",
        BIBSOURCE = "http://www.visionbib.com/bibliography/applicat823av1.html#TT236504"}

@inproceedings{bb241599,
        AUTHOR = "Gianni, F. and Pinquier, J. and Irisa, E. K.",
        TITLE = "{ACADI} showcase: Automatic character indexing in audiovisual document",
        BOOKTITLE = CIVR07,
        YEAR = "2007",
        PAGES = "109--112",
        BIBSOURCE = "http://www.visionbib.com/bibliography/applicat823av1.html#TT236505"}

Last update: Oct 6, 2025 at 14:07:43