@article{bb162000,
        AUTHOR = "Matos, N. and Pereira, F.",
        TITLE = "Automatic creation and evaluation of {MPEG-7} compliant summary
descriptions for generic audiovisual content",
        JOURNAL = SP:IC,
        VOLUME = "23",
        YEAR = "2008",
        NUMBER = "8",
        MONTH = sep,
        PAGES = "581--598",
        BIBSOURCE = "http://www.visionbib.com/bibliography/applicat823av1.html#TT157463"}

@article{bb162001,
        AUTHOR = "Kiranyaz, S. and Gabbouj, M.",
        TITLE = "Generic content-based audio indexing and retrieval framework",
        JOURNAL = VISP,
        VOLUME = "153",
        YEAR = "2006",
        NUMBER = "3",
        MONTH = jun,
        PAGES = "285--297",
        BIBSOURCE = "http://www.visionbib.com/bibliography/applicat823av1.html#TT157464"}

@article{bb162002,
        AUTHOR = "Monaci, G. and Jost, P. and Vandergheynst, P. and Mailhe, B. and Lesage, S. and Gribonval, R.",
        TITLE = "Learning Multimodal Dictionaries",
        JOURNAL = IP,
        VOLUME = "16",
        YEAR = "2007",
        NUMBER = "9",
        MONTH = sep,
        PAGES = "2272--2283",
        BIBSOURCE = "http://www.visionbib.com/bibliography/applicat823av1.html#TT157465"}

% NOTE(review): a patent is not a proceedings paper; typed as misc so styles do not print "In ...". Patent number is not recorded upstream.
@misc{bb162003,
        AUTHOR = "Zhang, T.",
        TITLE = "Using background audio change detection for segmenting video",
        HOWPUBLISHED = US_Patent,
        YEAR = "2007",
        BIBSOURCE = "http://www.visionbib.com/bibliography/applicat823av1.html#TT157466"}

@article{bb162004,
        AUTHOR = "Kotti, M. and Ververidis, D. and Evangelopoulos, G. and Panagakis, I. and Kotropoulos, C. and Maragos, P. and Pitas, I.",
        TITLE = "Audio-Assisted Movie Dialogue Detection",
        JOURNAL = CirSysVideo,
        VOLUME = "18",
        YEAR = "2008",
        NUMBER = "11",
        MONTH = nov,
        PAGES = "1618--1627",
        BIBSOURCE = "http://www.visionbib.com/bibliography/applicat823av1.html#TT157467"}

@article{bb162005,
        AUTHOR = "Cristani, M. and Bicego, M. and Murino, V.",
        TITLE = "Audio-Visual Event Recognition in Surveillance Video Sequences",
        JOURNAL = MultMed,
        VOLUME = "9",
        YEAR = "2007",
        NUMBER = "2",
        MONTH = feb,
        PAGES = "257--267",
        BIBSOURCE = "http://www.visionbib.com/bibliography/applicat823av1.html#TT157468"}

@inproceedings{bb162006,
  author    = {Cristani, M. and Bicego, M. and Murino, V.},
  title     = {Audio-Visual Foreground Extraction for Event Characterization},
  booktitle = SLAM06,
  year      = {2006},
  pages     = {116},
  bibsource = {http://www.visionbib.com/bibliography/applicat823av1.html#TT157469},
}

@inproceedings{bb162007,
        AUTHOR = "Cristani, M. and Bicego, M. and Murino, V.",
        TITLE = "Audio-Video Integration for Background Modelling",
        BOOKTITLE = ECCV04,
        VOLUME = "II",
        YEAR = "2004",
        PAGES = "202--213",
        BIBSOURCE = "http://www.visionbib.com/bibliography/applicat823av1.html#TT157470"}

@article{bb162008,
        AUTHOR = "Zeng, Z. H. and Tu, J. L. and Liu, M. and Huang, T. S. and Pianfetti, B. and Roth, D. and Levinson, S.",
        TITLE = "Audio-Visual Affect Recognition",
        JOURNAL = MultMed,
        VOLUME = "9",
        YEAR = "2007",
        NUMBER = "2",
        MONTH = feb,
        PAGES = "424--428",
        BIBSOURCE = "http://www.visionbib.com/bibliography/applicat823av1.html#TT157471"}

@article{bb162009,
        AUTHOR = "Zeng, Z. H. and Tu, J. L. and Pianfetti, B. M. and Huang, T. S.",
        TITLE = "Audio-Visual Affective Expression Recognition Through Multistream Fused
{HMM}",
        JOURNAL = MultMed,
        VOLUME = "10",
        YEAR = "2008",
        NUMBER = "4",
        MONTH = jun,
        PAGES = "570--577",
        BIBSOURCE = "http://www.visionbib.com/bibliography/applicat823av1.html#TT157472"}

@inproceedings{bb162010,
        AUTHOR = "Zeng, Z. H. and Tu, J. L. and Pianfetti, B. and Liu, M. and Zhang, T. and Zhang, Z. Q. and Huang, T. S. and Levinson, S.",
        TITLE = "Audio-Visual Affect Recognition through Multi-Stream Fused {HMM} for {HCI}",
        BOOKTITLE = CVPR05,
        VOLUME = "II",
        YEAR = "2005",
        PAGES = "967--972",
        BIBSOURCE = "http://www.visionbib.com/bibliography/applicat823av1.html#TT157473"}

@article{bb162011,
        AUTHOR = "Zhang, S. L. and Huang, Q. M. and Jiang, S. and Gao, W. and Tian, Q.",
        TITLE = "Affective Visualization and Retrieval for Music Video",
        JOURNAL = MultMed,
        VOLUME = "12",
        YEAR = "2010",
        NUMBER = "6",
        PAGES = "510--522",
        BIBSOURCE = "http://www.visionbib.com/bibliography/applicat823av1.html#TT157474"}

@article{bb162012,
        AUTHOR = "Zhang, S. L. and Tian, Q. and Hua, G. and Huang, Q. M. and Gao, W.",
        TITLE = "Generating Descriptive Visual Words and Visual Phrases for Large-Scale
Image Applications",
        JOURNAL = IP,
        VOLUME = "20",
        YEAR = "2011",
        NUMBER = "9",
        MONTH = sep,
        PAGES = "2664--2677",
        BIBSOURCE = "http://www.visionbib.com/bibliography/applicat823av1.html#TT157475"}

@article{bb162013,
        AUTHOR = "Zhang, S. L. and Tian, Q. and Huang, Q. M. and Gao, W. and Rui, Y.",
        TITLE = "{USB}: Ultrashort Binary Descriptor for Fast Visual Matching and
Retrieval",
        JOURNAL = IP,
        VOLUME = "23",
        YEAR = "2014",
        NUMBER = "8",
        MONTH = aug,
        PAGES = "3671--3683",
        BIBSOURCE = "http://www.visionbib.com/bibliography/applicat823av1.html#TT157476"}

@article{bb162014,
        AUTHOR = "Zhang, S. L. and Tian, Q. and Huang, Q. M. and Gao, W. and Rui, Y.",
        TITLE = "Cascade Category-Aware Visual Search",
        JOURNAL = IP,
        VOLUME = "23",
        YEAR = "2014",
        NUMBER = "6",
        MONTH = jun,
        PAGES = "2514--2527",
        BIBSOURCE = "http://www.visionbib.com/bibliography/applicat823av1.html#TT157477"}

@article{bb162015,
        AUTHOR = "Irie, G. and Satou, T. and Kojima, A. and Yamasaki, T. and Aizawa, K.",
        TITLE = "Affective Audio-Visual Words and Latent Topic Driving Model for
Realizing Movie Affective Scene Classification",
        JOURNAL = MultMed,
        VOLUME = "12",
        YEAR = "2010",
        NUMBER = "6",
        PAGES = "523--535",
        BIBSOURCE = "http://www.visionbib.com/bibliography/applicat823av1.html#TT157478"}

% NOTE(review): upstream page range was the placeholder "xx-yy"; field dropped until the real pages or article number are known.
@article{bb162016,
        AUTHOR = "Ibrahim, Z. A. and Ferrane, I. and Joly, P.",
        TITLE = "A Similarity-Based Approach for Audiovisual Document Classification
Using Temporal Relation Analysis",
        JOURNAL = JIVP,
        VOLUME = "2011",
        YEAR = "2011",
        NUMBER = "2011",
        BIBSOURCE = "http://www.visionbib.com/bibliography/applicat823av1.html#TT157479"}

@inproceedings{bb162017,
        AUTHOR = "Philippeau, J. and Pinquier, J. and Joly, P. and Carrive, J.",
        TITLE = "Dynamic organization of audiovisual database using a user-defined
similarity measure based on low-level features",
        BOOKTITLE = ICIP08,
        YEAR = "2008",
        PAGES = "33--36",
        BIBSOURCE = "http://www.visionbib.com/bibliography/applicat823av1.html#TT157480"}

@inproceedings{bb162018,
        AUTHOR = "Haidar, S. and Joly, P. and Chebaro, B.",
        TITLE = "Style Similarity Measure for Video Documents Comparison",
        BOOKTITLE = CIVR05,
        YEAR = "2005",
        PAGES = "307--317",
        BIBSOURCE = "http://www.visionbib.com/bibliography/applicat823av1.html#TT157481"}

@article{bb162019,
        AUTHOR = "Huurnink, B. and Snoek, C. G. M. and de Rijke, M. and Smeulders, A. W. M.",
        TITLE = "Content-Based Analysis Improves Audiovisual Archive Retrieval",
        JOURNAL = MultMed,
        VOLUME = "14",
        YEAR = "2012",
        NUMBER = "4",
        PAGES = "1166--1178",
        BIBSOURCE = "http://www.visionbib.com/bibliography/applicat823av1.html#TT157482"}

@inproceedings{bb162020,
        AUTHOR = "Huurnink, B. and Snoek, C. G. M. and de Rijke, M. and Smeulders, A. W. M.",
        TITLE = "Today's and tomorrow's retrieval practice in the audiovisual archive",
        BOOKTITLE = CIVR10,
        YEAR = "2010",
        PAGES = "18--25",
        BIBSOURCE = "http://www.visionbib.com/bibliography/applicat823av1.html#TT157483"}

@inproceedings{bb162021,
        AUTHOR = "Huurnink, B. and de Rijke, M.",
        TITLE = "The value of stories for speech-based video search",
        BOOKTITLE = CIVR07,
        YEAR = "2007",
        PAGES = "266--271",
        BIBSOURCE = "http://www.visionbib.com/bibliography/applicat823av1.html#TT157484"}

@article{bb162022,
        AUTHOR = "Jhuo, I. H. and Ye, G. N. and Gao, S. H. and Liu, D. and Jiang, Y. G. and Lee, D. T. and Chang, S. F.",
        TITLE = "Discovering joint audio-visual codewords for video event detection",
        JOURNAL = MVA,
        VOLUME = "25",
        YEAR = "2014",
        NUMBER = "1",
        MONTH = jan,
        PAGES = "33--47",
        BIBSOURCE = "http://www.visionbib.com/bibliography/applicat823av1.html#TT157485"}

@inproceedings{bb162023,
        AUTHOR = "Ye, G. N. and Jhuo, I. H. and Liu, D. and Jiang, Y. G. and Lee, D. T. and Chang, S. F.",
        TITLE = "Joint audio-visual bi-modal codewords for video event detection",
        BOOKTITLE = ICMR12,
        YEAR = "2012",
        PAGES = "39",
        BIBSOURCE = "http://www.visionbib.com/bibliography/applicat823av1.html#TT157486"}

@article{bb162024,
        AUTHOR = "Feki, I. and Ben Ammar, A. and Alimi, A. M.",
        TITLE = "Automatic environmental sound concepts discovery for video retrieval",
        JOURNAL = MultInfoRetr,
        VOLUME = "5",
        YEAR = "2016",
        NUMBER = "2",
        MONTH = jun,
        PAGES = "105--115",
        BIBSOURCE = "http://www.visionbib.com/bibliography/applicat823av1.html#TT157487"}

@article{bb162025,
        AUTHOR = "Khan, M. U. G. and Gotoh, Y.",
        TITLE = "Generating natural language tags for video information management",
        JOURNAL = MVA,
        VOLUME = "28",
        YEAR = "2017",
        NUMBER = "3--4",
        MONTH = may,
        PAGES = "243--265",
        BIBSOURCE = "http://www.visionbib.com/bibliography/applicat823av1.html#TT157488"}

@inproceedings{bb162026,
        AUTHOR = "Khan, M. U. G. and Zhang, L. and Gotoh, Y.",
        TITLE = "Generating coherent natural language annotations for video streams",
        BOOKTITLE = ICIP12,
        YEAR = "2012",
        PAGES = "2893--2896",
        BIBSOURCE = "http://www.visionbib.com/bibliography/applicat823av1.html#TT157489"}

@inproceedings{bb162027,
        AUTHOR = "Khan, M. U. G. and Zhang, L. and Gotoh, Y.",
        TITLE = "Towards coherent natural language description of video streams",
        BOOKTITLE = SIG11,
        YEAR = "2011",
        PAGES = "664--671",
        BIBSOURCE = "http://www.visionbib.com/bibliography/applicat823av1.html#TT157490"}

@inproceedings{bb162028,
        AUTHOR = "Zhang, L. and Khan, M. U. G. and Gotoh, Y.",
        TITLE = "Video scene classification based on natural language description",
        BOOKTITLE = ARTEMIS11,
        YEAR = "2011",
        PAGES = "942--949",
        BIBSOURCE = "http://www.visionbib.com/bibliography/applicat823av1.html#TT157491"}

@inproceedings{bb162029,
        AUTHOR = "Peri, D. and Sah, S. and Ptucha, R.",
        TITLE = "Show, Translate and Tell",
        BOOKTITLE = ICIP19,
        YEAR = "2019",
        PAGES = "295--299",
        BIBSOURCE = "http://www.visionbib.com/bibliography/applicat823av1.html#TT157492"}

@inproceedings{bb162030,
        AUTHOR = "Chen, K. and Zhang, C. and Fang, C. and Wang, Z. and Bui, T. and Nevatia, R.",
        TITLE = "Visually Indicated Sound Generation by Perceptually Optimized
Classification",
        BOOKTITLE = MultLearnApp18,
        VOLUME = "VI",
        YEAR = "2018",
        PAGES = "560--574",
        BIBSOURCE = "http://www.visionbib.com/bibliography/applicat823av1.html#TT157493"}

@inproceedings{bb162031,
        AUTHOR = "Haurilet, M. L. and Tapaswi, M. and Al Halah, Z. and Stiefelhagen, R.",
        TITLE = "Naming {TV} characters by watching and analyzing dialogs",
        BOOKTITLE = WACV16,
        YEAR = "2016",
        PAGES = "1--9",
        BIBSOURCE = "http://www.visionbib.com/bibliography/applicat823av1.html#TT157494"}

@inproceedings{bb162032,
        AUTHOR = "Numano, S. and Enami, N. and Ariki, Y.",
        TITLE = "Task-Driven Saliency Detection on Music Video",
        BOOKTITLE = CV4AC14,
        YEAR = "2014",
        PAGES = "658--671",
        BIBSOURCE = "http://www.visionbib.com/bibliography/applicat823av1.html#TT157495"}

@inproceedings{bb162033,
        AUTHOR = "Scott, D. and Zhang, Z. X. and Albatal, R. and McGuinness, K. and Acar, E. and Hopfgartner, F. and Gurrin, C. and O'Connor, N. E. and Smeaton, A. F.",
        TITLE = "Audio-Visual Classification Video Browser",
        BOOKTITLE = MMMod14,
        VOLUME = "II",
        YEAR = "2014",
        PAGES = "398--401",
        BIBSOURCE = "http://www.visionbib.com/bibliography/applicat823av1.html#TT157496"}

@inproceedings{bb162034,
        AUTHOR = "Lin, Y. T. and Tsai, T. H. and Hu, M. C. and Cheng, W. H. and Wu, J. L.",
        TITLE = "Semantic Based Background Music Recommendation for Home Videos",
        BOOKTITLE = MMMod14,
        VOLUME = "II",
        YEAR = "2014",
        PAGES = "283--290",
        BIBSOURCE = "http://www.visionbib.com/bibliography/applicat823av1.html#TT157497"}

@inproceedings{bb162035,
        AUTHOR = "Shamma, D. A. and Kennedy, L. and Churchill, E. F.",
        TITLE = "Watching and talking: media content as social nexus",
        BOOKTITLE = ICMR12,
        YEAR = "2012",
        PAGES = "12",
        BIBSOURCE = "http://www.visionbib.com/bibliography/applicat823av1.html#TT157498"}

@inproceedings{bb162036,
  author    = {Nowak, S. and Paduschek, R. and Kuhhirt, U.},
  title     = {Photo summary: automated selection of representative photos from a
digital collection},
  booktitle = ICMR11,
  year      = {2011},
  pages     = {75},
  bibsource = {http://www.visionbib.com/bibliography/applicat823av1.html#TT157499},
}

@inproceedings{bb162037,
  author    = {Paduschek, R. and Nowak, S. and Kuhhirt, U.},
  title     = {Automated detection of errors and quality issues in audio-visual
content},
  booktitle = ICMR11,
  year      = {2011},
  pages     = {74},
  bibsource = {http://www.visionbib.com/bibliography/applicat823av1.html#TT157500},
}

@inproceedings{bb162038,
        AUTHOR = "Vretos, N. and Nikolaidis, N. and Pitas, I.",
        TITLE = "The use of Audio-Visual Description Profile in {3D} video content
description",
        BOOKTITLE = "3DTV12",
        YEAR = "2012",
        PAGES = "1--4",
        BIBSOURCE = "http://www.visionbib.com/bibliography/applicat823av1.html#TT157501"}

@inproceedings{bb162039,
        AUTHOR = "Ta, A. P. and Ben, M. and Gravier, G.",
        TITLE = "Improving Cluster Selection and Event Modeling in Unsupervised Mining
for Automatic Audiovisual Video Structuring",
        BOOKTITLE = MMMod12,
        YEAR = "2012",
        PAGES = "529--540",
        BIBSOURCE = "http://www.visionbib.com/bibliography/applicat823av1.html#TT157502"}

@inproceedings{bb162040,
        AUTHOR = "Muhling, M. and Ewerth, R. and Freisleben, B.",
        TITLE = "Improving Cross-Domain Concept Detection via Object-Based Features",
        BOOKTITLE = CAIP15,
        VOLUME = "II",
        YEAR = "2015",
        PAGES = "359--370",
        BIBSOURCE = "http://www.visionbib.com/bibliography/applicat823av1.html#TT157503"}

@inproceedings{bb162041,
        AUTHOR = "Muhling, M. and Ewerth, R. and Freisleben, B.",
        TITLE = "On the Spatial Extents of {SIFT} Descriptors for Visual Concept Detection",
        BOOKTITLE = CVS11,
        YEAR = "2011",
        PAGES = "71--80",
        BIBSOURCE = "http://www.visionbib.com/bibliography/applicat823av1.html#TT157504"}

@inproceedings{bb162042,
        AUTHOR = "Muhling, M. and Ewerth, R. and Zhou, J. and Freisleben, B.",
        TITLE = "Multimodal Video Concept Detection via Bag of Auditory Words and
Multiple Kernel Learning",
        BOOKTITLE = MMMod12,
        YEAR = "2012",
        PAGES = "40--50",
        BIBSOURCE = "http://www.visionbib.com/bibliography/applicat823av1.html#TT157505"}

@inproceedings{bb162043,
        AUTHOR = "Valio, F. B. and Pedrini, H. and Leite, N. J.",
        TITLE = "Fast Rotation-Invariant Video Caption Detection Based on Visual Rhythm",
        BOOKTITLE = CIARP11,
        YEAR = "2011",
        PAGES = "157--164",
        BIBSOURCE = "http://www.visionbib.com/bibliography/applicat823av1.html#TT157506"}

@inproceedings{bb162044,
        AUTHOR = "Gianni, F. and Pinquier, J. and Irisa, E. K.",
        TITLE = "{ACADI} showcase: Automatic character indexing in audiovisual document",
        BOOKTITLE = CIVR07,
        YEAR = "2007",
        PAGES = "109--112",
        BIBSOURCE = "http://www.visionbib.com/bibliography/applicat823av1.html#TT157507"}

@inproceedings{bb162045,
        AUTHOR = "Putthividhya, D. and Attias, H. T. and Nagarajan, S. S.",
        TITLE = "Topic regression multi-modal Latent {Dirichlet} Allocation for image
annotation",
        BOOKTITLE = CVPR10,
        YEAR = "2010",
        PAGES = "3408--3415",
        BIBSOURCE = "http://www.visionbib.com/bibliography/applicat823av1.html#TT157508"}

@inproceedings{bb162046,
        AUTHOR = "Jung, K. H. and Choi, S. H. and Kim, H. S. and Hur, N. H. and Kim, J. K.",
        TITLE = "Caption insertion method for {3D} broadcasting service",
        BOOKTITLE = "3DTV10",
        YEAR = "2010",
        PAGES = "1--4",
        BIBSOURCE = "http://www.visionbib.com/bibliography/applicat823av1.html#TT157509"}

% NOTE(review): upstream page range was the placeholder "xx-yy"; field dropped until the real pages are known.
@inproceedings{bb162047,
        AUTHOR = "Pramod, S. K. and Jawahar, C. V. and Zisserman, A.",
        TITLE = "Subtitle-free Movie to Script Alignment",
        BOOKTITLE = BMVC09,
        YEAR = "2009",
        BIBSOURCE = "http://www.visionbib.com/bibliography/applicat823av1.html#TT157510"}

@inproceedings{bb162048,
        AUTHOR = "Zeng, Z. and Liang, W. and Li, H. P. and Zhang, S. W.",
        TITLE = "A Novel Video Classification Method Based on Hybrid
Generative/Discriminative Models",
        BOOKTITLE = SSPR08,
        YEAR = "2008",
        PAGES = "705--713",
        BIBSOURCE = "http://www.visionbib.com/bibliography/applicat823av1.html#TT157511"}

@inproceedings{bb162049,
        AUTHOR = "Zhu, Y. Y. and Ming, Z. and Huang, Q. A.",
        TITLE = "{SVM}-Based Audio Classification for Content-Based Multimedia Retrieval",
        BOOKTITLE = MCAM07,
        YEAR = "2007",
        PAGES = "474--482",
        BIBSOURCE = "http://www.visionbib.com/bibliography/applicat823av1.html#TT157512"}

@inproceedings{bb162050,
        AUTHOR = "Goldmann, L. and Samour, A. and Karaman, M. and Sikora, T.",
        TITLE = "Extracting High Level Semantics by Means of Speech, Audio, and Image
Primitives in Surveillance Applications",
        BOOKTITLE = ICIP06,
        YEAR = "2006",
        PAGES = "2397--2400",
        BIBSOURCE = "http://www.visionbib.com/bibliography/applicat823av1.html#TT157513"}

% NOTE(review): upstream page range was the placeholder "xx-yy"; field dropped until the real pages are known.
@inproceedings{bb162051,
        AUTHOR = "Luo, J. and Caputo, B. and Zweig, A. and Bach, J. H. and Anemuller, J.",
        TITLE = "Object Category Detection Using Audio-Visual Cues",
        BOOKTITLE = CVS08,
        YEAR = "2008",
        BIBSOURCE = "http://www.visionbib.com/bibliography/applicat823av1.html#TT157514"}

@inproceedings{bb162052,
        AUTHOR = "Caputo, B. and Wallraven, C. and Nilsback, M. E.",
        TITLE = "Object categorization via local kernels",
        BOOKTITLE = ICPR04,
        VOLUME = "II",
        YEAR = "2004",
        PAGES = "132--135",
        BIBSOURCE = "http://www.visionbib.com/bibliography/applicat823av1.html#TT157515"}

@inproceedings{bb162053,
        AUTHOR = "Divakaran, A. and Peker, K. A. and Radhakrishnan, R. and Xiong, Z. Y. and Cabasson, R.",
        TITLE = "Video Summarization using {MPEG-7} Motion Activity and Audio Descriptors",
        BOOKTITLE = VideoMining03,
        YEAR = "2003",
        PAGES = "Chapter 4",
        BIBSOURCE = "http://www.visionbib.com/bibliography/applicat823av1.html#TT157516"}

@inproceedings{bb162054,
        AUTHOR = "Schauer, C. and Gross, H. M.",
        TITLE = "A Computational Model of Early Auditory-Visual Integration",
        BOOKTITLE = DAGM03,
        YEAR = "2003",
        PAGES = "362--369",
        BIBSOURCE = "http://www.visionbib.com/bibliography/applicat823av1.html#TT157517"}

@inproceedings{bb162055,
        AUTHOR = "Fu, T. Y. and Liu, X. X. and Liang, L. H. and Pi, X. B. and Nefian, A. V.",
        TITLE = "Audio-visual speaker identification using coupled hidden {Markov}
models",
        BOOKTITLE = ICIP03,
        VOLUME = "III",
        YEAR = "2003",
        PAGES = "29--32",
        BIBSOURCE = "http://www.visionbib.com/bibliography/applicat823av1.html#TT157518"}

@inproceedings{bb162056,
        AUTHOR = "Yemez, Y. and Kanak, A. and Erzin, E. and Tekalp, A. M.",
        TITLE = "Multimodal speaker identification with audio-video processing",
        BOOKTITLE = ICIP03,
        VOLUME = "III",
        YEAR = "2003",
        PAGES = "5--8",
        BIBSOURCE = "http://www.visionbib.com/bibliography/applicat823av1.html#TT157519"}

@inproceedings{bb162057,
        AUTHOR = "Sugano, M. and Isaksson, R. and Nakajima, Y. and Yanagihara, H.",
        TITLE = "Shot genre classification using compressed audio-visual features",
        BOOKTITLE = ICIP03,
        VOLUME = "II",
        YEAR = "2003",
        PAGES = "17--20",
        BIBSOURCE = "http://www.visionbib.com/bibliography/applicat823av1.html#TT157520"}

@inproceedings{bb162058,
        AUTHOR = "Moncrieff, S. and Venkatesh, S. and Dorai, C.",
        TITLE = "Horror film genre typing and scene labeling via audio analysis",
        BOOKTITLE = "ICME03",
        VOLUME = "I",
        YEAR = "2003",
        PAGES = "193--196",
        BIBSOURCE = "http://www.visionbib.com/bibliography/applicat823av1.html#TT157521"}

@inproceedings{bb162059,
        AUTHOR = "Moncrieff, S. and Dorai, C. and Venkatesh, S.",
        TITLE = "Affect computing in film through sound energy dynamics",
        BOOKTITLE = "ACMMM01",
        YEAR = "2001",
        PAGES = "525--527",
        BIBSOURCE = "http://www.visionbib.com/bibliography/applicat823av1.html#TT157522"}

@inproceedings{bb162060,
        AUTHOR = "Wachsmuth, S. and Sagerer, G.",
        TITLE = "Integrated analysis of speech and images as a probabilistic decoding
process",
        BOOKTITLE = ICPR02,
        VOLUME = "II",
        YEAR = "2002",
        PAGES = "588--592",
        BIBSOURCE = "http://www.visionbib.com/bibliography/applicat823av1.html#TT157523"}

@inproceedings{bb162061,
        AUTHOR = "Kulesh, V. and Petrushin, V. A. and Sethi, I. K.",
        TITLE = "Video clip recognition using joint audio-visual processing model",
        BOOKTITLE = ICPR02,
        VOLUME = "I",
        YEAR = "2002",
        PAGES = "500--503",
        BIBSOURCE = "http://www.visionbib.com/bibliography/applicat823av1.html#TT157524"}

@inproceedings{bb162062,
        AUTHOR = "Miyamori, H.",
        TITLE = "Improving accuracy in behaviour identification for content-based
retrieval by using audio and video information",
        BOOKTITLE = ICPR02,
        VOLUME = "II",
        YEAR = "2002",
        PAGES = "826--830",
        BIBSOURCE = "http://www.visionbib.com/bibliography/applicat823av1.html#TT157525"}

@inproceedings{bb162063,
        AUTHOR = "de Santo, M. and Percannella, G. and Sansone, C. and Vento, M.",
        TITLE = "Classifying audio of movies by a multi-expert system",
        BOOKTITLE = CIAP01,
        YEAR = "2001",
        PAGES = "386--391",
        BIBSOURCE = "http://www.visionbib.com/bibliography/applicat823av1.html#TT157526"}

@inproceedings{bb162064,
        AUTHOR = "Albiol, A. and Torres, L. and Delp, E. J.",
        TITLE = "Video preprocessing for audiovisual indexing",
        BOOKTITLE = Southwest02,
        YEAR = "2002",
        PAGES = "57--61",
        BIBSOURCE = "http://www.visionbib.com/bibliography/applicat823av1.html#TT157527"}

@inproceedings{bb162065,
        AUTHOR = "Bakker, E. M. and Lew, M. S.",
        TITLE = "Semantic Video Retrieval Using Audio Analysis",
        BOOKTITLE = CIVR02,
        YEAR = "2002",
        PAGES = "271--277",
        BIBSOURCE = "http://www.visionbib.com/bibliography/applicat823av1.html#TT157528"}

@inproceedings{bb162066,
        AUTHOR = "Kim, K. and Choi, J. and Kim, N. and Kim, P. K.",
        TITLE = "Extracting Semantic Information from Basketball Video Based on
Audio-Visual Features",
        BOOKTITLE = CIVR02,
        YEAR = "2002",
        PAGES = "278--288",
        BIBSOURCE = "http://www.visionbib.com/bibliography/applicat823av1.html#TT157529"}

@inproceedings{bb162067,
        AUTHOR = "Fisher, J. W. and Darrell, T. J.",
        TITLE = "Probabilistic Models and Informative Subspaces for Audiovisual
Correspondence",
        BOOKTITLE = ECCV02,
        VOLUME = "III",
        YEAR = "2002",
        PAGES = "592+",
        BIBSOURCE = "http://www.visionbib.com/bibliography/applicat823av1.html#TT157530"}

@inproceedings{bb162068,
        AUTHOR = "Chu, S. M. and Huang, T. S.",
        TITLE = "Audio-Visual Speech Fusion Using Coupled Hidden {Markov} Models",
        BOOKTITLE = MSCSAS07,
        YEAR = "2007",
        PAGES = "1--2",
        BIBSOURCE = "http://www.visionbib.com/bibliography/applicat823av1.html#TT157531"}

@inproceedings{bb162069,
        AUTHOR = "Naphade, M. R. and Garg, A. and Huang, T. S.",
        TITLE = "Audio-Visual Event Detection using Duration Dependent Input Output
{Markov} Models",
        BOOKTITLE = CBAIVL01,
        YEAR = "2001",
        PAGES = "30",
        BIBSOURCE = "http://www.visionbib.com/bibliography/applicat823av1.html#TT157532"}

@inproceedings{bb162070,
        AUTHOR = "Alatan, A. A.",
        TITLE = "Automatic Multi-modal Dialogue Scene Indexing",
        BOOKTITLE = ICIP01,
        VOLUME = "III",
        YEAR = "2001",
        PAGES = "374--377",
        BIBSOURCE = "http://www.visionbib.com/bibliography/applicat823av1.html#TT157533"}

@inproceedings{bb162071,
        AUTHOR = "Smith, M. A. and Kanade, T.",
        TITLE = "Video Skimming and Characterization through the Combination of
Image and Language Understanding Techniques",
        BOOKTITLE = CVPR97,
        YEAR = "1997",
        PAGES = "775--781",
        BIBSOURCE = "http://www.visionbib.com/bibliography/applicat823av1.html#TT157534"}

@inproceedings{bb162072,
        AUTHOR = "Kanade, T. and Smith, M. A.",
        TITLE = "Video Skimming and Characterization through the Combination of
Image and Language Understanding Techniques",
        BOOKTITLE = DARPA97,
        YEAR = "1997",
        PAGES = "357--366",
        BIBSOURCE = "http://www.visionbib.com/bibliography/applicat823av1.html#TT157534"}

@inproceedings{bb162073,
        AUTHOR = "Kanade, T. and Smith, M. A.",
        TITLE = "Video Skimming and Characterization through the Combination of
Image and Language Understanding Techniques",
        BOOKTITLE = CMU-CS-TR,
        YEAR = "1997",
        BIBSOURCE = "http://www.visionbib.com/bibliography/applicat823av1.html#TT157534"}

@inproceedings{bb162074,
        AUTHOR = "Smith, M. A. and Kanade, T.",
        TITLE = "Video Skimming for Quick Browsing based on Audio and
Image Characterization",
        BOOKTITLE = CMU-CS-TR,
        YEAR = "1995",
        BIBSOURCE = "http://www.visionbib.com/bibliography/applicat823av1.html#TT157535"}

@inproceedings{bb162075,
        AUTHOR = "Sundaram, H. and Chang, S. F.",
        TITLE = "Video Scene Segmentation Using Video and Audio Features",
        BOOKTITLE = ICME00,
        YEAR = "2000",
        PAGES = "TP10",
        BIBSOURCE = "http://www.visionbib.com/bibliography/applicat823av1.html#TT157536"}

@inproceedings{bb162076,
        AUTHOR = "Smith, J. R. and Li, C. S.",
        TITLE = "Adaptive Synthesis in Progressive Retrieval of Audio-Visual Data",
        BOOKTITLE = ICME00,
        YEAR = "2000",
        PAGES = "MP5",
        BIBSOURCE = "http://www.visionbib.com/bibliography/applicat823av1.html#TT157537"}

@inproceedings{bb162077,
        AUTHOR = "Toklu, C. and Liou, S. P.",
        TITLE = "Image and Audio Sequence Visualization and Interaction Mechanisms for
Structured Video Browsing and Editing",
        BOOKTITLE = ICIP00,
        VOLUME = "II",
        YEAR = "2000",
        PAGES = "263--266",
        BIBSOURCE = "http://www.visionbib.com/bibliography/applicat823av1.html#TT157538"}

@inproceedings{bb162078,
        AUTHOR = "Jiang, H. and Lin, T. and Zhang, H. J.",
        TITLE = "Video Segmentation with the Assistance of Audio Content Analysis",
        BOOKTITLE = ICME00,
        YEAR = "2000",
        PAGES = "WP5",
        BIBSOURCE = "http://www.visionbib.com/bibliography/applicat823av1.html#TT157539"}

@inproceedings{bb162079,
        AUTHOR = "Sugano, M. and Nakajima, Y. and Yanagihara, H.",
        TITLE = "Automated {MPEG} audio-video summarization and description",
        BOOKTITLE = ICIP02,
        VOLUME = "I",
        YEAR = "2002",
        PAGES = "956--959",
        BIBSOURCE = "http://www.visionbib.com/bibliography/applicat823av1.html#TT157540"}

@inproceedings{bb162080,
        AUTHOR = "Pandit, M. and Kittler, J. V. and Li, Y. and Chilton, E.",
        TITLE = "A Comparative Study of Different Segmentation Approaches for Audio
Track Indexing",
        BOOKTITLE = ICPR00,
        VOLUME = "II",
        YEAR = "2000",
        PAGES = "467--470",
        BIBSOURCE = "http://www.visionbib.com/bibliography/applicat823av1.html#TT157541"}

@inproceedings{bb162081,
        AUTHOR = "Huang, J. C. and Liu, Z. and Yao, W.",
        TITLE = "Integration of audio and visual information for content-based video
segmentation",
        BOOKTITLE = ICIP98,
        VOLUME = "III",
        YEAR = "1998",
        PAGES = "526--529",
        BIBSOURCE = "http://www.visionbib.com/bibliography/applicat823av1.html#TT157542"}

@inproceedings{bb162082,
        AUTHOR = "Saraceno, C. and Leonardi, R.",
        TITLE = "Identification of story units in audio-visual sequences by joint audio
and video processing",
        BOOKTITLE = ICIP98,
        VOLUME = "I",
        YEAR = "1998",
        PAGES = "363--367",
        BIBSOURCE = "http://www.visionbib.com/bibliography/applicat823av1.html#TT157543"}

@article{bb162083,
        AUTHOR = "Ahanger, G. and Little, T. D. C.",
        TITLE = "A Survey of Technologies for Parsing and Indexing Digital Video",
        JOURNAL = JVCIR,
        VOLUME = "7",
        YEAR = "1996",
        NUMBER = "1",
        MONTH = mar,
        PAGES = "28--43",
        BIBSOURCE = "http://www.visionbib.com/bibliography/applicat823.html#TT157544"}

@article{bb162084,
        AUTHOR = "Boreczky, J. S. and Rowe, L. A.",
        TITLE = "Comparison of Video Shot Boundary Detection Techniques",
        JOURNAL = JEI,
        VOLUME = "5",
        YEAR = "1996",
        NUMBER = "2",
        MONTH = apr,
        PAGES = "122--128",
        BIBSOURCE = "http://www.visionbib.com/bibliography/applicat823.html#TT157545"}

@article{bb162085,
        AUTHOR = "Rowe, L. A. and Boreczky, J. S.",
        TITLE = "Comparison of Video Shot Boundary Detection Techniques",
        JOURNAL = SPIE,
        VOLUME = "2670",
        YEAR = "1996",
        PAGES = "170--179",
        BIBSOURCE = "http://www.visionbib.com/bibliography/applicat823.html#TT157545"}

% NOTE(review): a patent is not a proceedings paper; typed as misc so styles do not print "In ...". Patent number is not recorded upstream.
@misc{bb162086,
        AUTHOR = "Wilcox, L. D. and Boreczky, J. S.",
        TITLE = "Automatic video segmentation using hidden {Markov} model",
        HOWPUBLISHED = US_Patent,
        YEAR = "2000",
        BIBSOURCE = "http://www.visionbib.com/bibliography/applicat823.html#TT157546"}

@article{bb162087,
        AUTHOR = "Gargi, U. and Kasturi, R. and Strayer, S. H.",
        TITLE = "Performance Characterization of Video-Shot-Change Detection Methods",
        JOURNAL = CirSysVideo,
        VOLUME = "10",
        YEAR = "2000",
        NUMBER = "1",
        MONTH = feb,
        PAGES = "1",
        BIBSOURCE = "http://www.visionbib.com/bibliography/applicat823.html#TT157547"}

% Jeannin (2000), SP:IC 16(1-2): motion descriptors for video representation.
@article{bb162088,
  author    = {Jeannin, S.},
  title     = {Motion descriptors for content-based video representation},
  journal   = SP:IC,
  volume    = {16},
  number    = {1-2},
  pages     = {59-85},
  month     = {September},
  year      = {2000},
  bibsource = {http://www.visionbib.com/bibliography/applicat823.html#TT157548}
}

% Brunelli, Mich and Modena (1999), JVCIR 10(2): survey of automatic video
% indexing. Initials are space-separated so each one is a separate name token;
% glued initials collapse to a single initial under abbreviating styles.
@article{bb162089,
        AUTHOR = "Brunelli, R. and Mich, O. and Modena, C. M.",
        TITLE = "A Survey on the Automatic Indexing of Video Data",
        JOURNAL = JVCIR,
        VOLUME = "10",
        YEAR = "1999",
        NUMBER = "2",
        MONTH = "June",
        PAGES = "78-112",
        BIBSOURCE = "http://www.visionbib.com/bibliography/applicat823.html#TT157549"}

% Koprinska and Carrato (2001), SP:IC 16(5): temporal video segmentation survey.
@article{bb162090,
  author    = {Koprinska, I. and Carrato, S.},
  title     = {Temporal video segmentation: A survey},
  journal   = SP:IC,
  volume    = {16},
  number    = {5},
  pages     = {477-500},
  month     = {January},
  year      = {2001},
  bibsource = {http://www.visionbib.com/bibliography/applicat823.html#TT157550}
}

% Lefevre, Holler and Vincent (2003), RealTimeImg 9(1): review of real-time
% segmentation of uncompressed video.
@article{bb162091,
  author    = {Lefevre, S. and Holler, J. and Vincent, N.},
  title     = {A review of real-time segmentation of uncompressed video sequences for content-based search and retrieval},
  journal   = RealTimeImg,
  volume    = {9},
  number    = {1},
  pages     = {73-98},
  month     = {February},
  year      = {2003},
  bibsource = {http://www.visionbib.com/bibliography/applicat823.html#TT157551}
}

% Yahiaoui, Merialdo and Huet (2003), JASP 2003(1): comparison of
% multiepisode video summarisation algorithms.
@article{bb162092,
  author    = {Yahiaoui, I. and Merialdo, B. and Huet, B.},
  title     = {Comparison of Multiepisode Video Summarisation Algorithms},
  journal   = JASP,
  volume    = {2003},
  number    = {1},
  pages     = {48},
  month     = {January},
  year      = {2003},
  bibsource = {http://www.visionbib.com/bibliography/applicat823.html#TT157552}
}

% Suter, Comaniciu and Kanatani (2004), IVC 22(2): special-issue introduction
% on statistical methods in video processing.
@article{bb162093,
  author    = {Suter, D. and Comaniciu, D. and Kanatani, K.},
  title     = {Special issue on statistical methods in video processing},
  journal   = IVC,
  volume    = {22},
  number    = {2},
  pages     = {83-84},
  month     = {February},
  year      = {2004},
  bibsource = {http://www.visionbib.com/bibliography/applicat823.html#TT157553}
}

% Friedland and Rojas (2008), JIVP 2008: video segmentation for lecture webcasts.
% NOTE(review): pages "xx-yy" looks like a placeholder; confirm the real value.
@article{bb162094,
  author    = {Friedland, G. and Rojas, R.},
  title     = {Anthropocentric Video Segmentation for Lecture Webcasts},
  journal   = JIVP,
  volume    = {2008},
  number    = {2008},
  pages     = {xx-yy},
  year      = {2008},
  bibsource = {http://www.visionbib.com/bibliography/applicat823.html#TT157554}
}

% Money and Agius (2008), JVCIR 19(2): video summarisation framework and survey.
% Initials are space-separated so each one is a separate name token; glued
% initials collapse to a single initial under abbreviating styles.
@article{bb162095,
        AUTHOR = "Money, A. G. and Agius, H.",
        TITLE = "Video summarisation:
A conceptual framework and survey of the state of the art",
        JOURNAL = JVCIR,
        VOLUME = "19",
        YEAR = "2008",
        NUMBER = "2",
        MONTH = "February",
        PAGES = "121-143",
        BIBSOURCE = "http://www.visionbib.com/bibliography/applicat823.html#TT157555"}

% Ciocca (2010), ELCVIA 9(1): multi-feature cut detection for video segmentation.
% NUMBER holds the bare issue number; the bibliography style supplies any
% "No." label, so it must not be hard-coded in the field.
% NOTE(review): PAGES "xx-yy" looks like a placeholder; confirm the real value.
@article{bb162096,
        AUTHOR = "Ciocca, G.",
        TITLE = "A Robust Multi-Feature Cut Detection Algorithm for Video Segmentation",
        JOURNAL = ELCVIA,
        VOLUME = "9",
        YEAR = "2010",
        NUMBER = "1",
        PAGES = "xx-yy",
        BIBSOURCE = "http://www.visionbib.com/bibliography/applicat823.html#TT157556"}

% Wu, Han, Liu and Shao (2012), MultInfoRetr 1(1): survey of heterogeneous
% feature selection with structural sparsity.
% Initials are space-separated so each one is a separate name token; glued
% initials collapse to a single initial under abbreviating styles.
@article{bb162097,
        AUTHOR = "Wu, F. and Han, Y. H. and Liu, X. and Shao, J.",
        TITLE = "The heterogeneous feature selection with structural sparsity for
multimedia annotation and hashing: a survey",
        JOURNAL = MultInfoRetr,
        VOLUME = "1",
        YEAR = "2012",
        NUMBER = "1",
        MONTH = "April",
        PAGES = "3-15",
        BIBSOURCE = "http://www.visionbib.com/bibliography/applicat823.html#TT157557"}

% Santos, Borges and Gomes (2007), CIARP07: evaluation of video cut detectors.
% Initials are space-separated so each one is a separate name token; glued
% initials collapse to a single initial under abbreviating styles.
@inproceedings{bb162098,
        AUTHOR = "Santos, S. M. and Borges, D. L. and Gomes, H. M.",
        TITLE = "An Evaluation of Video Cut Detection Techniques",
        BOOKTITLE = CIARP07,
        YEAR = "2007",
        PAGES = "311-320",
        BIBSOURCE = "http://www.visionbib.com/bibliography/applicat823.html#TT157558"}

% d'Anna, Marrazzo, Percannella, Sansone and Vento (2006), SSPR06:
% multi-stage anchor shot detection.
@inproceedings{bb162099,
  author    = {d'Anna, L. and Marrazzo, G. and Percannella, G. and Sansone, C. and Vento, M.},
  title     = {A Multi-stage Approach for Anchor Shot Detection},
  booktitle = SSPR06,
  pages     = {773-782},
  year      = {2006},
  bibsource = {http://www.visionbib.com/bibliography/applicat823.html#TT157559}
}

Last update: Dec 23, 2019 at 15:47:08