% ---------------------------------------------------------------------------
% Entries bb282300 .. bb282399.
%
% Conventions used in this section:
%   * Every entry carries a BIBSOURCE field holding the visionbib.com anchor
%     it was taken from. BIBSOURCE is not a standard field; standard styles
%     are expected to ignore it.
%   * Bare (unquoted) BOOKTITLE values such as VCIP20 or CVPR20 are string
%     macro references. Their definitions are not in this section --
%     presumably they live elsewhere in the file; verify before moving
%     entries to another database.
%   * A roman-numeral prefix in PAGES (e.g. "XII: 52--69") presumably names
%     the part/volume of a multi-part proceedings -- TODO confirm.
%   * Page ranges use the double hyphen; words in titles that must keep
%     their capitalisation (acronyms, proper nouns) are wrapped in braces.
%   * Entries whose page numbers are unknown simply omit PAGES.
% ---------------------------------------------------------------------------

@inproceedings{bb282300,
  AUTHOR    = "Chao, F.Y. and Ozcinar, C. and Zhang, L. and Hamidouche, W. and Deforges, O. and Smolic, A.",
  TITLE     = "Towards Audio-Visual Saliency Prediction for Omnidirectional Video with Spatial Audio",
  BOOKTITLE = VCIP20,
  YEAR      = "2020",
  PAGES     = "355--358",
  BIBSOURCE = "http://www.visionbib.com/bibliography/people916.html#TT276997"
}

@inproceedings{bb282301,
  AUTHOR    = "Zhou, H. and Xu, X.D. and Lin, D. and Wang, X.G. and Liu, Z.W.",
  TITLE     = "Sep-stereo: Visually Guided Stereophonic Audio Generation by Associating Source Separation",
  BOOKTITLE = ECCV20,
  YEAR      = "2020",
  PAGES     = "XII: 52--69",
  BIBSOURCE = "http://www.visionbib.com/bibliography/people916.html#TT276998"
}

@inproceedings{bb282302,
  AUTHOR    = "Tian, Y.P. and Li, D.Z. and Xu, C.L.",
  TITLE     = "Unified Multisensory Perception: Weakly-supervised Audio-visual Video Parsing",
  BOOKTITLE = ECCV20,
  YEAR      = "2020",
  PAGES     = "III: 436--454",
  BIBSOURCE = "http://www.visionbib.com/bibliography/people916.html#TT276999"
}

@inproceedings{bb282303,
  AUTHOR    = "Salman, A.N. and Busso, C.",
  TITLE     = "Dynamic versus Static Facial Expressions in the Presence of Speech",
  BOOKTITLE = FG20,
  YEAR      = "2020",
  PAGES     = "436--443",
  BIBSOURCE = "http://www.visionbib.com/bibliography/people916.html#TT277000"
}

@inproceedings{bb282304,
  AUTHOR    = "Salman, A.N. and Busso, C.",
  TITLE     = "Style Extractor For Facial Expression Recognition in the Presence of Speech",
  BOOKTITLE = ICIP20,
  YEAR      = "2020",
  PAGES     = "1806--1810",
  BIBSOURCE = "http://www.visionbib.com/bibliography/people916.html#TT277001"
}

@inproceedings{bb282305,
  AUTHOR    = "Liu, Y.F. and Qiao, M.L. and Xu, M. and Li, B. and Hu, W.M. and Borji, A.",
  TITLE     = "Learning to Predict Salient Faces: A Novel Visual-Audio Saliency Model",
  BOOKTITLE = ECCV20,
  YEAR      = "2020",
  PAGES     = "XX: 413--429",
  BIBSOURCE = "http://www.visionbib.com/bibliography/people916.html#TT277002"
}

@inproceedings{bb282306,
  AUTHOR    = "Yang, K. and Russell, B. and Salamon, J.",
  TITLE     = "Telling Left From Right: Learning Spatial Correspondence of Sight and Sound",
  BOOKTITLE = CVPR20,
  YEAR      = "2020",
  PAGES     = "9929--9938",
  BIBSOURCE = "http://www.visionbib.com/bibliography/people916.html#TT277003"
}

@inproceedings{bb282307,
  AUTHOR    = "Gao, R. and Oh, T. and Grauman, K. and Torresani, L.",
  TITLE     = "Listen to Look: Action Recognition by Previewing Audio",
  BOOKTITLE = CVPR20,
  YEAR      = "2020",
  PAGES     = "10454--10464",
  BIBSOURCE = "http://www.visionbib.com/bibliography/people916.html#TT277004"
}

@inproceedings{bb282308,
  AUTHOR    = "Zhang, X. and Wu, X. and Zhai, X. and Ben, X. and Tu, C.",
  TITLE     = "{DAVD-Net}: Deep Audio-Aided Video Decompression of Talking Heads",
  BOOKTITLE = CVPR20,
  YEAR      = "2020",
  PAGES     = "12332--12341",
  BIBSOURCE = "http://www.visionbib.com/bibliography/people916.html#TT277005"
}

@inproceedings{bb282309,
  AUTHOR    = "Vaezi Joze, H.R. and Shaban, A. and Iuzzolino, M.L. and Koishida, K.",
  TITLE     = "{MMTM}: Multimodal Transfer Module for {CNN} Fusion",
  BOOKTITLE = CVPR20,
  YEAR      = "2020",
  PAGES     = "13286--13296",
  BIBSOURCE = "http://www.visionbib.com/bibliography/people916.html#TT277006"
}

@inproceedings{bb282310,
  AUTHOR    = "Alcazar, J.L. and Caba, F. and Mai, L. and Perazzi, F. and Lee, J. and Arbelaez, P. and Ghanem, B.",
  TITLE     = "Active Speakers in Context",
  BOOKTITLE = CVPR20,
  YEAR      = "2020",
  PAGES     = "12462--12471",
  BIBSOURCE = "http://www.visionbib.com/bibliography/people916.html#TT277007"
}

@inproceedings{bb282311,
  AUTHOR    = "Huang, C. and Koishida, K.",
  TITLE     = "Improved Active Speaker Detection based on Optical Flow",
  BOOKTITLE = MULWS20,
  YEAR      = "2020",
  PAGES     = "4084--4090",
  BIBSOURCE = "http://www.visionbib.com/bibliography/people916.html#TT277008"
}

@inproceedings{bb282312,
  AUTHOR    = "Ma, X.J. and Wu, C.C. and Li, Y.Y. and Zhong, Q.Y.",
  TITLE     = "Speaker Identification System Based on Lip-Motion Feature",
  BOOKTITLE = CVS17,
  YEAR      = "2017",
  PAGES     = "289--299",
  BIBSOURCE = "http://www.visionbib.com/bibliography/people916.html#TT277009"
}

@inproceedings{bb282313,
  AUTHOR    = "Xu, B. and Lu, C. and Guo, Y. and Wang, J.",
  TITLE     = "Discriminative Multi-Modality Speech Recognition",
  BOOKTITLE = CVPR20,
  YEAR      = "2020",
  PAGES     = "14421--14430",
  BIBSOURCE = "http://www.visionbib.com/bibliography/people916.html#TT277010"
}

@inproceedings{bb282314,
  AUTHOR    = "Subedar, M. and Krishnan, R. and Meyer, P.L. and Tickoo, O. and Huang, J.",
  TITLE     = "Uncertainty-Aware Audiovisual Activity Recognition Using Deep {Bayesian} Variational Inference",
  BOOKTITLE = ICCV19,
  YEAR      = "2019",
  PAGES     = "6300--6309",
  BIBSOURCE = "http://www.visionbib.com/bibliography/people916.html#TT277011"
}

@inproceedings{bb282315,
  AUTHOR    = "Alamri, H. and Cartillier, V. and Das, A. and Wang, J. and Cherian, A. and Essa, I. and Batra, D. and Marks, T.K. and Hori, C. and Anderson, P. and Lee, S. and Parikh, D.",
  TITLE     = "Audio Visual Scene-Aware Dialog",
  BOOKTITLE = CVPR19,
  YEAR      = "2019",
  PAGES     = "7550--7559",
  BIBSOURCE = "http://www.visionbib.com/bibliography/people916.html#TT277012"
}

@inproceedings{bb282316,
  AUTHOR    = "Niu, Y.L. and Zhang, H.W. and Zhang, M.L. and Zhang, J.H. and Lu, Z.W. and Wen, J.R.",
  TITLE     = "Recursive Visual Attention in Visual Dialog",
  BOOKTITLE = CVPR19,
  YEAR      = "2019",
  PAGES     = "6672--6681",
  BIBSOURCE = "http://www.visionbib.com/bibliography/people916.html#TT277013"
}

@inproceedings{bb282317,
  AUTHOR    = "Schwartz, I. and Schwing, A.G. and Hazan, T.",
  TITLE     = "A Simple Baseline for Audio-Visual Scene-Aware Dialog",
  BOOKTITLE = CVPR19,
  YEAR      = "2019",
  PAGES     = "12540--12550",
  BIBSOURCE = "http://www.visionbib.com/bibliography/people916.html#TT277014"
}

@inproceedings{bb282318,
  AUTHOR    = "Lu, Y. and Lee, H. and Tseng, H. and Yang, M.",
  TITLE     = "Self-Supervised Audio Spatialization with Correspondence Classifier",
  BOOKTITLE = ICIP19,
  YEAR      = "2019",
  PAGES     = "3347--3351",
  BIBSOURCE = "http://www.visionbib.com/bibliography/people916.html#TT277015"
}

@inproceedings{bb282319,
  AUTHOR    = "Meng, D. and Peng, X. and Wang, K. and Qiao, Y.",
  TITLE     = "Frame Attention Networks for Facial Expression Recognition in Videos",
  BOOKTITLE = ICIP19,
  YEAR      = "2019",
  PAGES     = "3866--3870",
  BIBSOURCE = "http://www.visionbib.com/bibliography/people916.html#TT277016"
}

@inproceedings{bb282320,
  AUTHOR    = "Shahid, M. and Beyan, C. and Murino, V.",
  TITLE     = "Comparisons of Visual Activity Primitives for Voice Activity Detection",
  BOOKTITLE = CIAP19,
  YEAR      = "2019",
  PAGES     = "I: 48--59",
  BIBSOURCE = "http://www.visionbib.com/bibliography/people916.html#TT277017"
}

@inproceedings{bb282321,
  AUTHOR    = "Kim, C.I. and Shin, H.J.V. and Oh, T.H. and Kaspar, A. and Elgharib, M. and Matusik, W.",
  TITLE     = "On Learning Associations of Faces and Voices",
  BOOKTITLE = ACCV18,
  YEAR      = "2018",
  PAGES     = "V: 276--292",
  BIBSOURCE = "http://www.visionbib.com/bibliography/people916.html#TT277018"
}

@inproceedings{bb282322,
  AUTHOR    = "Schindler, A. and Boyer, M. and Lindley, A. and Schreiber, D. and Philipp, T.",
  TITLE     = "Large Scale Audio-Visual Video Analytics Platform for Forensic Investigations of Terroristic Attacks",
  BOOKTITLE = "MMMod19",
  YEAR      = "2019",
  PAGES     = "II: 106--119",
  BIBSOURCE = "http://www.visionbib.com/bibliography/people916.html#TT277019"
}

% NOTE(review): the end page 22297 of bb282323 is kept exactly as found in
% the source data; it looks suspicious for a range starting at 2229 --
% confirm against the publisher record.
@inproceedings{bb282323,
  AUTHOR    = "Oliveira, D.A.B. and Mattos, A.B. and da Silva Morais, E.",
  TITLE     = "Improving Viseme Recognition Using {GAN}-Based Frontal View Mapping",
  BOOKTITLE = AMFG18,
  YEAR      = "2018",
  PAGES     = "2229--22297",
  BIBSOURCE = "http://www.visionbib.com/bibliography/people916.html#TT277020"
}

@inproceedings{bb282324,
  AUTHOR    = "Yang, X. and Molchanov, P. and Kautz, J.",
  TITLE     = "Making Convolutional Networks Recurrent for Visual Sequence Learning",
  BOOKTITLE = CVPR18,
  YEAR      = "2018",
  PAGES     = "6469--6478",
  BIBSOURCE = "http://www.visionbib.com/bibliography/people916.html#TT277021"
}

@inproceedings{bb282325,
  AUTHOR    = "Zhang, J. and Richmond, K. and Fisher, R.B.",
  TITLE     = "Dual-modality Talking-metrics: {3D} Visual-Audio Integrated Behaviometric Cues from Speakers",
  BOOKTITLE = ICPR18,
  YEAR      = "2018",
  PAGES     = "3144--3149",
  BIBSOURCE = "http://www.visionbib.com/bibliography/people916.html#TT277022"
}

@inproceedings{bb282326,
  AUTHOR    = "Chowdhury, A. and Atoum, Y. and Tran, L. and Liu, X. and Ross, A.",
  TITLE     = "{MSU-AVIS} dataset: Fusing Face and Voice Modalities for Biometric Recognition in Indoor Surveillance Videos",
  BOOKTITLE = ICPR18,
  YEAR      = "2018",
  PAGES     = "3567--3573",
  BIBSOURCE = "http://www.visionbib.com/bibliography/people916.html#TT277023"
}

@inproceedings{bb282327,
  AUTHOR    = "Nagrani, A. and Albanie, S. and Zisserman, A.",
  TITLE     = "Seeing Voices and Hearing Faces: Cross-Modal Biometric Matching",
  BOOKTITLE = CVPR18,
  YEAR      = "2018",
  PAGES     = "8427--8436",
  BIBSOURCE = "http://www.visionbib.com/bibliography/people916.html#TT277024"
}

@inproceedings{bb282328,
  AUTHOR    = "Saitoh, T. and Kubokawa, M.",
  TITLE     = "{SSSD}: Speech Scene database by Smart Device for Visual Speech Recognition",
  BOOKTITLE = ICPR18,
  YEAR      = "2018",
  PAGES     = "3228--3232",
  BIBSOURCE = "http://www.visionbib.com/bibliography/people916.html#TT277025"
}

@inproceedings{bb282329,
  AUTHOR    = "Owens, A. and Efros, A.A.",
  TITLE     = "Audio-Visual Scene Analysis with Self-Supervised Multisensory Features",
  BOOKTITLE = ECCV18,
  YEAR      = "2018",
  PAGES     = "VI: 639--658",
  BIBSOURCE = "http://www.visionbib.com/bibliography/people916.html#TT277026"
}

@inproceedings{bb282330,
  AUTHOR    = "Berlin, A.A. and Surati, R.",
  TITLE     = "Video Deconfounding: Hearing-Aid Inspired Video Enhancement",
  BOOKTITLE = IVMSP18,
  YEAR      = "2018",
  PAGES     = "1--5",
  BIBSOURCE = "http://www.visionbib.com/bibliography/people916.html#TT277027"
}

@inproceedings{bb282331,
  AUTHOR    = "Ding, R. and Pang, C. and Liu, H.",
  TITLE     = "Audio-Visual Keyword Spotting Based on Multidimensional Convolutional Neural Network",
  BOOKTITLE = ICIP18,
  YEAR      = "2018",
  PAGES     = "4138--4142",
  BIBSOURCE = "http://www.visionbib.com/bibliography/people916.html#TT277028"
}

@inproceedings{bb282332,
  AUTHOR    = "Liao, J. and Wang, S. and Zhang, X. and Liu, G.",
  TITLE     = "{3D} Convolutional Neural Networks Based Speaker Identification and Authentication",
  BOOKTITLE = ICIP18,
  YEAR      = "2018",
  PAGES     = "2042--2046",
  BIBSOURCE = "http://www.visionbib.com/bibliography/people916.html#TT277029"
}

@inproceedings{bb282333,
  AUTHOR    = "Savran, A. and Tavarone, R. and Higy, B. and Badino, L. and Bartolozzi, C.",
  TITLE     = "Energy and Computation Efficient Audio-Visual Voice Activity Detection Driven by Event-Cameras",
  BOOKTITLE = FG18,
  YEAR      = "2018",
  PAGES     = "333--340",
  BIBSOURCE = "http://www.visionbib.com/bibliography/people916.html#TT277030"
}

@inproceedings{bb282334,
  AUTHOR    = "Ephrat, A. and Halperin, T. and Peleg, S.",
  TITLE     = "Improved Speech Reconstruction from Silent Video",
  BOOKTITLE = CVAVM17,
  YEAR      = "2017",
  PAGES     = "455--462",
  BIBSOURCE = "http://www.visionbib.com/bibliography/people916.html#TT277031"
}

@inproceedings{bb282335,
  AUTHOR    = "Ahn, J. and Kim, Y.J. and Kim, D.J.",
  TITLE     = "Patch-based visual microphone for improving quality of sound",
  BOOKTITLE = ICPR16,
  YEAR      = "2016",
  PAGES     = "3927--3932",
  BIBSOURCE = "http://www.visionbib.com/bibliography/people916.html#TT277032"
}

@inproceedings{bb282336,
  AUTHOR    = "Miao, C.L. and Feng, J.W. and Ding, Y. and Yang, Y. and Chen, X.G. and Ji, X.Y.",
  TITLE     = "Unsupervised person clustering in videos with cross-modal communication",
  BOOKTITLE = VCIP16,
  YEAR      = "2016",
  PAGES     = "1--4",
  BIBSOURCE = "http://www.visionbib.com/bibliography/people916.html#TT277033"
}

@inproceedings{bb282337,
  AUTHOR    = "Hu, D. and Li, X.L. and Lu, X.Q.",
  TITLE     = "Temporal Multimodal Learning in Audiovisual Speech Recognition",
  BOOKTITLE = CVPR16,
  YEAR      = "2016",
  PAGES     = "3574--3582",
  BIBSOURCE = "http://www.visionbib.com/bibliography/people916.html#TT277034"
}

@inproceedings{bb282338,
  AUTHOR    = "Liu, H. and Fan, T. and Wu, P.P.",
  TITLE     = "Audio-visual Keyword Spotting for {Mandarin} Based on Discriminative Local Spatial-Temporal Descriptors",
  BOOKTITLE = ICPR14,
  YEAR      = "2014",
  PAGES     = "785--790",
  BIBSOURCE = "http://www.visionbib.com/bibliography/people916.html#TT277035"
}

@inproceedings{bb282339,
  AUTHOR    = "Ringeval, F. and Sonderegger, A. and Sauer, J. and Lalanne, D.",
  TITLE     = "Introducing the {RECOLA} multimodal corpus of remote collaborative and affective interactions",
  BOOKTITLE = FG13,
  YEAR      = "2013",
  PAGES     = "1--8",
  BIBSOURCE = "http://www.visionbib.com/bibliography/people916.html#TT277036"
}

@inproceedings{bb282340,
  AUTHOR    = "Aubrey, A.J. and Cunningham, D.W. and Marshall, D. and Rosin, P.L. and Shin, A.",
  TITLE     = "The Face Speaks: Contextual and Temporal Sensitivity to Backchannel Responses",
  BOOKTITLE = FaceCVHum12,
  YEAR      = "2012",
  PAGES     = "II: 248--259",
  BIBSOURCE = "http://www.visionbib.com/bibliography/people916.html#TT277037"
}

@inproceedings{bb282341,
  AUTHOR    = "Tawari, A. and Trivedi, M.",
  TITLE     = "Audio-visual data association for face expression analysis",
  BOOKTITLE = ICPR12,
  YEAR      = "2012",
  PAGES     = "1120--1123",
  BIBSOURCE = "http://www.visionbib.com/bibliography/people916.html#TT277038"
}

@inproceedings{bb282342,
  AUTHOR    = "Taj, M. and Cavallaro, A.",
  TITLE     = "Interaction recognition in wide areas using audiovisual sensors",
  BOOKTITLE = ICIP12,
  YEAR      = "2012",
  PAGES     = "1113--1116",
  BIBSOURCE = "http://www.visionbib.com/bibliography/people916.html#TT277039"
}

@inproceedings{bb282343,
  AUTHOR    = "Giorgolo, G.",
  TITLE     = "Integration of Gesture and Verbal Language: A Formal Semantics Approach",
  BOOKTITLE = GW11,
  YEAR      = "2011",
  PAGES     = "216--227",
  BIBSOURCE = "http://www.visionbib.com/bibliography/people916.html#TT277040"
}

@inproceedings{bb282344,
  AUTHOR    = "Le, Q.A. and Pelachaud, C.",
  TITLE     = "Generating Co-speech Gestures for the Humanoid Robot {NAO} through {BML}",
  BOOKTITLE = GW11,
  YEAR      = "2011",
  PAGES     = "228--237",
  BIBSOURCE = "http://www.visionbib.com/bibliography/people916.html#TT277041"
}

@inproceedings{bb282345,
  AUTHOR    = "Navarathna, R. and Dean, D. and Sridharan, S. and Fookes, C. and Lucey, P.",
  TITLE     = "Visual Voice Activity Detection Using Frontal versus Profile Views",
  BOOKTITLE = DICTA11,
  YEAR      = "2011",
  PAGES     = "134--139",
  BIBSOURCE = "http://www.visionbib.com/bibliography/people916.html#TT277042"
}

@inproceedings{bb282346,
  AUTHOR    = "Komai, Y. and Ariki, Y. and Takiguchi, T.",
  TITLE     = "Audio-Visual Speech Recognition Based on {AAM} Parameter and Phoneme Analysis of Visual Feature",
  BOOKTITLE = PSIVT11,
  YEAR      = "2011",
  PAGES     = "I: 97--108",
  BIBSOURCE = "http://www.visionbib.com/bibliography/people916.html#TT277043"
}

@inproceedings{bb282347,
  AUTHOR    = "Zheng, H.M. and Wang, M. and Li, Z.",
  TITLE     = "Audio-visual speaker identification with multi-view distance metric learning",
  BOOKTITLE = ICIP10,
  YEAR      = "2010",
  PAGES     = "4561--4564",
  BIBSOURCE = "http://www.visionbib.com/bibliography/people916.html#TT277044"
}

@inproceedings{bb282348,
  AUTHOR    = "Krishnan, R.K. and Sarkar, S.",
  TITLE     = "Similarity Measure between Two Gestures Using Triplets",
  BOOKTITLE = HAU3D13,
  YEAR      = "2013",
  PAGES     = "506--513",
  BIBSOURCE = "http://www.visionbib.com/bibliography/people916.html#TT277045"
}

@inproceedings{bb282349,
  AUTHOR    = "Krishnan, R.K. and Sarkar, S.",
  TITLE     = "Detecting Group Turn Patterns in Conversations Using Audio-Video Change Scale-Space",
  BOOKTITLE = ICPR10,
  YEAR      = "2010",
  PAGES     = "137--140",
  BIBSOURCE = "http://www.visionbib.com/bibliography/people916.html#TT277046"
}

@inproceedings{bb282350,
  AUTHOR    = "Aran, O. and Gatica Perez, D.",
  TITLE     = "Fusing Audio-Visual Nonverbal Cues to Detect Dominant People in Group Conversations",
  BOOKTITLE = ICPR10,
  YEAR      = "2010",
  PAGES     = "3687--3690",
  BIBSOURCE = "http://www.visionbib.com/bibliography/people916.html#TT277047"
}

@inproceedings{bb282351,
  AUTHOR    = "Niese, R. and Al Hamadi, A. and Michaelis, B.",
  TITLE     = "A New Multi-camera Based Facial Expression Analysis Concept",
  BOOKTITLE = ICIAR12,
  YEAR      = "2012",
  PAGES     = "II: 64--71",
  BIBSOURCE = "http://www.visionbib.com/bibliography/people916.html#TT277048"
}

@inproceedings{bb282352,
  AUTHOR    = "Steer, M.A. and Al Hamadi, A. and Michaelis, B.",
  TITLE     = "Audio-Visual Data Fusion Using a Particle Filter in the Application of Face Recognition",
  BOOKTITLE = ICPR10,
  YEAR      = "2010",
  PAGES     = "4392--4395",
  BIBSOURCE = "http://www.visionbib.com/bibliography/people916.html#TT277049"
}

@inproceedings{bb282353,
  AUTHOR    = "Roy, A. and Marcel, S.",
  TITLE     = "Crossmodal Matching of Speakers Using Lip and Voice Features in Temporally Non-overlapping Audio and Video Streams",
  BOOKTITLE = ICPR10,
  YEAR      = "2010",
  PAGES     = "4504--4507",
  BIBSOURCE = "http://www.visionbib.com/bibliography/people916.html#TT277050"
}

@inproceedings{bb282354,
  AUTHOR    = "Cour, T. and Sapp, B. and Nagle, A. and Taskar, B.",
  TITLE     = "Talking pictures: Temporal grouping and dialog-supervised person recognition",
  BOOKTITLE = CVPR10,
  YEAR      = "2010",
  PAGES     = "1014--1021",
  BIBSOURCE = "http://www.visionbib.com/bibliography/people916.html#TT277051"
}

@inproceedings{bb282355,
  AUTHOR    = "Wu, G.Y. and Zhu, J. and Xu, H.H.",
  TITLE     = "A hybrid visual feature extraction method for audio-visual speech recognition",
  BOOKTITLE = ICIP09,
  YEAR      = "2009",
  PAGES     = "1829--1832",
  BIBSOURCE = "http://www.visionbib.com/bibliography/people916.html#TT277052"
}

@inproceedings{bb282356,
  AUTHOR    = "Ceballos, A. and Gomez, J. and Prieto, F. and Redarce, T.",
  TITLE     = "Robot Command Interface Using an Audio-Visual Speech Recognition System",
  BOOKTITLE = CIARP09,
  YEAR      = "2009",
  PAGES     = "869--876",
  BIBSOURCE = "http://www.visionbib.com/bibliography/people916.html#TT277053"
}

@inproceedings{bb282357,
  AUTHOR    = "Cifani, S. and Abel, A. and Hussain, A. and Squartini, S. and Piazza, F.",
  TITLE     = "An Investigation into Audiovisual Speech Correlation in Reverberant Noisy Environments",
  BOOKTITLE = COST08,
  YEAR      = "2008",
  PAGES     = "331--343",
  BIBSOURCE = "http://www.visionbib.com/bibliography/people916.html#TT277054"
}

@inproceedings{bb282358,
  AUTHOR    = "Lee, J.S. and Ebrahimi, T.",
  TITLE     = "Two-Level Bimodal Association for Audio-Visual Speech Recognition",
  BOOKTITLE = ACIVS09,
  YEAR      = "2009",
  PAGES     = "133--144",
  BIBSOURCE = "http://www.visionbib.com/bibliography/people916.html#TT277055"
}

@inproceedings{bb282359,
  AUTHOR    = "Marchegiani, M.L. and Pirri, F. and Pizzoli, M.",
  TITLE     = "Multimodal Speaker Recognition in a Conversation Scenario",
  BOOKTITLE = CVS09,
  YEAR      = "2009",
  PAGES     = "11--20",
  BIBSOURCE = "http://www.visionbib.com/bibliography/people916.html#TT277056"
}

@inproceedings{bb282360,
  AUTHOR    = "Karam, W. and Mokbel, C. and Greige, H. and Chollet, G.",
  TITLE     = "Audio-Visual Identity Verification and Robustness to Imposture",
  BOOKTITLE = ICB09,
  YEAR      = "2009",
  PAGES     = "796--805",
  BIBSOURCE = "http://www.visionbib.com/bibliography/people916.html#TT277057"
}

@inproceedings{bb282361,
  AUTHOR    = "Rebillat, M. and Katz, B.F.G. and Corteel, E.",
  TITLE     = "{SMART-I2}: Spatial Multi-user Audio-visual Real-time interactive interface, A broadcast application context",
  BOOKTITLE = "3DTV09",
  YEAR      = "2009",
  PAGES     = "1--4",
  BIBSOURCE = "http://www.visionbib.com/bibliography/people916.html#TT277058"
}

% NOTE(review): bb282362 and bb282363 share author, title, year and the same
% BIBSOURCE anchor; they differ only in BOOKTITLE (CSAIL vs. Ph.D.). This
% looks like one work (a thesis that also appeared as a lab report) split
% into two records. Both keys are kept so existing citations still resolve.
% The bare token Ph.D. is read as a string macro name -- confirm a macro of
% that name is defined, or retype the entry as a thesis once the school is
% known.
@inproceedings{bb282362,
  AUTHOR    = "Eisenstein, J.",
  TITLE     = "Gesture in Automatic Discourse Processing",
  BOOKTITLE = CSAIL,
  YEAR      = "2008",
  BIBSOURCE = "http://www.visionbib.com/bibliography/people916.html#TT277059"
}

@inproceedings{bb282363,
  AUTHOR    = "Eisenstein, J.",
  TITLE     = "Gesture in Automatic Discourse Processing",
  BOOKTITLE = Ph.D.,
  YEAR      = "2008",
  BIBSOURCE = "http://www.visionbib.com/bibliography/people916.html#TT277059"
}

@inproceedings{bb282364,
  AUTHOR    = "Das, A. and Manyam, O.K. and Tapaswi, M.",
  TITLE     = "Audio-Visual Person Authentication with Multiple Visualized-Speech Features and Multiple Face Profiles",
  BOOKTITLE = ICCVGIP08,
  YEAR      = "2008",
  PAGES     = "39--46",
  BIBSOURCE = "http://www.visionbib.com/bibliography/people916.html#TT277060"
}

@inproceedings{bb282365,
  AUTHOR    = "Cao, Y. and Baang, S. and Liu, S.H. and Li, M. and Hu, S.Q.",
  TITLE     = "Audio-visual event classification via spatial-temporal-audio words",
  BOOKTITLE = ICPR08,
  YEAR      = "2008",
  PAGES     = "1--5",
  BIBSOURCE = "http://www.visionbib.com/bibliography/people916.html#TT277061"
}

@inproceedings{bb282366,
  AUTHOR    = "Terry, L.H. and Shiell, D.J. and Katsaggelos, A.K.",
  TITLE     = "Feature space video stream consistency estimation for dynamic stream weighting in audio-visual speech recognition",
  BOOKTITLE = ICIP08,
  YEAR      = "2008",
  PAGES     = "1316--1319",
  BIBSOURCE = "http://www.visionbib.com/bibliography/people916.html#TT277062"
}

@inproceedings{bb282367,
  AUTHOR    = "Naseem, I. and Mian, A.S.",
  TITLE     = "User Verification by Combining Speech and Face Biometrics in Video",
  BOOKTITLE = ISVC08,
  YEAR      = "2008",
  PAGES     = "II: 482--492",
  BIBSOURCE = "http://www.visionbib.com/bibliography/people916.html#TT277063"
}

@inproceedings{bb282368,
  AUTHOR    = "Ettinger, E. and Freund, Y.",
  TITLE     = "Coordinate-free calibration of an acoustically driven camera pointing system",
  BOOKTITLE = ICDSC08,
  YEAR      = "2008",
  PAGES     = "1--9",
  BIBSOURCE = "http://www.visionbib.com/bibliography/people916.html#TT277064"
}

% Page numbers for bb282369, bb282370 and bb282371 are not known (the source
% data held only an "xx-yy" placeholder), so PAGES is omitted.
@inproceedings{bb282369,
  AUTHOR    = "Hung, H. and Friedland, G.",
  TITLE     = "Towards Audio-Visual On-line Diarization Of Participants In Group Meetings",
  BOOKTITLE = M2SFA208,
  YEAR      = "2008",
  BIBSOURCE = "http://www.visionbib.com/bibliography/people916.html#TT277065"
}

@inproceedings{bb282370,
  AUTHOR    = "Liu, Y.Y. and Sato, Y.",
  TITLE     = "Finding Speaker Face Region by Audiovisual Correlation",
  BOOKTITLE = M2SFA208,
  YEAR      = "2008",
  BIBSOURCE = "http://www.visionbib.com/bibliography/people916.html#TT277066"
}

@inproceedings{bb282371,
  AUTHOR    = "Pachoud, S. and Gong, S. and Cavallaro, A.",
  TITLE     = "Video Augmentation for Improving Audio Speech Recognition under Noise",
  BOOKTITLE = BMVC08,
  YEAR      = "2008",
  BIBSOURCE = "http://www.visionbib.com/bibliography/people916.html#TT277067"
}

@inproceedings{bb282372,
  AUTHOR    = "Horii, Y. and Kawashima, H. and Matsuyama, T.",
  TITLE     = "Speaker detection using the timing structure of lip motion and sound",
  BOOKTITLE = CVPR4HB08,
  YEAR      = "2008",
  PAGES     = "1--8",
  BIBSOURCE = "http://www.visionbib.com/bibliography/people916.html#TT277068"
}

% Page numbers for bb282373 are not known (the source data held only an
% "xx-yy" placeholder), so PAGES is omitted.
@inproceedings{bb282373,
  AUTHOR    = "Rua, E.A. and Castro, J.L.A. and Mateo, C.G.",
  TITLE     = "Quality-Based Score Normalization for Audiovisual Person Authentication",
  BOOKTITLE = ICIAR08,
  YEAR      = "2008",
  BIBSOURCE = "http://www.visionbib.com/bibliography/people916.html#TT277069"
}

@inproceedings{bb282374,
  AUTHOR    = "Wang, L. and Tjondrongoro, D. and Liu, Y.",
  TITLE     = "Clustering and Visualizing Audio-Visual Dataset on Mobile Devices in a Topic-Oriented Manner",
  BOOKTITLE = Visual07,
  YEAR      = "2007",
  PAGES     = "310--321",
  BIBSOURCE = "http://www.visionbib.com/bibliography/people916.html#TT277070"
}

@inproceedings{bb282375,
  AUTHOR    = "Zajdel, W. and Krijnders, J.D. and Andringa, T. and Gavrila, D.M.",
  TITLE     = "{CASSANDRA}: audio-video sensor fusion for aggression detection",
  BOOKTITLE = AVSBS07,
  YEAR      = "2007",
  PAGES     = "200--205",
  BIBSOURCE = "http://www.visionbib.com/bibliography/people916.html#TT277071"
}

@inproceedings{bb282376,
  AUTHOR    = "Stodle, D. and Bjorndalen, J.M. and Anshus, O.J.",
  TITLE     = "A System for Hybrid Vision- and Sound-Based Interaction with Distal and Proximal Targets on Wall-Sized, High-Resolution Tiled Displays",
  BOOKTITLE = CVHCI07,
  YEAR      = "2007",
  PAGES     = "59--68",
  BIBSOURCE = "http://www.visionbib.com/bibliography/people916.html#TT277072"
}

@inproceedings{bb282377,
  AUTHOR    = "van Hengel, P.W.J. and Andringa, T.C.",
  TITLE     = "Verbal aggression detection in complex social environments",
  BOOKTITLE = AVSBS07,
  YEAR      = "2007",
  PAGES     = "15--20",
  BIBSOURCE = "http://www.visionbib.com/bibliography/people916.html#TT277073"
}

@inproceedings{bb282378,
  AUTHOR    = "Ikeda, O.",
  TITLE     = "Detection of a Speaker in Video by Combined Analysis of Speech Sound and Mouth Movement",
  BOOKTITLE = ISVC07,
  YEAR      = "2007",
  PAGES     = "II: 602--610",
  BIBSOURCE = "http://www.visionbib.com/bibliography/people916.html#TT277074"
}

@inproceedings{bb282379,
  AUTHOR    = "Das, A.",
  TITLE     = "Audio Visual Person Authentication by Multiple Nearest Neighbor Classifiers",
  BOOKTITLE = ICB07,
  YEAR      = "2007",
  PAGES     = "1114--1123",
  BIBSOURCE = "http://www.visionbib.com/bibliography/people916.html#TT277075"
}

@inproceedings{bb282380,
  AUTHOR    = "Xin, L. and Tao, J.H. and Tan, T.N.",
  TITLE     = "Dynamic Audio-Visual Mapping using Fused Hidden {Markov} Model Inversion Method",
  BOOKTITLE = ICIP07,
  YEAR      = "2007",
  PAGES     = "III: 293--296",
  BIBSOURCE = "http://www.visionbib.com/bibliography/people916.html#TT277076"
}

@inproceedings{bb282381,
  AUTHOR    = "Barzelay, Z. and Schechner, Y.Y.",
  TITLE     = "Harmony in Motion",
  BOOKTITLE = CVPR07,
  YEAR      = "2007",
  PAGES     = "1--8",
  BIBSOURCE = "http://www.visionbib.com/bibliography/people916.html#TT277077"
}

@inproceedings{bb282382,
  AUTHOR    = "O'Donovan, A. and Duraiswami, R. and Neumann, J.",
  TITLE     = "Microphone Arrays as Generalized Cameras for Integrated Audio Visual Processing",
  BOOKTITLE = CVPR07,
  YEAR      = "2007",
  PAGES     = "1--8",
  BIBSOURCE = "http://www.visionbib.com/bibliography/people916.html#TT277078"
}

@inproceedings{bb282383,
  AUTHOR    = "Abbas, J. and Dagli, C.K. and Huang, T.S.",
  TITLE     = "A Multimodality Framework for Creating Speaker/Non-Speaker Profile Databases for Real-World Video",
  BOOKTITLE = SLAM07,
  YEAR      = "2007",
  PAGES     = "1--8",
  BIBSOURCE = "http://www.visionbib.com/bibliography/people916.html#TT277079"
}

@inproceedings{bb282384,
  AUTHOR    = "Monaci, G. and Vandergheynst, P.",
  TITLE     = "Audiovisual Gestalts",
  BOOKTITLE = PercOrg06,
  YEAR      = "2006",
  PAGES     = "200",
  BIBSOURCE = "http://www.visionbib.com/bibliography/people916.html#TT277080"
}

@inproceedings{bb282385,
  AUTHOR    = "Zhu, Z.G. and Li, W.H. and Molina, E. and Wolberg, G.",
  TITLE     = "{LDV} Sensing and Processing for Remote Hearing in a Multimodal Surveillance System",
  BOOKTITLE = MSCSAS07,
  YEAR      = "2007",
  PAGES     = "1--2",
  BIBSOURCE = "http://www.visionbib.com/bibliography/people916.html#TT277081"
}

@inproceedings{bb282386,
  AUTHOR    = "Zhu, Z.G. and Li, W.H. and Wolberg, G.",
  TITLE     = "Integrating {LDV} Audio and {IR} Video for Remote Multimodal Surveillance",
  BOOKTITLE = OTCBVS05,
  YEAR      = "2005",
  PAGES     = "III: 10",
  BIBSOURCE = "http://www.visionbib.com/bibliography/people916.html#TT277082"
}

@inproceedings{bb282387,
  AUTHOR    = "Wu, Z.Y. and Cai, L.H. and Meng, H.",
  TITLE     = "Multi-level Fusion of Audio and Visual Features for Speaker Identification",
  BOOKTITLE = ICB06,
  YEAR      = "2006",
  PAGES     = "493--499",
  BIBSOURCE = "http://www.visionbib.com/bibliography/people916.html#TT277083"
}

@inproceedings{bb282388,
  AUTHOR    = "Yang, P. and Yang, Y.C. and Wu, Z.H.",
  TITLE     = "Exploiting Glottal Information in Speaker Recognition Using Parallel {GMMs}",
  BOOKTITLE = AVBPA05,
  YEAR      = "2005",
  PAGES     = "804",
  BIBSOURCE = "http://www.visionbib.com/bibliography/people916.html#TT277084"
}

@inproceedings{bb282389,
  AUTHOR    = "Lei, Z.C.",
  TITLE     = "Combining the Likelihood and the {Kullback-Leibler} Distance in Estimating the Universal Background Model for Speaker Verification Using {SVM}",
  BOOKTITLE = ICPR10,
  YEAR      = "2010",
  PAGES     = "4553--4556",
  BIBSOURCE = "http://www.visionbib.com/bibliography/people916.html#TT277085"
}

@inproceedings{bb282390,
  AUTHOR    = "Lei, Z.C. and Yang, Y.C. and Wu, Z.H.",
  TITLE     = "An {UBM}-Based Reference Space for Speaker Recognition",
  BOOKTITLE = ICPR06,
  YEAR      = "2006",
  PAGES     = "IV: 318--321",
  BIBSOURCE = "http://www.visionbib.com/bibliography/people916.html#TT277086"
}

@inproceedings{bb282391,
  AUTHOR    = "Lei, Z.C. and Yang, Y.C. and Wu, Z.H.",
  TITLE     = "Constructing the Discriminative Kernels Using {GMM} for Text-Independent Speaker Identification",
  BOOKTITLE = IWBRS05,
  YEAR      = "2005",
  PAGES     = "165",
  BIBSOURCE = "http://www.visionbib.com/bibliography/people916.html#TT277087"
}

@inproceedings{bb282392,
  AUTHOR    = "Lei, Z.C. and Yang, Y.C. and Wu, Z.H.",
  TITLE     = "Speaker Identification Using the {VQ}-Based Discriminative Kernels",
  BOOKTITLE = AVBPA05,
  YEAR      = "2005",
  PAGES     = "797",
  BIBSOURCE = "http://www.visionbib.com/bibliography/people916.html#TT277088"
}

@inproceedings{bb282393,
  AUTHOR    = "Li, D.D. and Yang, Y.C. and Wu, Z.H.",
  TITLE     = "Dynamic {Bayesian} Networks for Audio-Visual Speaker Recognition",
  BOOKTITLE = ICB06,
  YEAR      = "2006",
  PAGES     = "539--545",
  BIBSOURCE = "http://www.visionbib.com/bibliography/people916.html#TT277089"
}

@inproceedings{bb282394,
  AUTHOR    = "Fox, N.A. and O'Mullane, B.A. and Reilly, R.B.",
  TITLE     = "{VALID}: A New Practical Audio-Visual Database, and Comparative Results",
  BOOKTITLE = AVBPA05,
  YEAR      = "2005",
  PAGES     = "777",
  BIBSOURCE = "http://www.visionbib.com/bibliography/people916.html#TT277090"
}

% bb282395 describes an image database distributed online, so it is typed as
% a misc entry with HOWPUBLISHED rather than as a book with a publisher.
@misc{bb282395,
  AUTHOR       = "Sharma, P. and Reilly, R.B.",
  TITLE        = "The {UCD} Colour Face Image Database for Face Detection",
  HOWPUBLISHED = "Online",
  YEAR         = "1998",
  BIBSOURCE    = "http://www.visionbib.com/bibliography/people916.html#TT277091"
}

@inproceedings{bb282396,
  AUTHOR    = "Fox, N.A. and O'Mullane, B.A. and Reilly, R.B.",
  TITLE     = "Audio-Visual Speaker Identification via Adaptive Fusion Using Reliability Estimates of Both Modalities",
  BOOKTITLE = AVBPA05,
  YEAR      = "2005",
  PAGES     = "787",
  BIBSOURCE = "http://www.visionbib.com/bibliography/people916.html#TT277092"
}

@inproceedings{bb282397,
  AUTHOR    = "Zhang, D. and Ghobakhlou, A. and Kasabov, N.",
  TITLE     = "An adaptive model of person identification combining speech and image information",
  BOOKTITLE = ICARCV04,
  YEAR      = "2004",
  PAGES     = "I: 413--418",
  BIBSOURCE = "http://www.visionbib.com/bibliography/people916.html#TT277093"
}

@inproceedings{bb282398,
  AUTHOR    = "Kratt, J. and Metze, F. and Stiefelhagen, R. and Waibel, A.",
  TITLE     = "Large Vocabulary Audio-Visual Speech Recognition Using the {Janus} Speech Recognition Toolkit",
  BOOKTITLE = DAGM04,
  YEAR      = "2004",
  PAGES     = "488--495",
  BIBSOURCE = "http://www.visionbib.com/bibliography/people916.html#TT277094"
}

@inproceedings{bb282399,
  AUTHOR    = "Hanafiah, Z.M. and Yamazaki, C. and Nakamura, A. and Kuno, Y.",
  TITLE     = "Understanding inexplicit utterances using vision for helper robots",
  BOOKTITLE = ICPR04,
  YEAR      = "2004",
  PAGES     = "IV: 925--928",
  BIBSOURCE = "http://www.visionbib.com/bibliography/people916.html#TT277095"
}