@inproceedings{bb287500,
  author    = {Meng, D. and Peng, X. and Wang, K. and Qiao, Y.},
  title     = {Frame Attention Networks for Facial Expression Recognition in Videos},
  booktitle = ICIP19,
  year      = {2019},
  pages     = {3866--3870},
  bibsource = {http://www.visionbib.com/bibliography/people916.html#TT282137},
}

@inproceedings{bb287501,
  author    = {Shahid, M. and Beyan, C. and Murino, V.},
  title     = {Comparisons of Visual Activity Primitives for Voice Activity Detection},
  booktitle = CIAP19,
  year      = {2019},
  pages     = {I:48--59},
  bibsource = {http://www.visionbib.com/bibliography/people916.html#TT282138},
}

@inproceedings{bb287502,
  author    = {Kim, C. I. and Shin, H. J. V. and Oh, T. H. and Kaspar, A. and Elgharib, M. and Matusik, W.},
  title     = {On Learning Associations of Faces and Voices},
  booktitle = ACCV18,
  year      = {2018},
  pages     = {V:276--292},
  bibsource = {http://www.visionbib.com/bibliography/people916.html#TT282139},
}

@inproceedings{bb287503,
  author    = {Schindler, A. and Boyer, M. and Lindley, A. and Schreiber, D. and Philipp, T.},
  title     = {Large Scale Audio-Visual Video Analytics Platform for Forensic Investigations of Terroristic Attacks},
  booktitle = {MMMod19},
  year      = {2019},
  pages     = {II:106--119},
  bibsource = {http://www.visionbib.com/bibliography/people916.html#TT282140},
}

% NOTE(review): the end page 22297 is implausible for a start page of 2229 and
% looks like a metadata typo; the value is kept as exported -- verify against
% the publisher record before citing.
@inproceedings{bb287504,
  author    = {Oliveira, D. A. B. and Mattos, A. B. and da Silva Morais, E.},
  title     = {Improving Viseme Recognition Using {GAN}-Based Frontal View Mapping},
  booktitle = AMFG18,
  year      = {2018},
  pages     = {2229--22297},
  bibsource = {http://www.visionbib.com/bibliography/people916.html#TT282141},
}

@inproceedings{bb287505,
  author    = {Yang, X. and Molchanov, P. and Kautz, J.},
  title     = {Making Convolutional Networks Recurrent for Visual Sequence Learning},
  booktitle = CVPR18,
  year      = {2018},
  pages     = {6469--6478},
  bibsource = {http://www.visionbib.com/bibliography/people916.html#TT282142},
}

@inproceedings{bb287506,
  author    = {Zhang, J. and Richmond, K. and Fisher, R. B.},
  title     = {Dual-modality Talking-metrics: {3D} Visual-Audio Integrated Behaviometric Cues from Speakers},
  booktitle = ICPR18,
  year      = {2018},
  pages     = {3144--3149},
  bibsource = {http://www.visionbib.com/bibliography/people916.html#TT282143},
}

@inproceedings{bb287507,
  author    = {Chowdhury, A. and Atoum, Y. and Tran, L. and Liu, X. and Ross, A.},
  title     = {{MSU-AVIS} dataset: Fusing Face and Voice Modalities for Biometric Recognition in Indoor Surveillance Videos},
  booktitle = ICPR18,
  year      = {2018},
  pages     = {3567--3573},
  bibsource = {http://www.visionbib.com/bibliography/people916.html#TT282144},
}

@inproceedings{bb287508,
  author    = {Nagrani, A. and Albanie, S. and Zisserman, A.},
  title     = {Seeing Voices and Hearing Faces: Cross-Modal Biometric Matching},
  booktitle = CVPR18,
  year      = {2018},
  pages     = {8427--8436},
  bibsource = {http://www.visionbib.com/bibliography/people916.html#TT282145},
}

@inproceedings{bb287509,
  author    = {Saitoh, T. and Kubokawa, M.},
  title     = {{SSSD}: Speech Scene database by Smart Device for Visual Speech Recognition},
  booktitle = ICPR18,
  year      = {2018},
  pages     = {3228--3232},
  bibsource = {http://www.visionbib.com/bibliography/people916.html#TT282146},
}

@inproceedings{bb287510,
  author    = {Owens, A. and Efros, A. A.},
  title     = {Audio-Visual Scene Analysis with Self-Supervised Multisensory Features},
  booktitle = ECCV18,
  year      = {2018},
  pages     = {VI: 639--658},
  bibsource = {http://www.visionbib.com/bibliography/people916.html#TT282147},
}

@inproceedings{bb287511,
  author    = {Berlin, A. A. and Surati, R.},
  title     = {Video Deconfounding: Hearing-Aid Inspired Video Enhancement},
  booktitle = IVMSP18,
  year      = {2018},
  pages     = {1--5},
  bibsource = {http://www.visionbib.com/bibliography/people916.html#TT282148},
}

@inproceedings{bb287512,
  author    = {Ding, R. and Pang, C. and Liu, H.},
  title     = {Audio-Visual Keyword Spotting Based on Multidimensional Convolutional Neural Network},
  booktitle = ICIP18,
  year      = {2018},
  pages     = {4138--4142},
  bibsource = {http://www.visionbib.com/bibliography/people916.html#TT282149},
}

@inproceedings{bb287513,
  author    = {Liao, J. and Wang, S. and Zhang, X. and Liu, G.},
  title     = {{3D} Convolutional Neural Networks Based Speaker Identification and Authentication},
  booktitle = ICIP18,
  year      = {2018},
  pages     = {2042--2046},
  bibsource = {http://www.visionbib.com/bibliography/people916.html#TT282150},
}

@inproceedings{bb287514,
  author    = {Savran, A. and Tavarone, R. and Higy, B. and Badino, L. and Bartolozzi, C.},
  title     = {Energy and Computation Efficient Audio-Visual Voice Activity Detection Driven by Event-Cameras},
  booktitle = FG18,
  year      = {2018},
  pages     = {333--340},
  bibsource = {http://www.visionbib.com/bibliography/people916.html#TT282151},
}

@inproceedings{bb287515,
  author    = {Ephrat, A. and Halperin, T. and Peleg, S.},
  title     = {Improved Speech Reconstruction from Silent Video},
  booktitle = CVAVM17,
  year      = {2017},
  pages     = {455--462},
  bibsource = {http://www.visionbib.com/bibliography/people916.html#TT282152},
}

@inproceedings{bb287516,
  author    = {Ahn, J. and Kim, Y. J. and Kim, D. J.},
  title     = {Patch-based visual microphone for improving quality of sound},
  booktitle = ICPR16,
  year      = {2016},
  pages     = {3927--3932},
  bibsource = {http://www.visionbib.com/bibliography/people916.html#TT282153},
}

@inproceedings{bb287517,
  author    = {Miao, C. L. and Feng, J. W. and Ding, Y. and Yang, Y. and Chen, X. G. and Ji, X. Y.},
  title     = {Unsupervised person clustering in videos with cross-modal communication},
  booktitle = VCIP16,
  year      = {2016},
  pages     = {1--4},
  bibsource = {http://www.visionbib.com/bibliography/people916.html#TT282154},
}

@inproceedings{bb287518,
  author    = {Hu, D. and Li, X. L. and Lu, X. Q.},
  title     = {Temporal Multimodal Learning in Audiovisual Speech Recognition},
  booktitle = CVPR16,
  year      = {2016},
  pages     = {3574--3582},
  bibsource = {http://www.visionbib.com/bibliography/people916.html#TT282155},
}

@inproceedings{bb287519,
  author    = {Liu, H. and Fan, T. and Wu, P. P.},
  title     = {Audio-visual Keyword Spotting for {Mandarin} Based on Discriminative Local Spatial-Temporal Descriptors},
  booktitle = ICPR14,
  year      = {2014},
  pages     = {785--790},
  bibsource = {http://www.visionbib.com/bibliography/people916.html#TT282156},
}

@inproceedings{bb287520,
  author    = {Ringeval, F. and Sonderegger, A. and Sauer, J. and Lalanne, D.},
  title     = {Introducing the {RECOLA} multimodal corpus of remote collaborative and affective interactions},
  booktitle = FG13,
  year      = {2013},
  pages     = {1--8},
  bibsource = {http://www.visionbib.com/bibliography/people916.html#TT282157},
}

@inproceedings{bb287521,
  author    = {Aubrey, A. J. and Cunningham, D. W. and Marshall, D. and Rosin, P. L. and Shin, A.},
  title     = {The Face Speaks: Contextual and Temporal Sensitivity to Backchannel Responses},
  booktitle = FaceCVHum12,
  year      = {2012},
  pages     = {II:248--259},
  bibsource = {http://www.visionbib.com/bibliography/people916.html#TT282158},
}

@inproceedings{bb287522,
  author    = {Tawari, A. and Trivedi, M.},
  title     = {Audio-visual data association for face expression analysis},
  booktitle = ICPR12,
  year      = {2012},
  pages     = {1120--1123},
  bibsource = {http://www.visionbib.com/bibliography/people916.html#TT282159},
}

@inproceedings{bb287523,
  author    = {Taj, M. and Cavallaro, A.},
  title     = {Interaction recognition in wide areas using audiovisual sensors},
  booktitle = ICIP12,
  year      = {2012},
  pages     = {1113--1116},
  bibsource = {http://www.visionbib.com/bibliography/people916.html#TT282160},
}

@inproceedings{bb287524,
  author    = {Giorgolo, G.},
  title     = {Integration of Gesture and Verbal Language: A Formal Semantics Approach},
  booktitle = GW11,
  year      = {2011},
  pages     = {216--227},
  bibsource = {http://www.visionbib.com/bibliography/people916.html#TT282161},
}

@inproceedings{bb287525,
  author    = {Le, Q. A. and Pelachaud, C.},
  title     = {Generating Co-speech Gestures for the Humanoid Robot {NAO} through {BML}},
  booktitle = GW11,
  year      = {2011},
  pages     = {228--237},
  bibsource = {http://www.visionbib.com/bibliography/people916.html#TT282162},
}

@inproceedings{bb287526,
  author    = {Navarathna, R. and Dean, D. and Sridharan, S. and Fookes, C. and Lucey, P.},
  title     = {Visual Voice Activity Detection Using Frontal versus Profile Views},
  booktitle = DICTA11,
  year      = {2011},
  pages     = {134--139},
  bibsource = {http://www.visionbib.com/bibliography/people916.html#TT282163},
}

@inproceedings{bb287527,
  author    = {Komai, Y. and Ariki, Y. and Takiguchi, T.},
  title     = {Audio-Visual Speech Recognition Based on {AAM} Parameter and Phoneme Analysis of Visual Feature},
  booktitle = PSIVT11,
  year      = {2011},
  pages     = {I: 97--108},
  bibsource = {http://www.visionbib.com/bibliography/people916.html#TT282164},
}

@inproceedings{bb287528,
  author    = {Zheng, H. M. and Wang, M. and Li, Z.},
  title     = {Audio-visual speaker identification with multi-view distance metric learning},
  booktitle = ICIP10,
  year      = {2010},
  pages     = {4561--4564},
  bibsource = {http://www.visionbib.com/bibliography/people916.html#TT282165},
}

@inproceedings{bb287529,
  author    = {Krishnan, R. K. and Sarkar, S.},
  title     = {Similarity Measure between Two Gestures Using Triplets},
  booktitle = HAU3D13,
  year      = {2013},
  pages     = {506--513},
  bibsource = {http://www.visionbib.com/bibliography/people916.html#TT282166},
}

@inproceedings{bb287530,
  author    = {Krishnan, R. K. and Sarkar, S.},
  title     = {Detecting Group Turn Patterns in Conversations Using Audio-Video Change Scale-Space},
  booktitle = ICPR10,
  year      = {2010},
  pages     = {137--140},
  bibsource = {http://www.visionbib.com/bibliography/people916.html#TT282167},
}

@inproceedings{bb287531,
  author    = {Aran, O. and Gatica Perez, D.},
  title     = {Fusing Audio-Visual Nonverbal Cues to Detect Dominant People in Group Conversations},
  booktitle = ICPR10,
  year      = {2010},
  pages     = {3687--3690},
  bibsource = {http://www.visionbib.com/bibliography/people916.html#TT282168},
}

@inproceedings{bb287532,
  author    = {Niese, R. and Al Hamadi, A. and Michaelis, B.},
  title     = {A New Multi-camera Based Facial Expression Analysis Concept},
  booktitle = ICIAR12,
  year      = {2012},
  pages     = {II: 64--71},
  bibsource = {http://www.visionbib.com/bibliography/people916.html#TT282169},
}

@inproceedings{bb287533,
  author    = {Steer, M. A. and Al Hamadi, A. and Michaelis, B.},
  title     = {Audio-Visual Data Fusion Using a Particle Filter in the Application of Face Recognition},
  booktitle = ICPR10,
  year      = {2010},
  pages     = {4392--4395},
  bibsource = {http://www.visionbib.com/bibliography/people916.html#TT282170},
}

@inproceedings{bb287534,
  author    = {Roy, A. and Marcel, S.},
  title     = {Crossmodal Matching of Speakers Using Lip and Voice Features in Temporally Non-overlapping Audio and Video Streams},
  booktitle = ICPR10,
  year      = {2010},
  pages     = {4504--4507},
  bibsource = {http://www.visionbib.com/bibliography/people916.html#TT282171},
}

@inproceedings{bb287535,
  author    = {Cour, T. and Sapp, B. and Nagle, A. and Taskar, B.},
  title     = {Talking pictures: Temporal grouping and dialog-supervised person recognition},
  booktitle = CVPR10,
  year      = {2010},
  pages     = {1014--1021},
  bibsource = {http://www.visionbib.com/bibliography/people916.html#TT282172},
}

@inproceedings{bb287536,
  author    = {Wu, G. Y. and Zhu, J. and Xu, H. H.},
  title     = {A hybrid visual feature extraction method for audio-visual speech recognition},
  booktitle = ICIP09,
  year      = {2009},
  pages     = {1829--1832},
  bibsource = {http://www.visionbib.com/bibliography/people916.html#TT282173},
}

@inproceedings{bb287537,
  author    = {Ceballos, A. and Gomez, J. and Prieto, F. and Redarce, T.},
  title     = {Robot Command Interface Using an Audio-Visual Speech Recognition System},
  booktitle = CIARP09,
  year      = {2009},
  pages     = {869--876},
  bibsource = {http://www.visionbib.com/bibliography/people916.html#TT282174},
}

@inproceedings{bb287538,
  author    = {Cifani, S. and Abel, A. and Hussain, A. and Squartini, S. and Piazza, F.},
  title     = {An Investigation into Audiovisual Speech Correlation in Reverberant Noisy Environments},
  booktitle = COST08,
  year      = {2008},
  pages     = {331--343},
  bibsource = {http://www.visionbib.com/bibliography/people916.html#TT282175},
}

@inproceedings{bb287539,
  author    = {Lee, J. S. and Ebrahimi, T.},
  title     = {Two-Level Bimodal Association for Audio-Visual Speech Recognition},
  booktitle = ACIVS09,
  year      = {2009},
  pages     = {133--144},
  bibsource = {http://www.visionbib.com/bibliography/people916.html#TT282176},
}

@inproceedings{bb287540,
  author    = {Marchegiani, M. L. and Pirri, F. and Pizzoli, M.},
  title     = {Multimodal Speaker Recognition in a Conversation Scenario},
  booktitle = CVS09,
  year      = {2009},
  pages     = {11--20},
  bibsource = {http://www.visionbib.com/bibliography/people916.html#TT282177},
}

@inproceedings{bb287541,
  author    = {Karam, W. and Mokbel, C. and Greige, H. and Chollet, G.},
  title     = {Audio-Visual Identity Verification and Robustness to Imposture},
  booktitle = ICB09,
  year      = {2009},
  pages     = {796--805},
  bibsource = {http://www.visionbib.com/bibliography/people916.html#TT282178},
}

@inproceedings{bb287542,
  author    = {Rebillat, M. and Katz, B. F. G. and Corteel, E.},
  title     = {{SMART-I2}: Spatial Multi-user Audio-visual Real-time interactive interface, A broadcast application context},
  booktitle = {3DTV09},
  year      = {2009},
  pages     = {1--4},
  bibsource = {http://www.visionbib.com/bibliography/people916.html#TT282179},
}

% NOTE(review): the venue macro CSAIL presumably names a laboratory report
% series rather than a proceedings volume, so the entry is typed as a technical
% report -- confirm the macro's expansion and add the report number if known.
@techreport{bb287543,
  author      = {Eisenstein, J.},
  title       = {Gesture in Automatic Discourse Processing},
  institution = CSAIL,
  year        = {2008},
  bibsource   = {http://www.visionbib.com/bibliography/people916.html#TT282180},
}

% NOTE(review): same title, author, year and bibsource anchor as bb287543. The
% exported venue was the bare macro Ph.D., i.e. a doctoral thesis, so the entry
% is typed accordingly. School is presumed from the CSAIL affiliation of the
% sibling record -- TODO confirm.
@phdthesis{bb287544,
  author    = {Eisenstein, J.},
  title     = {Gesture in Automatic Discourse Processing},
  school    = {Massachusetts Institute of Technology},
  year      = {2008},
  bibsource = {http://www.visionbib.com/bibliography/people916.html#TT282180},
}

@inproceedings{bb287545,
  author    = {Das, A. and Manyam, O. K. and Tapaswi, M.},
  title     = {Audio-Visual Person Authentication with Multiple Visualized-Speech Features and Multiple Face Profiles},
  booktitle = ICCVGIP08,
  year      = {2008},
  pages     = {39--46},
  bibsource = {http://www.visionbib.com/bibliography/people916.html#TT282181},
}

@inproceedings{bb287546,
  author    = {Cao, Y. and Baang, S. and Liu, S. H. and Li, M. and Hu, S. Q.},
  title     = {Audio-visual event classification via spatial-temporal-audio words},
  booktitle = ICPR08,
  year      = {2008},
  pages     = {1--5},
  bibsource = {http://www.visionbib.com/bibliography/people916.html#TT282182},
}

@inproceedings{bb287547,
  author    = {Terry, L. H. and Shiell, D. J. and Katsaggelos, A. K.},
  title     = {Feature space video stream consistency estimation for dynamic stream weighting in audio-visual speech recognition},
  booktitle = ICIP08,
  year      = {2008},
  pages     = {1316--1319},
  bibsource = {http://www.visionbib.com/bibliography/people916.html#TT282183},
}

@inproceedings{bb287548,
  author    = {Naseem, I. and Mian, A. S.},
  title     = {User Verification by Combining Speech and Face Biometrics in Video},
  booktitle = ISVC08,
  year      = {2008},
  pages     = {II: 482--492},
  bibsource = {http://www.visionbib.com/bibliography/people916.html#TT282184},
}

@inproceedings{bb287549,
  author    = {Ettinger, E. and Freund, Y.},
  title     = {Coordinate-free calibration of an acoustically driven camera pointing system},
  booktitle = ICDSC08,
  year      = {2008},
  pages     = {1--9},
  bibsource = {http://www.visionbib.com/bibliography/people916.html#TT282185},
}

% NOTE(review): the exported pages value was the placeholder "xx-yy", which
% would print literally; the field is omitted until real page numbers are known.
@inproceedings{bb287550,
  author    = {Hung, H. and Friedland, G.},
  title     = {Towards Audio-Visual On-line Diarization Of Participants In Group Meetings},
  booktitle = M2SFA208,
  year      = {2008},
  bibsource = {http://www.visionbib.com/bibliography/people916.html#TT282186},
}

% NOTE(review): the exported pages value was the placeholder "xx-yy", which
% would print literally; the field is omitted until real page numbers are known.
@inproceedings{bb287551,
  author    = {Liu, Y. Y. and Sato, Y.},
  title     = {Finding Speaker Face Region by Audiovisual Correlation},
  booktitle = M2SFA208,
  year      = {2008},
  bibsource = {http://www.visionbib.com/bibliography/people916.html#TT282187},
}

% NOTE(review): the exported pages value was the placeholder "xx-yy", which
% would print literally; the field is omitted until real page numbers are known.
@inproceedings{bb287552,
  author    = {Pachoud, S. and Gong, S. and Cavallaro, A.},
  title     = {Video Augmentation for Improving Audio Speech Recognition under Noise},
  booktitle = BMVC08,
  year      = {2008},
  bibsource = {http://www.visionbib.com/bibliography/people916.html#TT282188},
}

@inproceedings{bb287553,
  author    = {Horii, Y. and Kawashima, H. and Matsuyama, T.},
  title     = {Speaker detection using the timing structure of lip motion and sound},
  booktitle = CVPR4HB08,
  year      = {2008},
  pages     = {1--8},
  bibsource = {http://www.visionbib.com/bibliography/people916.html#TT282189},
}

% NOTE(review): the exported pages value was the placeholder "xx-yy", which
% would print literally; the field is omitted until real page numbers are known.
@inproceedings{bb287554,
  author    = {Rua, E. A. and Castro, J. L. A. and Mateo, C. G.},
  title     = {Quality-Based Score Normalization for Audiovisual Person Authentication},
  booktitle = ICIAR08,
  year      = {2008},
  bibsource = {http://www.visionbib.com/bibliography/people916.html#TT282190},
}

@inproceedings{bb287555,
  author    = {Wang, L. and Tjondrongoro, D. and Liu, Y.},
  title     = {Clustering and Visualizing Audio-Visual Dataset on Mobile Devices in a Topic-Oriented Manner},
  booktitle = Visual07,
  year      = {2007},
  pages     = {310--321},
  bibsource = {http://www.visionbib.com/bibliography/people916.html#TT282191},
}

@inproceedings{bb287556,
  author    = {Zajdel, W. and Krijnders, J. D. and Andringa, T. and Gavrila, D. M.},
  title     = {{CASSANDRA}: audio-video sensor fusion for aggression detection},
  booktitle = AVSBS07,
  year      = {2007},
  pages     = {200--205},
  bibsource = {http://www.visionbib.com/bibliography/people916.html#TT282192},
}

@inproceedings{bb287557,
  author    = {Stodle, D. and Bjorndalen, J. M. and Anshus, O. J.},
  title     = {A System for Hybrid Vision- and Sound-Based Interaction with Distal and Proximal Targets on Wall-Sized, High-Resolution Tiled Displays},
  booktitle = CVHCI07,
  year      = {2007},
  pages     = {59--68},
  bibsource = {http://www.visionbib.com/bibliography/people916.html#TT282193},
}

@inproceedings{bb287558,
  author    = {van Hengel, P. W. J. and Andringa, T. C.},
  title     = {Verbal aggression detection in complex social environments},
  booktitle = AVSBS07,
  year      = {2007},
  pages     = {15--20},
  bibsource = {http://www.visionbib.com/bibliography/people916.html#TT282194},
}

@inproceedings{bb287559,
  author    = {Ikeda, O.},
  title     = {Detection of a Speaker in Video by Combined Analysis of Speech Sound and Mouth Movement},
  booktitle = ISVC07,
  year      = {2007},
  pages     = {II: 602--610},
  bibsource = {http://www.visionbib.com/bibliography/people916.html#TT282195},
}

@inproceedings{bb287560,
  author    = {Das, A.},
  title     = {Audio Visual Person Authentication by Multiple Nearest Neighbor Classifiers},
  booktitle = ICB07,
  year      = {2007},
  pages     = {1114--1123},
  bibsource = {http://www.visionbib.com/bibliography/people916.html#TT282196},
}

@inproceedings{bb287561,
  author    = {Xin, L. and Tao, J. H. and Tan, T. N.},
  title     = {Dynamic Audio-Visual Mapping using Fused Hidden {Markov} Model Inversion Method},
  booktitle = ICIP07,
  year      = {2007},
  pages     = {III: 293--296},
  bibsource = {http://www.visionbib.com/bibliography/people916.html#TT282197},
}

@inproceedings{bb287562,
  author    = {Barzelay, Z. and Schechner, Y. Y.},
  title     = {Harmony in Motion},
  booktitle = CVPR07,
  year      = {2007},
  pages     = {1--8},
  bibsource = {http://www.visionbib.com/bibliography/people916.html#TT282198},
}

@inproceedings{bb287563,
  author    = {O'Donovan, A. and Duraiswami, R. and Neumann, J.},
  title     = {Microphone Arrays as Generalized Cameras for Integrated Audio Visual Processing},
  booktitle = CVPR07,
  year      = {2007},
  pages     = {1--8},
  bibsource = {http://www.visionbib.com/bibliography/people916.html#TT282199},
}

@inproceedings{bb287564,
  author    = {Abbas, J. and Dagli, C. K. and Huang, T. S.},
  title     = {A Multimodality Framework for Creating Speaker/Non-Speaker Profile Databases for Real-World Video},
  booktitle = SLAM07,
  year      = {2007},
  pages     = {1--8},
  bibsource = {http://www.visionbib.com/bibliography/people916.html#TT282200},
}

@inproceedings{bb287565,
  author    = {Monaci, G. and Vandergheynst, P.},
  title     = {Audiovisual Gestalts},
  booktitle = PercOrg06,
  year      = {2006},
  pages     = {200},
  bibsource = {http://www.visionbib.com/bibliography/people916.html#TT282201},
}

@inproceedings{bb287566,
  author    = {Zhu, Z. G. and Li, W. H. and Molina, E. and Wolberg, G.},
  title     = {{LDV} Sensing and Processing for Remote Hearing in a Multimodal Surveillance System},
  booktitle = MSCSAS07,
  year      = {2007},
  pages     = {1--2},
  bibsource = {http://www.visionbib.com/bibliography/people916.html#TT282202},
}

% NOTE(review): the page range starts and ends on page 10 as exported; confirm
% whether this is a one-page abstract or a truncated range.
@inproceedings{bb287567,
  author    = {Zhu, Z. G. and Li, W. H. and Wolberg, G.},
  title     = {Integrating {LDV} Audio and {IR} Video for Remote Multimodal Surveillance},
  booktitle = OTCBVS05,
  year      = {2005},
  pages     = {III: 10--10},
  bibsource = {http://www.visionbib.com/bibliography/people916.html#TT282203},
}

@inproceedings{bb287568,
  author    = {Wu, Z. Y. and Cai, L. H. and Meng, H.},
  title     = {Multi-level Fusion of Audio and Visual Features for Speaker Identification},
  booktitle = ICB06,
  year      = {2006},
  pages     = {493--499},
  bibsource = {http://www.visionbib.com/bibliography/people916.html#TT282204},
}

@inproceedings{bb287569,
  author    = {Yang, P. and Yang, Y. C. and Wu, Z. H.},
  title     = {Exploiting Glottal Information in Speaker Recognition Using Parallel {GMMs}},
  booktitle = AVBPA05,
  year      = {2005},
  pages     = {804},
  bibsource = {http://www.visionbib.com/bibliography/people916.html#TT282205},
}

@inproceedings{bb287570,
  author    = {Lei, Z. C.},
  title     = {Combining the Likelihood and the {Kullback-Leibler} Distance in Estimating the Universal Background Model for Speaker Verification Using {SVM}},
  booktitle = ICPR10,
  year      = {2010},
  pages     = {4553--4556},
  bibsource = {http://www.visionbib.com/bibliography/people916.html#TT282206},
}

@inproceedings{bb287571,
  author    = {Lei, Z. C. and Yang, Y. C. and Wu, Z. H.},
  title     = {An {UBM}-Based Reference Space for Speaker Recognition},
  booktitle = ICPR06,
  year      = {2006},
  pages     = {IV: 318--321},
  bibsource = {http://www.visionbib.com/bibliography/people916.html#TT282207},
}

@inproceedings{bb287572,
  author    = {Lei, Z. C. and Yang, Y. C. and Wu, Z. H.},
  title     = {Constructing the Discriminative Kernels Using {GMM} for Text-Independent Speaker Identification},
  booktitle = IWBRS05,
  year      = {2005},
  pages     = {165},
  bibsource = {http://www.visionbib.com/bibliography/people916.html#TT282208},
}

@inproceedings{bb287573,
  author    = {Lei, Z. C. and Yang, Y. C. and Wu, Z. H.},
  title     = {Speaker Identification Using the {VQ}-Based Discriminative Kernels},
  booktitle = AVBPA05,
  year      = {2005},
  pages     = {797},
  bibsource = {http://www.visionbib.com/bibliography/people916.html#TT282209},
}

@inproceedings{bb287574,
  author    = {Li, D. D. and Yang, Y. C. and Wu, Z. H.},
  title     = {Dynamic {Bayesian} Networks for Audio-Visual Speaker Recognition},
  booktitle = ICB06,
  year      = {2006},
  pages     = {539--545},
  bibsource = {http://www.visionbib.com/bibliography/people916.html#TT282210},
}

@inproceedings{bb287575,
  author    = {Fox, N. A. and O'Mullane, B. A. and Reilly, R. B.},
  title     = {{VALID}: A New Practical Audio-Visual Database, and Comparative Results},
  booktitle = AVBPA05,
  year      = {2005},
  pages     = {777},
  bibsource = {http://www.visionbib.com/bibliography/people916.html#TT282211},
}

% NOTE(review): publisher is the literal word "Online", which suggests a web
% resource rather than a printed book -- consider retyping once a URL is known.
@book{bb287576,
  author    = {Sharma, P. and Reilly, R. B.},
  title     = {The {UCD} Colour Face Image Database for Face Detection},
  publisher = {Online},
  year      = {1998},
  bibsource = {http://www.visionbib.com/bibliography/people916.html#TT282212},
}

@inproceedings{bb287577,
  author    = {Fox, N. A. and O'Mullane, B. A. and Reilly, R. B.},
  title     = {Audio-Visual Speaker Identification via Adaptive Fusion Using Reliability Estimates of Both Modalities},
  booktitle = AVBPA05,
  year      = {2005},
  pages     = {787},
  bibsource = {http://www.visionbib.com/bibliography/people916.html#TT282213},
}

@inproceedings{bb287578,
  author    = {Zhang, D. and Ghobakhlou, A. and Kasabov, N.},
  title     = {An adaptive model of person identification combining speech and image information},
  booktitle = ICARCV04,
  year      = {2004},
  pages     = {I: 413--418},
  bibsource = {http://www.visionbib.com/bibliography/people916.html#TT282214},
}

@inproceedings{bb287579,
  author    = {Kratt, J. and Metze, F. and Stiefelhagen, R. and Waibel, A.},
  title     = {Large Vocabulary Audio-Visual Speech Recognition Using the {Janus} Speech Recognition Toolkit},
  booktitle = DAGM04,
  year      = {2004},
  pages     = {488--495},
  bibsource = {http://www.visionbib.com/bibliography/people916.html#TT282215},
}

@inproceedings{bb287580,
  author    = {Hanafiah, Z. M. and Yamazaki, C. and Nakamura, A. and Kuno, Y.},
  title     = {Understanding inexplicit utterances using vision for helper robots},
  booktitle = ICPR04,
  year      = {2004},
  pages     = {IV: 925--928},
  bibsource = {http://www.visionbib.com/bibliography/people916.html#TT282216},
}

@inproceedings{bb287581,
  author    = {Hermann, T. and Henning, T. and Ritter, H.},
  title     = {Gesture Desk an Integrated Multi-modal Gestural Workplace for Sonification},
  booktitle = GW03,
  year      = {2003},
  pages     = {369--379},
  bibsource = {http://www.visionbib.com/bibliography/people916.html#TT282217},
}

@inproceedings{bb287582,
  author    = {Merola, G.},
  title     = {The Effects of the Gesture Viewpoint on the Students' Memory of Words and Stories},
  booktitle = GW07,
  year      = {2007},
  pages     = {272--281},
  bibsource = {http://www.visionbib.com/bibliography/people916.html#TT282218},
}

@inproceedings{bb287583,
  author    = {Merola, G. and Poggi, I.},
  title     = {Multimodality and Gestures in the Teacher's Communication},
  booktitle = GW03,
  year      = {2003},
  pages     = {101--111},
  bibsource = {http://www.visionbib.com/bibliography/people916.html#TT282219},
}

@inproceedings{bb287584,
  author    = {Kranstedt, A. and Kuhnlein, P. and Wachsmuth, I.},
  title     = {Deixis in Multimodal Human Computer Interaction: An Interdisciplinary Approach},
  booktitle = GW03,
  year      = {2003},
  pages     = {112--123},
  bibsource = {http://www.visionbib.com/bibliography/people916.html#TT282220},
}

@inproceedings{bb287585,
  author    = {Saeed, K. and Kozlowski, M.},
  title     = {An Image-Based System for Spoken-Letter Recognition},
  booktitle = CAIP03,
  year      = {2003},
  pages     = {494--502},
  bibsource = {http://www.visionbib.com/bibliography/people916.html#TT282221},
}

@inproceedings{bb287586,
  author    = {Ho, P. and Armington, J.},
  title     = {A Dual-Factor Authentication System Featuring Speaker Verification and Token Technology},
  booktitle = AVBPA03,
  year      = {2003},
  pages     = {128--136},
  bibsource = {http://www.visionbib.com/bibliography/people916.html#TT282222},
}

@inproceedings{bb287587,
  author    = {Fox, N. A. and Reilly, R. B.},
  title     = {Audio-Visual Speaker Identification Based on the Use of Dynamic Audio and Visual Features},
  booktitle = AVBPA03,
  year      = {2003},
  pages     = {743--751},
  bibsource = {http://www.visionbib.com/bibliography/people916.html#TT282223},
}

@inproceedings{bb287588,
  author    = {Czyz, J. and Bengio, S. and Marcel, C. and Vandendorpe, L.},
  title     = {Scalability Analysis of Audio-Visual Person Identity Verification},
  booktitle = AVBPA03,
  year      = {2003},
  pages     = {752--760},
  bibsource = {http://www.visionbib.com/bibliography/people916.html#TT282224},
}

@inproceedings{bb287589,
  author    = {Bengio, S.},
  title     = {Multimodal Authentication Using Asynchronous {HMMs}},
  booktitle = AVBPA03,
  year      = {2003},
  pages     = {770--777},
  bibsource = {http://www.visionbib.com/bibliography/people916.html#TT282225},
}

@inproceedings{bb287590,
  author    = {Lucey, S. and Chen, T. H.},
  title     = {Improved Audio-Visual Speaker Recognition via the Use of a Hybrid Combination Strategy},
  booktitle = AVBPA03,
  year      = {2003},
  pages     = {929--936},
  bibsource = {http://www.visionbib.com/bibliography/people916.html#TT282226},
}

% NOTE(review): third author was exported as "Kettebeko, S."; spelled here as
% "Kettebekov, S." to match the same co-author of Sharma in bb287592 -- confirm.
@inproceedings{bb287591,
  author    = {Krahnstoever, N. and Schapira, E. and Kettebekov, S. and Sharma, R.},
  title     = {Multimodal human-computer interaction for crisis management systems},
  booktitle = WACV02,
  year      = {2002},
  pages     = {203--207},
  bibsource = {http://www.visionbib.com/bibliography/people916.html#TT282227},
}

@inproceedings{bb287592,
  author    = {Kettebekov, S. and Yeasin, M. and Sharma, R.},
  title     = {Improving continuous gesture recognition with spoken prosody},
  booktitle = CVPR03,
  year      = {2003},
  pages     = {I: 565--570},
  bibsource = {http://www.visionbib.com/bibliography/people916.html#TT282228},
}

@inproceedings{bb287593,
  author    = {Poh, N. and Korczak, J.},
  title     = {Hybrid Biometric Person Authentication Using Face and Voice Features},
  booktitle = AVBPA01,
  year      = {2001},
  pages     = {348},
  bibsource = {http://www.visionbib.com/bibliography/people916.html#TT282229},
}

@inproceedings{bb287594,
  author    = {Nakamura, S.},
  title     = {Fusion of Audio-Visual Information for Integrated Speech Processing},
  booktitle = AVBPA01,
  year      = {2001},
  pages     = {127},
  bibsource = {http://www.visionbib.com/bibliography/people916.html#TT282230},
}

@inproceedings{bb287595,
  author    = {Sullivan, K. P. H. and Pelecanos, J.},
  title     = {Revisiting {Carl Bildt's} Impostor: Would a Speaker Verification System Foil Him?},
  booktitle = AVBPA01,
  year      = {2001},
  pages     = {144},
  bibsource = {http://www.visionbib.com/bibliography/people916.html#TT282231},
}

% NOTE(review): the exported venue was the literal string "MIT AIM", read here
% as an MIT AI Memo (a report series, not a proceedings volume). Institution
% and type are presumed from that abbreviation -- confirm and add the memo
% number if known.
@techreport{bb287596,
  author      = {Geiger, G. and Ezzat, T. and Poggio, T.},
  title       = {Perceptual Evaluation of Video-Realistic Speech},
  institution = {Massachusetts Institute of Technology},
  type        = {{AI} Memo},
  year        = {2003},
  bibsource   = {http://www.visionbib.com/bibliography/people916.html#TT282232},
}

% NOTE(review): the second author's surname "Merserratt" looks like a possible
% misspelling (perhaps "Mersereau"); kept as exported -- verify against the
% published paper.
@inproceedings{bb287597,
  author    = {Zhang, X. Z. and Merserratt, R. M. and Clements, M.},
  title     = {Bimodal fusion in audio-visual speech recognition},
  booktitle = ICIP02,
  year      = {2002},
  pages     = {I: 964--967},
  bibsource = {http://www.visionbib.com/bibliography/people916.html#TT282233},
}

@inproceedings{bb287598,
  author    = {Graf, H. P. and Cosatto, E. and Strom, V. and Huang, F. J.},
  title     = {Visual prosody: facial movements accompanying speech},
  booktitle = AFGR02,
  year      = {2002},
  pages     = {381--386},
  bibsource = {http://www.visionbib.com/bibliography/people916.html#TT282234},
}

% NOTE(review): the venue macro UMD presumably names a university rather than a
% proceedings volume, so this may be a thesis or report -- confirm the kind of
% document before retyping the entry.
@inproceedings{bb287599,
  author    = {Qi, Y.},
  title     = {Learning Algorithms for Audio and Video Processing: Independent Component Analysis and Support Vector Machine Based Approaches},
  booktitle = UMD,
  year      = {2000},
  bibsource = {http://www.visionbib.com/bibliography/people916.html#TT282235},
}

Last update: Jan 16, 2026 at 20:03:35