@inproceedings{bb109400,
  author    = {Liang, B. and Pan, Y. and Guo, Z.Z. and Zhou, H. and Hong, Z.B. and Han, X.G. and Han, J.Y. and Liu, J.T. and Ding, E. and Wang, J.D.},
  title     = {Expressive Talking Head Generation with Granular Audio-Visual Control},
  booktitle = CVPR22,
  year      = {2022},
  pages     = {3377-3386},
  bibsource = {http://www.visionbib.com/bibliography/describe499.html#TT106074},
}

% Title: camelCase name and acronym braced so sentence-casing styles keep their capitals.
@inproceedings{bb109401,
        AUTHOR = "Fan, Y.R. and Lin, Z.J. and Saito, J. and Wang, W.P. and Komura, T.",
        TITLE = "{FaceFormer}: Speech-Driven {3D} Facial Animation with Transformers",
        BOOKTITLE = CVPR22,
        YEAR = "2022",
        PAGES = "18749-18758",
        BIBSOURCE = "http://www.visionbib.com/bibliography/describe499.html#TT106075"}

@inproceedings{bb109402,
  author    = {Liu, X. and Wu, Q.Y. and Zhou, H. and Xu, Y.H. and Qian, R. and Lin, X.Y. and Zhou, X.W. and Wu, W. and Dai, B. and Zhou, B.},
  title     = {Learning Hierarchical Cross-Modal Association for Co-Speech Gesture Generation},
  booktitle = CVPR22,
  year      = {2022},
  pages     = {10452-10462},
  bibsource = {http://www.visionbib.com/bibliography/describe499.html#TT106076},
}

@inproceedings{bb109403,
  author    = {Medina, S. and Tome, D. and Stoll, C. and Tiede, M. and Munhall, K. and Hauptmann, A. and Matthews, I.},
  title     = {Speech Driven Tongue Animation},
  booktitle = CVPR22,
  year      = {2022},
  pages     = {20374-20384},
  bibsource = {http://www.visionbib.com/bibliography/describe499.html#TT106077},
}

% Title: acronym braced so sentence-casing styles keep its capitals.
@inproceedings{bb109404,
        AUTHOR = "Song, H.K. and Woo, S.H. and Lee, J. and Yang, S.M. and Cho, H. and Lee, Y. and Choi, D. and Kim, K.W.",
        TITLE = "Talking Face Generation with Multilingual {TTS}",
        BOOKTITLE = CVPR22,
        YEAR = "2022",
        PAGES = "21393-21398",
        BIBSOURCE = "http://www.visionbib.com/bibliography/describe499.html#TT106078"}

% Title: camelCase name and acronym braced so sentence-casing styles keep their capitals.
@inproceedings{bb109405,
        AUTHOR = "Richard, A. and Zollhofer, M. and Wen, Y.D. and de la Torre, F. and Sheikh, Y.",
        TITLE = "{MeshTalk}: {3D} Face Animation from Speech using Cross-Modality
Disentanglement",
        BOOKTITLE = ICCV21,
        YEAR = "2021",
        PAGES = "1153-1162",
        BIBSOURCE = "http://www.visionbib.com/bibliography/describe499.html#TT106079"}

% Title: all-caps method name braced so sentence-casing styles do not turn it into "Facial".
@inproceedings{bb109406,
        AUTHOR = "Zhang, C.X. and Zhao, Y.F. and Huang, Y.F. and Zeng, M. and Ni, S.F. and Budagavi, M. and Guo, X.H.",
        TITLE = "{FACIAL}: Synthesizing Dynamic Talking Face with Implicit Attribute
Learning",
        BOOKTITLE = ICCV21,
        YEAR = "2021",
        PAGES = "3847-3856",
        BIBSOURCE = "http://www.visionbib.com/bibliography/describe499.html#TT106080"}

% Title: method name braced so sentence-casing styles keep its mixed capitals.
@inproceedings{bb109407,
        AUTHOR = "Guo, Y.D. and Chen, K.Y. and Liang, S. and Liu, Y.J. and Bao, H.J. and Zhang, J.Y.",
        TITLE = "{AD-NeRF}: Audio Driven Neural Radiance Fields for Talking Head
Synthesis",
        BOOKTITLE = ICCV21,
        YEAR = "2021",
        PAGES = "5764-5774",
        BIBSOURCE = "http://www.visionbib.com/bibliography/describe499.html#TT106081"}

@inproceedings{bb109408,
  author    = {Meshry, M. and Suri, S. and Davis, L.S. and Shrivastava, A.},
  title     = {Learned Spatial Representations for Few-shot Talking-Head Synthesis},
  booktitle = ICCV21,
  year      = {2021},
  pages     = {13809-13818},
  bibsource = {http://www.visionbib.com/bibliography/describe499.html#TT106082},
}

% Title: acronym braced so sentence-casing styles do not turn it into "Safa".
@inproceedings{bb109409,
        AUTHOR = "Wang, Q.L. and Zhang, L. and Li, B.",
        TITLE = "{SAFA}: Structure Aware Face Animation",
        BOOKTITLE = "3DV21",
        YEAR = "2021",
        PAGES = "679-688",
        BIBSOURCE = "http://www.visionbib.com/bibliography/describe499.html#TT106083"}

@inproceedings{bb109410,
  author    = {Zhou, H. and Sun, Y.S. and Wu, W. and Loy, C.C. and Wang, X.G. and Liu, Z.W.},
  title     = {Pose-Controllable Talking Face Generation by Implicitly Modularized Audio-Visual Representation},
  booktitle = CVPR21,
  year      = {2021},
  pages     = {4174-4184},
  bibsource = {http://www.visionbib.com/bibliography/describe499.html#TT106084},
}

@inproceedings{bb109411,
  author    = {Ye, S.Q. and Han, C. and Lin, J.Y. and Han, G.Q. and He, S.F.},
  title     = {Coherence and Identity Learning for Arbitrary-length Face Video Generation},
  booktitle = ICPR21,
  year      = {2021},
  pages     = {915-922},
  bibsource = {http://www.visionbib.com/bibliography/describe499.html#TT106085},
}

@inproceedings{bb109412,
  author    = {Liang, H. and Yu, L. and Xu, G. and Raj, B. and Singh, R.},
  title     = {Controlled Autoencoders to Generate Faces from Voices},
  booktitle = ISVC20,
  year      = {2020},
  pages     = {I:476-487},
  bibsource = {http://www.visionbib.com/bibliography/describe499.html#TT106086},
}

% Title: "Speech2video"/"3d" were mis-cased by upstream title-casing; restored and braced
% so sentence-casing styles keep the capitals. NOTE(review): confirm against the published title.
@inproceedings{bb109413,
        AUTHOR = "Liao, M. and Zhang, S. and Wang, P. and Zhu, H. and Zuo, X. and Yang, R.G.",
        TITLE = "{Speech2Video} Synthesis with {3D} Skeleton Regularization and Expressive
Body Poses",
        BOOKTITLE = ACCV20,
        YEAR = "2020",
        PAGES = "V:308-323",
        BIBSOURCE = "http://www.visionbib.com/bibliography/describe499.html#TT106087"}

@inproceedings{bb109414,
  author    = {Xue, H. and Ling, J. and Song, L. and Xie, R. and Zhang, W.},
  title     = {Realistic Talking Face Synthesis With Geometry-Aware Feature Transformation},
  booktitle = ICIP20,
  year      = {2020},
  pages     = {1581-1585},
  bibsource = {http://www.visionbib.com/bibliography/describe499.html#TT106088},
}

@inproceedings{bb109415,
  author    = {Chen, L. and Cui, G.F. and Liu, C.L. and Li, Z. and Kou, Z. and Xu, Y. and Xu, C.L.},
  title     = {Talking-head Generation with Rhythmic Head Motion},
  booktitle = ECCV20,
  year      = {2020},
  pages     = {IX:35-51},
  bibsource = {http://www.visionbib.com/bibliography/describe499.html#TT106089},
}

@inproceedings{bb109416,
  author    = {Khakhulin, T. and Sklyarova, V. and Lempitsky, V. and Zakharov, E.},
  title     = {Realistic One-Shot Mesh-Based Head Avatars},
  booktitle = ECCV22,
  year      = {2022},
  pages     = {II:345-362},
  bibsource = {http://www.visionbib.com/bibliography/describe499.html#TT106090},
}

@inproceedings{bb109417,
  author    = {Zakharov, E. and Ivakhnenko, A. and Shysheya, A. and Lempitsky, V.},
  title     = {Fast Bi-layer Neural Synthesis of One-shot Realistic Head Avatars},
  booktitle = ECCV20,
  year      = {2020},
  pages     = {XII: 524-540},
  bibsource = {http://www.visionbib.com/bibliography/describe499.html#TT106091},
}

@inproceedings{bb109418,
  author    = {Chu, H. and Ma, S.G. and de la Torre, F. and Fidler, S. and Sheikh, Y.},
  title     = {Expressive Telepresence via Modular Codec Avatars},
  booktitle = ECCV20,
  year      = {2020},
  pages     = {XII: 330-345},
  bibsource = {http://www.visionbib.com/bibliography/describe499.html#TT106092},
}

% Author: the raw non-ASCII sharp s is written as the LaTeX escape {\ss} so classic 8-bit
% BibTeX sorts and typesets the name correctly; the rest of this file is pure ASCII.
@inproceedings{bb109419,
        AUTHOR = "Thies, J. and Elgharib, M. and Tewari, A. and Theobalt, C. and Nie{\ss}ner, M.",
        TITLE = "Neural Voice Puppetry: Audio-driven Facial Reenactment",
        BOOKTITLE = ECCV20,
        YEAR = "2020",
        PAGES = "XVI: 716-731",
        BIBSOURCE = "http://www.visionbib.com/bibliography/describe499.html#TT106093"}

@inproceedings{bb109420,
  author    = {Pang, W. and Wang, X.J.},
  title     = {Guessing State Tracking for Visual Dialogue},
  booktitle = ECCV20,
  year      = {2020},
  pages     = {XVI: 683-698},
  bibsource = {http://www.visionbib.com/bibliography/describe499.html#TT106094},
}

% Title: "Gans" was mis-cased by upstream title-casing; restored to the acronym and braced
% so sentence-casing styles keep it. NOTE(review): confirm against the published title.
@inproceedings{bb109421,
        AUTHOR = "Das, D. and Biswas, S. and Sinha, S. and Bhowmick, B.",
        TITLE = "Speech-driven Facial Animation Using Cascaded {GANs} for Learning of
Motion and Texture",
        BOOKTITLE = ECCV20,
        YEAR = "2020",
        PAGES = "XXX: 408-424",
        BIBSOURCE = "http://www.visionbib.com/bibliography/describe499.html#TT106095"}

@inproceedings{bb109422,
  author    = {Shalev, Y. and Wolf, L.B.},
  title     = {Image Animation with Perturbed Masks},
  booktitle = CVPR22,
  year      = {2022},
  pages     = {3637-3646},
  bibsource = {http://www.visionbib.com/bibliography/describe499.html#TT106096},
}

@inproceedings{bb109423,
  author    = {Mittal, G. and Wang, B.},
  title     = {Animating Face using Disentangled Audio Representations},
  booktitle = WACV20,
  year      = {2020},
  pages     = {3279-3287},
  bibsource = {http://www.visionbib.com/bibliography/describe499.html#TT106097},
}

@inproceedings{bb109424,
  author    = {Chen, Z. and Liu, Z. and Hu, H. and Bai, J. and Lian, S. and Shi, F. and Wang, K.},
  title     = {A Realistic Face-to-Face Conversation System Based on Deep Neural Networks},
  booktitle = ACVR19,
  year      = {2019},
  pages     = {2575-2583},
  bibsource = {http://www.visionbib.com/bibliography/describe499.html#TT106098},
}

@inproceedings{bb109425,
  author    = {Zakharov, E. and Shysheya, A. and Burkov, E. and Lempitsky, V.},
  title     = {Few-Shot Adversarial Learning of Realistic Neural Talking Head Models},
  booktitle = ICCV19,
  year      = {2019},
  pages     = {9458-9467},
  bibsource = {http://www.visionbib.com/bibliography/describe499.html#TT106099},
}

% Title: "3D" braced so sentence-casing styles do not render it as "3d".
@inproceedings{bb109426,
        AUTHOR = "Cudeiro, D. and Bolkart, T. and Laidlaw, C. and Ranjan, A. and Black, M.J.",
        TITLE = "Capture, Learning, and Synthesis of {3D} Speaking Styles",
        BOOKTITLE = CVPR19,
        YEAR = "2019",
        PAGES = "10093-10103",
        BIBSOURCE = "http://www.visionbib.com/bibliography/describe499.html#TT106100"}

@inproceedings{bb109427,
  author    = {Chen, L. and Maddox, R.K. and Duan, Z.Y. and Xu, C.L.},
  title     = {Hierarchical Cross-Modal Talking Face Generation With Dynamic Pixel-Wise Loss},
  booktitle = CVPR19,
  year      = {2019},
  pages     = {7824-7833},
  bibsource = {http://www.visionbib.com/bibliography/describe499.html#TT106101},
}

@inproceedings{bb109428,
  author    = {Chu, H. and Li, D.Q. and Fidler, S.},
  title     = {A Face-to-Face Neural Conversation Model},
  booktitle = CVPR18,
  year      = {2018},
  pages     = {7113-7121},
  bibsource = {http://www.visionbib.com/bibliography/describe499.html#TT106102},
}

@inproceedings{bb109429,
  author    = {Afouras, T. and Asano, Y.M. and Fagan, F. and Vedaldi, A. and Metze, F.},
  title     = {Self-supervised object detection from audio-visual correspondence},
  booktitle = CVPR22,
  year      = {2022},
  pages     = {10565-10576},
  bibsource = {http://www.visionbib.com/bibliography/describe499.html#TT106103},
}

@inproceedings{bb109430,
  author    = {Feng, C. and Chen, Z.Y. and Owens, A.},
  title     = {Self-Supervised Video Forensics by Audio-Visual Anomaly Detection},
  booktitle = CVPR23,
  year      = {2023},
  pages     = {10491-10503},
  bibsource = {http://www.visionbib.com/bibliography/describe499.html#TT106104},
}

@inproceedings{bb109431,
  author    = {Afouras, T. and Owens, A. and Chung, J.S. and Zisserman, A.},
  title     = {Self-supervised Learning of Audio-visual Objects from Video},
  booktitle = ECCV20,
  year      = {2020},
  pages     = {XVIII:208-224},
  bibsource = {http://www.visionbib.com/bibliography/describe499.html#TT106105},
}

@inproceedings{bb109432,
  author    = {Wiles, O. and Koepke, A.S. and Zisserman, A.},
  title     = {Self-Supervised Learning of Class Embeddings from Video},
  booktitle = CEFRL19,
  year      = {2019},
  pages     = {3019-3027},
  bibsource = {http://www.visionbib.com/bibliography/describe499.html#TT106106},
}

% Title: system name braced so sentence-casing styles do not render it as "X2face".
@inproceedings{bb109433,
        AUTHOR = "Wiles, O. and Koepke, A.S. and Zisserman, A.",
        TITLE = "{X2Face}: A Network for Controlling Face Generation Using Images, Audio,
and Pose Codes",
        BOOKTITLE = ECCV18,
        YEAR = "2018",
        PAGES = "XIII: 690-706",
        BIBSOURCE = "http://www.visionbib.com/bibliography/describe499.html#TT106107"}

@inproceedings{bb109434,
  author    = {Modrzejewski, M. and Rokita, P.},
  title     = {Graphical Interface Design for Chatbots for the Needs of Artificial Intelligence Support in Web and Mobile Applications},
  booktitle = ICCVG18,
  year      = {2018},
  pages     = {48-56},
  bibsource = {http://www.visionbib.com/bibliography/describe499.html#TT106108},
}

@inproceedings{bb109435,
  author    = {Nakatani, S. and Saiki, S. and Nakamura, M. and Yasuda, K.},
  title     = {Generating Personalized Virtual Agent in Speech Dialogue System for People with Dementia},
  booktitle = DHM18,
  year      = {2018},
  pages     = {326-337},
  bibsource = {http://www.visionbib.com/bibliography/describe499.html#TT106109},
}

@inproceedings{bb109436,
  author    = {Huber, B. and McDuff, D.},
  title     = {Facial Expression Grounded Conversational Dialogue Generation},
  booktitle = FG18,
  year      = {2018},
  pages     = {365-372},
  bibsource = {http://www.visionbib.com/bibliography/describe499.html#TT106110},
}

% Title: acronyms braced so sentence-casing styles keep their capitals.
@inproceedings{bb109437,
        AUTHOR = "Luo, C. and Yu, J. and Li, X. and Zhang, L.",
        TITLE = "{HMM} based speech-driven {3D} tongue animation",
        BOOKTITLE = ICIP17,
        YEAR = "2017",
        PAGES = "4377-4381",
        BIBSOURCE = "http://www.visionbib.com/bibliography/describe499.html#TT106111"}

% Title: "HMMS"/"AAMS" were upper-cased upstream; restored to the plural acronyms and braced
% so sentence-casing styles keep them. NOTE(review): confirm against the published title.
@inproceedings{bb109438,
        AUTHOR = "Filntisis, P.P. and Katsamanis, A. and Maragos, P.",
        TITLE = "Photorealistic adaptation and interpolation of facial expressions
using {HMMs} and {AAMs} for audio-visual speech synthesis",
        BOOKTITLE = ICIP17,
        YEAR = "2017",
        PAGES = "2941-2945",
        BIBSOURCE = "http://www.visionbib.com/bibliography/describe499.html#TT106112"}

% Title: acronym braced so sentence-casing styles keep its capitals.
@inproceedings{bb109439,
        AUTHOR = "Filntisis, P.P. and Katsamanis, A. and Maragos, P.",
        TITLE = "Demonstration of an {HMM}-based photorealistic expressive audio-visual
speech synthesis system",
        BOOKTITLE = ICIP17,
        YEAR = "2017",
        PAGES = "4588-4588",
        BIBSOURCE = "http://www.visionbib.com/bibliography/describe499.html#TT106113"}

% Title: "3D" braced so sentence-casing styles do not render it as "3d".
@inproceedings{bb109440,
        AUTHOR = "Wang, Y.B. and Khoo, E.T.",
        TITLE = "Real-time stereoscopic rendering of realistic avatar for interactive
{3D} telepresence system",
        BOOKTITLE = ICIVC17,
        YEAR = "2017",
        PAGES = "577-581",
        BIBSOURCE = "http://www.visionbib.com/bibliography/describe499.html#TT106114"}

% Title: "3D" braced so sentence-casing styles do not render it as "3d".
@inproceedings{bb109441,
        AUTHOR = "Yu, J.",
        TITLE = "A Real-Time {3D} Visual Singing Synthesis:
From Appearance to Internal Articulators",
        BOOKTITLE = MMMod17,
        YEAR = "2017",
        PAGES = "I: 53-64",
        BIBSOURCE = "http://www.visionbib.com/bibliography/describe499.html#TT106115"}

@inproceedings{bb109442,
  author    = {Dawood, S. and Hicks, Y. and Marshall, D.},
  title     = {Speech-Driven Facial Animation Using Manifold Relevance Determination},
  booktitle = CVAVM16,
  year      = {2016},
  pages     = {II: 869-882},
  bibsource = {http://www.visionbib.com/bibliography/describe499.html#TT106116},
}

% Title: camelCase system name braced so sentence-casing styles do not render it as "Facedirector".
@inproceedings{bb109443,
        AUTHOR = "Malleson, C. and Bazin, J.C. and Wang, O. and Bradley, D. and Beeler, T. and Hilton, A. and Sorkine Hornung, A.",
        TITLE = "{FaceDirector}: Continuous Control of Facial Performance in Video",
        BOOKTITLE = ICCV15,
        YEAR = "2015",
        PAGES = "3979-3987",
        BIBSOURCE = "http://www.visionbib.com/bibliography/describe499.html#TT106117"}

% Title: "3D" braced so sentence-casing styles do not render it as "3d".
@inproceedings{bb109444,
        AUTHOR = "Musti, U. and Zhou, Z.H. and Pietikainen, M.",
        TITLE = "Facial {3D} Shape Estimation from Images for Visual Speech Animation",
        BOOKTITLE = ICPR14,
        YEAR = "2014",
        PAGES = "40-45",
        BIBSOURCE = "http://www.visionbib.com/bibliography/describe499.html#TT106118"}

% Title: acronym and language names braced so sentence-casing styles keep their capitals
% (spelling of "Mandarine" is kept exactly as recorded in the source).
@inproceedings{bb109445,
        AUTHOR = "Yu, J. and Li, A.",
        TITLE = "{3D} visual pronunciation of {Mandarine} {Chinese} for language learning",
        BOOKTITLE = ICIP14,
        YEAR = "2014",
        PAGES = "2036-2040",
        BIBSOURCE = "http://www.visionbib.com/bibliography/describe499.html#TT106119"}

@inproceedings{bb109446,
  author    = {Anderson, R. and Stenger, B. and Wan, V. and Cipolla, R.},
  title     = {Expressive Visual Text-to-Speech Using Active Appearance Models},
  booktitle = CVPR13,
  year      = {2013},
  pages     = {3382-3389},
  bibsource = {http://www.visionbib.com/bibliography/describe499.html#TT106120},
}

@inproceedings{bb109447,
  author    = {Manresa Yee, C. and Ponsa, P. and Arellano, D. and Larrea, M.},
  title     = {An Avatar Acceptance Study for Home Automation Scenarios},
  booktitle = AMDO12,
  year      = {2012},
  pages     = {230-238},
  bibsource = {http://www.visionbib.com/bibliography/describe499.html#TT106121},
}

% Title: acronym braced so sentence-casing styles do not render it as "3dtv".
@inproceedings{bb109448,
        AUTHOR = "Tang, Y.Q. and Fang, Y. and Huang, Q.H.",
        TITLE = "Audio personalization using head related transfer function in {3DTV}",
        BOOKTITLE = "3DTV11",
        YEAR = "2011",
        PAGES = "1-4",
        BIBSOURCE = "http://www.visionbib.com/bibliography/describe499.html#TT106122"}

@inproceedings{bb109449,
  author    = {Liu, K. and Ostermann, J.},
  title     = {Realistic head motion synthesis for an image-based talking head},
  booktitle = FG11,
  year      = {2011},
  pages     = {125-130},
  bibsource = {http://www.visionbib.com/bibliography/describe499.html#TT106123},
}

@inproceedings{bb109450,
  author    = {Ostermann, J. and Liu, K.},
  title     = {Realistic head motion synthesis for an image-based talking head},
  booktitle = FG11,
  year      = {2011},
  pages     = {221-226},
  bibsource = {http://www.visionbib.com/bibliography/describe499.html#TT106123},
}

% Title: proper name braced so sentence-casing styles do not render it as "george".
@inproceedings{bb109451,
        AUTHOR = "Chaloupka, J. and Chaloupka, Z.",
        TITLE = "Czech Artificial Computerized Talking Head {George}",
        BOOKTITLE = COST08,
        YEAR = "2008",
        PAGES = "324-330",
        BIBSOURCE = "http://www.visionbib.com/bibliography/describe499.html#TT106124"}

% Title: language name braced so sentence-casing styles do not render it as "chinese".
@inproceedings{bb109452,
        AUTHOR = "Zhao, H. and Chen, Y.B. and Shen, Y.M. and Tang, C.J.",
        TITLE = "Audio-Visual Speech Synthesis Based on {Chinese} Visual Triphone",
        BOOKTITLE = CISP09,
        YEAR = "2009",
        PAGES = "1-5",
        BIBSOURCE = "http://www.visionbib.com/bibliography/describe499.html#TT106125"}

% Title: "3D" braced so sentence-casing styles do not render it as "3d".
@inproceedings{bb109453,
        AUTHOR = "Hu, Y.L. and Zhou, M.Q. and Wu, Z.K.",
        TITLE = "An Automatic Dense Point Registration Method for {3D} Face Animation",
        BOOKTITLE = CISP09,
        YEAR = "2009",
        PAGES = "1-6",
        BIBSOURCE = "http://www.visionbib.com/bibliography/describe499.html#TT106126"}

@inproceedings{bb109454,
  author    = {Berger, M.O. and Ponroy, J. and Wrobel Dautcourt, B.},
  title     = {Realistic Face Animation for Audiovisual Speech Applications: A Densification Approach Driven by Sparse Stereo Meshes},
  booktitle = MIRAGE09,
  year      = {2009},
  pages     = {297-307},
  bibsource = {http://www.visionbib.com/bibliography/describe499.html#TT106127},
}

@inproceedings{bb109455,
  author    = {Verdet, F. and Hennebert, J.},
  title     = {Impostures of Talking Face Systems Using Automatic Face Animation},
  booktitle = BTAS08,
  year      = {2008},
  pages     = {1-4},
  bibsource = {http://www.visionbib.com/bibliography/describe499.html#TT106128},
}

@inproceedings{bb109456,
  author    = {Gaur, U. and Jain, A. and Goel, S.},
  title     = {Towards Real-Time Monocular Video-Based Avatar Animation},
  booktitle = ISVC08,
  year      = {2008},
  pages     = {II: 949-958},
  bibsource = {http://www.visionbib.com/bibliography/describe499.html#TT106129},
}

% Page range is unknown upstream (recorded as the placeholder xx-yy); the PAGES field is
% omitted so styles do not print a bogus range. Add the real pages once known.
@inproceedings{bb109457,
        AUTHOR = "Badin, P. and Elisei, F. and Bailly, G. and Tarabalka, Y.",
        TITLE = "An Audiovisual Talking Head for Augmented Speech Generation: Models and
Animations Based on a Real Speaker's Articulatory Data",
        BOOKTITLE = AMDO08,
        YEAR = "2008",
        BIBSOURCE = "http://www.visionbib.com/bibliography/describe499.html#TT106130"}

@inproceedings{bb109458,
  author    = {Fanelli, G. and Fratarcangeli, M.},
  title     = {A Non-Invasive Approach for Driving Virtual Talking Heads from Real Facial Movements},
  booktitle = {3DTV07},
  year      = {2007},
  pages     = {1-4},
  bibsource = {http://www.visionbib.com/bibliography/describe499.html#TT106131},
}

@inproceedings{bb109459,
  author    = {Xiong, L. and Zheng, N.N. and You, Q. and Liu, J.Y.},
  title     = {Facial Expression Sequence Synthesis Based on Shape and Texture Fusion Model},
  booktitle = ICIP07,
  year      = {2007},
  pages     = {IV: 473-476},
  bibsource = {http://www.visionbib.com/bibliography/describe499.html#TT106132},
}

% Title: "3D" braced so sentence-casing styles do not render it as "3d".
@inproceedings{bb109460,
        AUTHOR = "Beaumesnil, B. and Luthon, F.",
        TITLE = "Real Time Tracking for {3D} Realistic Lip Animation",
        BOOKTITLE = ICPR06,
        YEAR = "2006",
        PAGES = "I: 219-222",
        BIBSOURCE = "http://www.visionbib.com/bibliography/describe499.html#TT106133"}

@inproceedings{bb109461,
  author    = {Ravindra de Silva, P. and Madurapperuma, A.P. and Marasinghe, A. and Osano, M.},
  title     = {Integrating Animated Pedagogical Agent as Motivational Supporter into Interactive System},
  booktitle = CRV06,
  year      = {2006},
  pages     = {34-34},
  bibsource = {http://www.visionbib.com/bibliography/describe499.html#TT106134},
}

@inproceedings{bb109462,
  author    = {Pei, Y.R. and Zha, H.B.},
  title     = {Vision Based Speech Animation Transferring with Underlying Anatomical Structure},
  booktitle = ACCV06,
  year      = {2006},
  pages     = {I:591-600},
  bibsource = {http://www.visionbib.com/bibliography/describe499.html#TT106135},
}

% Title: "3D" braced so sentence-casing styles do not render it as "3d".
@inproceedings{bb109463,
        AUTHOR = "Liu, Y.H. and Xu, G.Y. and Tao, L.M.",
        TITLE = "An Efficient Approach for Multi-view Face Animation Based on Quasi {3D}
Model",
        BOOKTITLE = ACCV06,
        YEAR = "2006",
        PAGES = "II:913-922",
        BIBSOURCE = "http://www.visionbib.com/bibliography/describe499.html#TT106136"}

@inproceedings{bb109464,
  author    = {Leszczynski, M. and Skarbek, W.},
  title     = {Viseme Classification for Talking Head Application},
  booktitle = CAIP05,
  year      = {2005},
  pages     = {773},
  bibsource = {http://www.visionbib.com/bibliography/describe499.html#TT106137},
}

@inproceedings{bb109465,
  author    = {Leszczynski, M. and Skarbek, W.},
  title     = {Viseme recognition: A comparative study},
  booktitle = AVSBS05,
  year      = {2005},
  pages     = {287-292},
  bibsource = {http://www.visionbib.com/bibliography/describe499.html#TT106138},
}

@inproceedings{bb109466,
  author    = {Leszczynski, M. and Skarbek, W. and Badura, S.},
  title     = {Fast Viseme Recognition for Talking Head Application},
  booktitle = ICIAR05,
  year      = {2005},
  pages     = {516-523},
  bibsource = {http://www.visionbib.com/bibliography/describe499.html#TT106139},
}

@inproceedings{bb109467,
  author    = {Gracia Roche, J.J. and Orrite, C. and Bernues, E. and Herrero, J.E.},
  title     = {Color Distribution Tracking for Facial Analysis},
  booktitle = IbPRIA05,
  year      = {2005},
  pages     = {I:484},
  bibsource = {http://www.visionbib.com/bibliography/describe499.html#TT106140},
}

% Title: "3D" braced so sentence-casing styles do not render it as "3d".
@inproceedings{bb109468,
        AUTHOR = "Ypsilos, I.A. and Hilton, A. and Turkmani, A. and Jackson, P.J.B.",
        TITLE = "Speech-driven face synthesis from {3D} video",
        BOOKTITLE = "3DPVT04",
        YEAR = "2004",
        PAGES = "58-65",
        BIBSOURCE = "http://www.visionbib.com/bibliography/describe499.html#TT106141"}

% Pages: literal "Vol" prefix dropped so the volume marker matches the bare roman-numeral
% form ("III: ...") used by the other multi-volume proceedings entries in this file.
@inproceedings{bb109469,
        AUTHOR = "Saisan, P. and Bissacco, A. and Chiuso, A. and Soatto, S.",
        TITLE = "Modeling and Synthesis of Facial Motion Driven by Speech",
        BOOKTITLE = ECCV04,
        YEAR = "2004",
        PAGES = "III: 456-467",
        BIBSOURCE = "http://www.visionbib.com/bibliography/describe499.html#TT106142"}

@inproceedings{bb109470,
  author    = {Malcangi, M. and de Tintis, R.},
  title     = {Audio Based Real-Time Speech Animation of Embodied Conversational Agents},
  booktitle = GW03,
  year      = {2003},
  pages     = {350-360},
  bibsource = {http://www.visionbib.com/bibliography/describe499.html#TT106143},
}

@inproceedings{bb109471,
  author    = {Aleksic, P.S. and Katsaggelos, A.K.},
  title     = {Speech-to-video synthesis using facial animation parameters},
  booktitle = ICIP03,
  year      = {2003},
  pages     = {III: 1-4},
  bibsource = {http://www.visionbib.com/bibliography/describe499.html#TT106144},
}

% Page range is unknown upstream (recorded as the placeholder xx-yy); the PAGES field is
% omitted so styles do not print a bogus range. Add the real pages once known.
@inproceedings{bb109472,
        AUTHOR = "Hack, C.A. and Taylor, C.J.",
        TITLE = "Modelling 'Talking Head' Behaviour",
        BOOKTITLE = BMVC03,
        YEAR = "2003",
        BIBSOURCE = "http://www.visionbib.com/bibliography/describe499.html#TT106145"}

% Title: "3D" braced so sentence-casing styles do not render it as "3d".
@inproceedings{bb109473,
        AUTHOR = "Choi, K.H. and Hwang, J.N.",
        TITLE = "Creating {3D} speech-driven talking heads: a probabilistic network
approach",
        BOOKTITLE = ICIP02,
        YEAR = "2002",
        PAGES = "I: 984-987",
        BIBSOURCE = "http://www.visionbib.com/bibliography/describe499.html#TT106146"}

% Title: "3D" braced so sentence-casing styles do not render it as "3d".
@inproceedings{bb109474,
        AUTHOR = "Hong, P.Y. and Wen, Z. and Huang, T.S. and Shum, H.Y.",
        TITLE = "Real-time speech-driven {3D} face animation",
        BOOKTITLE = "3DPVT02",
        YEAR = "2002",
        PAGES = "713-716",
        BIBSOURCE = "http://www.visionbib.com/bibliography/describe499.html#TT106147"}

@inproceedings{bb109475,
  author    = {Morishima, S. and Yotsukura, T.},
  title     = {Hypermask: Talking Head Projected Onto Moving Surface},
  booktitle = ICIP01,
  year      = {2001},
  pages     = {III: 947-950},
  bibsource = {http://www.visionbib.com/bibliography/describe499.html#TT106148},
}

% Title: "3D" braced so sentence-casing styles do not render it as "3d".
@inproceedings{bb109476,
        AUTHOR = "Neumann, J. and Aloimonos, Y.",
        TITLE = "Talking Heads: Introducing the tool of {3D} motion fields in the study of
action",
        BOOKTITLE = HUMO00,
        YEAR = "2000",
        PAGES = "25-32",
        BIBSOURCE = "http://www.visionbib.com/bibliography/describe499.html#TT106149"}

@inproceedings{bb109477,
  author    = {Chen, T.H. and Wang, Y. and Graf, H.P. and Swain, C.T.},
  title     = {A new frame interpolation scheme for talking head sequences},
  booktitle = ICIP95,
  year      = {1995},
  pages     = {II: 591-594},
  bibsource = {http://www.visionbib.com/bibliography/describe499.html#TT106150},
}

% Title: "3d" restored to the acronym and braced so sentence-casing styles keep it.
% Pages: literal "Vol" prefix dropped to match the "III: ..." form used by sibling entries.
@inproceedings{bb109478,
        AUTHOR = "Shan, S.",
        TITLE = "Individual {3D} Face Synthesis Based on Orthogonal Photos and
Speech-driven Facial Animation",
        BOOKTITLE = ICIP00,
        YEAR = "2000",
        PAGES = "III: 238-241",
        BIBSOURCE = "http://www.visionbib.com/bibliography/describe499.html#TT106151"}

@inproceedings{bb109479,
  author    = {Noh, J.Y. and Neumann, U.},
  title     = {Talking Face},
  booktitle = ICME00,
  year      = {2000},
  pages     = {TA1},
  bibsource = {http://www.visionbib.com/bibliography/describe499.html#TT106152},
}

% Title: "HMMS" was upper-cased upstream; restored to the plural acronym and braced so
% sentence-casing styles keep it. NOTE(review): confirm against the published title.
@inproceedings{bb109480,
        AUTHOR = "Kakihara, K. and Nakamura, S. and Shikano, K.",
        TITLE = "Speech-To-Face Movement Synthesis Based on {HMMs}",
        BOOKTITLE = ICME00,
        YEAR = "2000",
        PAGES = "MP7",
        BIBSOURCE = "http://www.visionbib.com/bibliography/describe499.html#TT106153"}

@inproceedings{bb109481,
  author    = {Van Gool, L.J. and Tuytelaars, T. and Pollefeys, M.},
  title     = {Adventurous Tourism for Couch Potatoes},
  booktitle = CAIP99,
  year      = {1999},
  pages     = {98-107},
  bibsource = {http://www.visionbib.com/bibliography/describe499.html#TT106154},
}

@inproceedings{bb109482,
  author    = {Ishikawa, T. and Sera, H. and Morishima, S. and Terzopoulos, D.},
  title     = {Facial Image Reconstruction by Estimated Muscle Parameter},
  booktitle = AFGR98,
  year      = {1998},
  pages     = {342-347},
  bibsource = {http://www.visionbib.com/bibliography/describe499.html#TT106155},
}

@inproceedings{bb109483,
  author    = {Bothe, H.H.},
  title     = {A visual speech model based on fuzzy-neuro methods},
  booktitle = CIAP95,
  year      = {1995},
  pages     = {152-158},
  bibsource = {http://www.visionbib.com/bibliography/describe499.html#TT106156},
}

@article{bb109484,
  author    = {Lavagetto, F.},
  title     = {Time-Delay Neural Networks for Estimating Lip Movements from Speech Analysis: A Useful Tool in Audio Video Synchronization},
  journal   = CirSysVideo,
  volume    = {7},
  year      = {1997},
  number    = {5},
  month     = {October},
  pages     = {786-800},
  bibsource = {http://www.visionbib.com/bibliography/describe500syncav1.html#TT106157},
}

@inproceedings{bb109485,
  author    = {Gasper, E. and Matthews, J.H. and Wesley, R.},
  title     = {Advanced tools for speech synchronized animation},
  booktitle = US_Patent,
  year      = {1997},
  bibsource = {http://www.visionbib.com/bibliography/describe500syncav1.html#TT106158},
}

@inproceedings{bb109486,
  author    = {Wesley, R. and Matthews, J.H. and Gasper, E.},
  title     = {Advanced tools for speech synchronized animation},
  booktitle = US_Patent,
  year      = {1997},
  bibsource = {http://www.visionbib.com/bibliography/describe500syncav1.html#TT106158},
}

@inproceedings{bb109487,
  author    = {Gasper, E. and Wesley, R.},
  title     = {Advanced tools for speech synchronized animation},
  booktitle = US_Patent,
  year      = {1997},
  bibsource = {http://www.visionbib.com/bibliography/describe500syncav1.html#TT106158},
}

@article{bb109488,
  author    = {Chien, J.T. and Lin, M.S.},
  title     = {Frame-synchronous noise compensation for hands-free speech recognition in car environments},
  journal   = VISP,
  volume    = {147},
  year      = {2000},
  number    = {6},
  month     = {December},
  pages     = {508-515},
  bibsource = {http://www.visionbib.com/bibliography/describe500syncav1.html#TT106159},
}

@inproceedings{bb109489,
  author    = {Rosenfeld, M.},
  title     = {Method for automatically animating lip synchronization and facial expression of animated characters},
  booktitle = US_Patent,
  year      = {2001},
  bibsource = {http://www.visionbib.com/bibliography/describe500syncav1.html#TT106160},
}

@inproceedings{bb109490,
  author    = {Haisma, N. and Sinke, J.G. and Bergevoet, B.A.J. and van Gestel, H.A.W.},
  title     = {Post-synchronizing an information stream including lip objects replacement},
  booktitle = US_Patent,
  year      = {2006},
  bibsource = {http://www.visionbib.com/bibliography/describe500syncav1.html#TT106161},
}

@inproceedings{bb109491,
  author    = {Huang, Y. and Lin, S.S.T. and Guo, B.N. and Shum, H.Y.},
  title     = {System and method for real time lip synchronization},
  booktitle = US_Patent,
  year      = {2006},
  bibsource = {http://www.visionbib.com/bibliography/describe500syncav1.html#TT106162},
}

@article{bb109492,
  author    = {Saenko, K. and Livescu, K. and Glass, J. and Darrell, T.J.},
  title     = {Multistream Articulatory Feature-Based Models for Visual Speech Recognition},
  journal   = PAMI,
  volume    = {31},
  year      = {2009},
  number    = {9},
  month     = {September},
  pages     = {1700-1707},
  bibsource = {http://www.visionbib.com/bibliography/describe500syncav1.html#TT106163},
}

@inproceedings{bb109493,
  author    = {Saenko, K. and Livescu, K. and Siracusa, M. and Wilson, K. and Glass, J. and Darrell, T.J.},
  title     = {Visual Speech Recognition with Loosely Synchronized Feature Streams},
  booktitle = ICCV05,
  year      = {2005},
  pages     = {II: 1424-1431},
  bibsource = {http://www.visionbib.com/bibliography/describe500syncav1.html#TT106164},
}

@article{bb109494,
  author    = {El Sallam, A.A. and Mian, A.S.},
  title     = {Correlation based speech-video synchronization},
  journal   = PRL,
  volume    = {32},
  year      = {2011},
  number    = {6},
  month     = {April},
  pages     = {780-786},
  bibsource = {http://www.visionbib.com/bibliography/describe500syncav1.html#TT106165},
}

@inproceedings{bb109495,
  author    = {El Sallam, A.A. and Mian, A.S.},
  title     = {Speech-Video Synchronization Using Lips Movements and Speech Envelope Correlation},
  booktitle = ICIAR09,
  year      = {2009},
  pages     = {397-407},
  bibsource = {http://www.visionbib.com/bibliography/describe500syncav1.html#TT106166},
}

@article{bb109496,
  author    = {Chen, Y.M. and Huang, F.C. and Guan, S.H. and Chen, B.Y.},
  title     = {Animating Lip-Sync Characters With Dominated Animeme Models},
  journal   = CirSysVideo,
  volume    = {22},
  year      = {2012},
  number    = {9},
  month     = {September},
  pages     = {1344-1353},
  bibsource = {http://www.visionbib.com/bibliography/describe500syncav1.html#TT106167},
}

@article{bb109497,
  author    = {Srinivasan, V. and Bethel, C.L. and Murphy, R.R.},
  title     = {Evaluation of Head Gaze Loosely Synchronized With Real-Time Synthetic Speech for Social Robots},
  journal   = HMS,
  volume    = {44},
  year      = {2014},
  number    = {6},
  month     = {December},
  pages     = {767-778},
  bibsource = {http://www.visionbib.com/bibliography/describe500syncav1.html#TT106168},
}

@article{bb109498,
  author    = {Liu, N. and Zhou, T. and Ji, Y.F. and Zhao, Z.Y. and Wan, L.H.},
  title     = {Synthesizing Talking Faces from Text and Audio: An Autoencoder and Sequence-to-Sequence Convolutional Neural Network},
  journal   = PR,
  volume    = {102},
  year      = {2020},
  pages     = {107231},
  bibsource = {http://www.visionbib.com/bibliography/describe500syncav1.html#TT106169},
}

@article{bb109499,
  author    = {Yu, L. and Yu, J. and Li, M. and Ling, Q.},
  title     = {Multimodal Inputs Driven Talking Face Generation With Spatial-Temporal Dependency},
  journal   = CirSysVideo,
  volume    = {31},
  year      = {2021},
  number    = {1},
  month     = {January},
  pages     = {203-216},
  bibsource = {http://www.visionbib.com/bibliography/describe500syncav1.html#TT106170},
}

Last update:Jan 8, 2026 at 12:52:16