@article{bb109800,
        AUTHOR = "Lyu, J.Y. and Lan, X. and Hu, G. and Jiang, H.Y. and Gan, W. and Wang, J.B. and Xue, J.",
        TITLE = "Multimodal Emotional Talking Face Generation Based on Action Units",
        JOURNAL = CirSysVideo,
        VOLUME = "35",
        YEAR = "2025",
        NUMBER = "5",
        MONTH = may,
        PAGES = "4026--4038",
        BIBSOURCE = "http://www.visionbib.com/bibliography/describe499.html#TT106473"}

@article{bb109801,
        AUTHOR = "Chen, K.L. and Li, Z.Z. and Cui, F. and Ni, M. and Wang, S.Y. and Che, J.L. and Liu, F. and Qi, Y.G. and Zhang, F.W. and Liu, J. and Guo, G. and Fu, R.R. and Huang, Y.X.",
        TITLE = "{FastTalker}: Real-time audio-driven talking face generation with {3D}
{Gaussian}",
        JOURNAL = IVC,
        VOLUME = "159",
        YEAR = "2025",
        PAGES = "105573",
        BIBSOURCE = "http://www.visionbib.com/bibliography/describe499.html#TT106474"}

@article{bb109802,
        AUTHOR = "Chen, L.Y. and Bao, W.H. and Lei, S. and Tang, B. and Wu, Z.Y. and Kang, S.Y. and Huang, H.Z. and Meng, H.",
        TITLE = "{AdaMesh}: Personalized Facial Expressions and Head Poses for Adaptive
Speech-Driven {3D} Facial Animation",
        JOURNAL = MultMed,
        VOLUME = "27",
        YEAR = "2025",
        PAGES = "3598--3609",
        BIBSOURCE = "http://www.visionbib.com/bibliography/describe499.html#TT106475"}

@article{bb109803,
        AUTHOR = "Zhou, M. and Bai, Y. and Zhang, W. and Yao, T. and Zhao, T.J.",
        TITLE = "Interactive Conversational Head Generation",
        JOURNAL = PAMI,
        VOLUME = "47",
        YEAR = "2025",
        NUMBER = "8",
        MONTH = aug,
        PAGES = "6673--6686",
        BIBSOURCE = "http://www.visionbib.com/bibliography/describe499.html#TT106476"}

@article{bb109804,
        AUTHOR = "Chu, Z.J. and Guo, K.L. and Xing, X.F. and Liu, P.S. and Cai, B. and Xu, X.M.",
        TITLE = "{DCPTalk}: Speech-Driven {3D} Face Animation With Personalized Facial
Dynamic Coupling Properties",
        JOURNAL = MultMed,
        VOLUME = "27",
        YEAR = "2025",
        PAGES = "4427--4440",
        BIBSOURCE = "http://www.visionbib.com/bibliography/describe499.html#TT106477"}

@article{bb109805,
        AUTHOR = "Shi, W.Z. and Xue, Z. and Wen, Y.",
        TITLE = "Keypoints and Action Units Jointly Drive Talking Head Generation for
Video Conferencing",
        JOURNAL = CirSysVideo,
        VOLUME = "35",
        YEAR = "2025",
        NUMBER = "9",
        MONTH = sep,
        PAGES = "8692--8706",
        BIBSOURCE = "http://www.visionbib.com/bibliography/describe499.html#TT106478"}

@article{bb109806,
        AUTHOR = "Tang, J.X. and Wang, K.S.Y. and Zhou, H. and Chen, X.K. and He, D.L. and Hu, T.S. and Liu, J.T. and Liu, Z.W. and Zeng, G. and Wang, J.D.",
        TITLE = "Real-Time Neural Radiance Talking Portrait Synthesis via Audio-Spatial
Decomposition",
        JOURNAL = IJCV,
        VOLUME = "133",
        YEAR = "2025",
        NUMBER = "9",
        MONTH = sep,
        PAGES = "6362--6373",
        BIBSOURCE = "http://www.visionbib.com/bibliography/describe499.html#TT106479"}

@article{bb109807,
        AUTHOR = "Ma, Y.F. and Wang, S. and Ding, Y. and Ma, B. and Lv, T.J. and Fan, C.J. and Hu, Z.P. and Deng, Z.D. and Yu, X.",
        TITLE = "{TalkCLIP}: Talking Head Generation with Text-Guided Expressive
Speaking Styles",
        JOURNAL = MultMed,
        VOLUME = "27",
        YEAR = "2025",
        PAGES = "6335--6346",
        BIBSOURCE = "http://www.visionbib.com/bibliography/describe499.html#TT106480"}

@article{bb109808,
        AUTHOR = "Vo, A.H. and Kim, T.S. and Jin, H. and Choi, S.M. and Kim, Y.G.",
        TITLE = "Instruction-Driven {3D} Facial Expression Generation and Transition",
        JOURNAL = MultMed,
        VOLUME = "27",
        YEAR = "2025",
        PAGES = "6140--6153",
        BIBSOURCE = "http://www.visionbib.com/bibliography/describe499.html#TT106481"}

@article{bb109809,
        AUTHOR = "Chen, X. and Tang, H.D. and Yang, X.Y.",
        TITLE = "Audio-driven face generation via spatial attention and facial contour
guidance for lip synchronization",
        JOURNAL = PRL,
        VOLUME = "197",
        YEAR = "2025",
        PAGES = "154--160",
        BIBSOURCE = "http://www.visionbib.com/bibliography/describe499.html#TT106482"}

@article{bb109810,
        AUTHOR = "Yang, D. and Liu, Y. and Yang, Q.Y. and Li, R.",
        TITLE = "{FacialTalk}: Audio-driven high-fidelity facial portrait generation
using {3D} facial prior",
        JOURNAL = PR,
        VOLUME = "171",
        YEAR = "2026",
        PAGES = "111994",
        BIBSOURCE = "http://www.visionbib.com/bibliography/describe499.html#TT106483"}

@article{bb109811,
        AUTHOR = "Chu, Z.J. and Guo, K.L. and Xing, X.F. and Cai, B. and He, S. and Xu, X.M.",
        TITLE = "Alleviating One-to-Many Mapping in Talking Head Synthesis With
Dynamic Adaptation Context and Style Adapter",
        JOURNAL = CirSysVideo,
        VOLUME = "35",
        YEAR = "2025",
        NUMBER = "11",
        MONTH = nov,
        PAGES = "10801--10814",
        BIBSOURCE = "http://www.visionbib.com/bibliography/describe499.html#TT106484"}

@article{bb109812,
        AUTHOR = "Zhang, Y.M. and Gu, Y.C. and Zeng, Y.H. and Xing, Z.N. and Wang, Y.C. and Wu, Z.Z. and Liu, B. and Chen, K.",
        TITLE = "{FoleyCrafter}: Bring Silent Videos to Life with Lifelike and
Synchronized Sounds",
        JOURNAL = IJCV,
        VOLUME = "134",
        YEAR = "2026",
        NUMBER = "1",
        MONTH = jan,
        PAGES = "46",
        BIBSOURCE = "http://www.visionbib.com/bibliography/describe499.html#TT106485"}

@article{bb109813,
        AUTHOR = "Wu, S.J. and Li, Y.H. and Zhang, W. and Jia, J. and Zhu, Y.C. and Yan, Y.C. and Zhai, G.T. and Yang, X.K.",
        TITLE = "{SingingHead}: A Large-Scale {4D} Dataset for Singing Head Animation",
        JOURNAL = MultMed,
        VOLUME = "28",
        YEAR = "2026",
        PAGES = "700--714",
        BIBSOURCE = "http://www.visionbib.com/bibliography/describe499.html#TT106486"}

@article{bb109814,
        AUTHOR = "Nocentini, F. and Besnier, T. and Ferrari, C. and Arguillere, S. and Daoudi, M. and Berretti, S.",
        TITLE = "Beyond Fixed Topologies: Unregistered Training and Comprehensive
Evaluation Metrics for {3D} Talking Heads",
        JOURNAL = IJCV,
        VOLUME = "134",
        YEAR = "2026",
        NUMBER = "1",
        MONTH = jan,
        PAGES = "105",
        BIBSOURCE = "http://www.visionbib.com/bibliography/describe499.html#TT106487"}

@article{bb109815,
        AUTHOR = "Yang, C.L. and Yao, K. and Yan, Y.Y. and Jiang, C.R. and Zhao, W.G. and Sun, J. and Cheng, G.L. and Zhang, Y.F. and Dong, B. and Huang, K.Z.",
        TITLE = "Unlock Pose Diversity: Accurate and Efficient Implicit Keypoint-based
Spatiotemporal Diffusion for Audio-driven Talking Portrait",
        JOURNAL = IJCV,
        VOLUME = "134",
        YEAR = "2026",
        NUMBER = "1",
        MONTH = jan,
        PAGES = "111",
        BIBSOURCE = "http://www.visionbib.com/bibliography/describe499.html#TT106488"}

% NOTE(review): PAGES below is still the placeholder "xx-yy"; replace it with
% the published article number or page range once it is known.
@article{bb109816,
        AUTHOR = "Meng, M. and Zhao, Y.F. and Zhang, B. and Zhu, Y.G. and Shi, W.M. and Wen, M. and Fan, Z.X.",
        TITLE = "A Survey of Talking Head Synthesis Techniques: Portrait Generation,
Driving Mechanisms, and Editing",
        JOURNAL = Surveys,
        VOLUME = "58",
        YEAR = "2026",
        NUMBER = "7",
        MONTH = feb,
        PAGES = "xx-yy",
        BIBSOURCE = "http://www.visionbib.com/bibliography/describe499.html#TT106489"}

@article{bb109817,
        AUTHOR = "Wang, L. and Chen, G.B. and Liu, F. and Wu, J.J. and Cheng, J.",
        TITLE = "{Speech2Blend}: A Hybrid Network for Speech-Driven {3-D} Facial Animation
by Learning Blendshape",
        JOURNAL = HMS,
        VOLUME = "56",
        YEAR = "2026",
        NUMBER = "1",
        MONTH = feb,
        PAGES = "48--57",
        BIBSOURCE = "http://www.visionbib.com/bibliography/describe499.html#TT106490"}

@article{bb109818,
        AUTHOR = "Xu, Z.H. and Chen, T.S. and Yang, Z.J. and Qing, C.M. and Wang, K. and Lin, L.",
        TITLE = "Exploiting Temporal Audio-Visual Correlation Embedding for
Audio-Driven One-Shot Talking Head Animation",
        JOURNAL = MultMed,
        VOLUME = "28",
        YEAR = "2026",
        PAGES = "1014--1024",
        BIBSOURCE = "http://www.visionbib.com/bibliography/describe499.html#TT106491"}

@article{bb109819,
        AUTHOR = "Li, X.N. and Sheng, X. and Wang, M. and Ou, F.Z. and Chen, B.L. and Wang, S.Q. and Kwong, S.",
        TITLE = "{CoFaCo}: Controllable Generative Talking Face Video Coding",
        JOURNAL = IP,
        VOLUME = "35",
        YEAR = "2026",
        PAGES = "465--479",
        BIBSOURCE = "http://www.visionbib.com/bibliography/describe499.html#TT106492"}

@inproceedings{bb109820,
        AUTHOR = "Sun, X. and Zhang, L.H. and Zhu, H. and Zhang, P. and Zhang, B. and Ji, X. and Zhou, K. and Gao, D. and Bo, L. and Cao, X.",
        TITLE = "{VividTalk}: One-Shot Audio-Driven Talking Head Generation Based on {3D}
Hybrid Prior",
        BOOKTITLE = "3DV25",
        YEAR = "2025",
        PAGES = "713--722",
        BIBSOURCE = "http://www.visionbib.com/bibliography/describe499.html#TT106493"}

@inproceedings{bb109821,
        AUTHOR = "Guo, W.J. and Kaneko, N. and Akazawa, Y.",
        TITLE = "Low-Latency Real-Time Audio-Driven Talking Head Generation Based on
Future Speech Feature Prediction",
        BOOKTITLE = MVA25,
        YEAR = "2025",
        PAGES = "1--5",
        BIBSOURCE = "http://www.visionbib.com/bibliography/describe499.html#TT106494"}

@inproceedings{bb109822,
        AUTHOR = "Liu, X.H. and Min, X.K. and Hu, Q. and Zhang, X.Y. and Guo, J. and Zhai, G.T. and Wang, S. and Zhou, Y.J. and Liu, L. and Li, J.X. and Yang, L. and Wen, F. and Xu, L. and Jiang, Y.W. and Zhu, X. and Li, C.Y. and Zhang, Z.C. and Duan, H.Y. and Wu, X. and Gao, Y.X. and Cao, Y.Q. and Jia, J. and Sun, W. and Cao, J. and Timofte, R. and Li, B. and Huang, J. and Luo, D. and Liu, T. and Zhang, W.X. and Zheng, B.K. and Chen, J.L. and Zhou, R.K. and Chen, M. and Wang, Y. and Jiang, H. and Li, X.T. and Jiang, Y.X. and Tang, J. and Zhao, Y.M. and Hu, B. and Qi, Z. and Zhang, C.Y. and Zhao, F. and Shi, P. and Fu, L.Z. and Cong, H. and He, S. and Zhang, R. and He, J. and Hu, Z.Y. and Luo, W. and Yu, Z. and Guan, F.B. and Lu, Y.T. and Li, X. and Chen, Z.B. and Su, M.J. and Wang, Y. and Chen, T. and Li, C.X. and Zhao, S. and Wen, J.X. and Lin, C. and Liu, S. and Chu, N.X. and Wan, J. and Zhou, Y. and Chen, B.Y. and Zeng, J. and Liu, J.R. and Liu, X.J. and Chen, X. and Zhou, L. and Li, H. and Han, Y. and Xiang, B. and Liu, Z.J. and Lu, J.Z. and Gui, J.L. and Lu, R.J. and Wang, S.F. and Zhou, D.H. and Lin, J.Y. and Song, Q.J. and Huang, J.C. and Yang, Y.F. and Wang, C.W. and Zhong, S. and Yang, Y. and He, L. and Liu, J. and Xing, Y.T. and Fang, T. and Jin, Y.C.",
        TITLE = "{NTIRE} 2025 {XGC} Quality Assessment Challenge: Methods and Results",
        BOOKTITLE = NTIRE25,
        YEAR = "2025",
        PAGES = "978--992",
        BIBSOURCE = "http://www.visionbib.com/bibliography/describe499.html#TT106495"}

@inproceedings{bb109823,
        AUTHOR = "Su, M.J. and Wang, Y. and Chen, T. and Li, C.X. and Zhao, S. and Wen, J.X. and Lin, C. and Liu, S. and Chu, N.X. and Zhou, Y.",
        TITLE = "Quality Assessment for Talking Head Videos via Multi-Modal Feature
Representation",
        BOOKTITLE = NTIRE25,
        YEAR = "2025",
        PAGES = "1405--1411",
        BIBSOURCE = "http://www.visionbib.com/bibliography/describe499.html#TT106496"}

@inproceedings{bb109824,
        AUTHOR = "Wang, X. and Song, R.H. and Li, C.X. and Cheng, X. and Li, B. and Wu, Y.H. and Wang, Y.Y. and Xu, H.T. and Wang, Y.F.",
        TITLE = "Animate and Sound an Image",
        BOOKTITLE = CVPR25,
        YEAR = "2025",
        PAGES = "23369--23378",
        BIBSOURCE = "http://www.visionbib.com/bibliography/describe499.html#TT106497"}

@inproceedings{bb109825,
        AUTHOR = "Zhu, Y.M. and Zhang, L.H. and Rong, Z.K. and Hu, T.S. and Liang, S. and Ge, Z.P.",
        TITLE = "{INFP}: Audio-Driven Interactive Head Generation in Dyadic
Conversations",
        BOOKTITLE = CVPR25,
        YEAR = "2025",
        PAGES = "10667--10677",
        BIBSOURCE = "http://www.visionbib.com/bibliography/describe499.html#TT106498"}

@inproceedings{bb109826,
        AUTHOR = "Guan, J.Z. and Wang, K.Y. and Xu, Z.L. and Yang, Q.W. and Sun, Y.S. and He, S.Y. and Liang, B. and Cao, Y. and Li, Y.Y. and Feng, H.C. and Ding, E. and Wang, J.D. and Zhao, Y.J. and Zhou, H. and Liu, Z.W.",
        TITLE = "{AudCast}: Audio-Driven Human Video Generation by Cascaded Diffusion
Transformers",
        BOOKTITLE = CVPR25,
        YEAR = "2025",
        PAGES = "10678--10689",
        BIBSOURCE = "http://www.visionbib.com/bibliography/describe499.html#TT106499"}

@inproceedings{bb109827,
        AUTHOR = "Li, H. and Dai, J. and Zhao, X. and Zhou, F. and Pan, J.J. and Li, L.",
        TITLE = "{Wav2Sem}: Plug-and-Play Audio Semantic Decoupling for {3D} Speech-Driven
Facial Animation",
        BOOKTITLE = CVPR25,
        YEAR = "2025",
        PAGES = "183--192",
        BIBSOURCE = "http://www.visionbib.com/bibliography/describe499.html#TT106500"}

% NOTE(review): same author/title/booktitle/year/pages as bb109827 (duplicate
% record). Key kept because it may be cited; consider merging.
@inproceedings{bb109828,
        AUTHOR = "Li, H. and Dai, J. and Zhao, X. and Zhou, F. and Pan, J.J. and Li, L.",
        TITLE = "{Wav2Sem}: Plug-and-Play Audio Semantic Decoupling for {3D} Speech-Driven
Facial Animation",
        BOOKTITLE = CVPR25,
        YEAR = "2025",
        PAGES = "183--192",
        BIBSOURCE = "http://www.visionbib.com/bibliography/describe499.html#TT106501"}

@inproceedings{bb109829,
        AUTHOR = "Wang, S.Z. and Li, X.T. and Liu, C. and Chan, M. and Stengel, M. and Fuchs, H. and de Mello, S. and Nagano, K.",
        TITLE = "Coherent {3D} Portrait Video Reconstruction via Triplane Fusion",
        BOOKTITLE = CVPR25,
        YEAR = "2025",
        PAGES = "10712--10722",
        BIBSOURCE = "http://www.visionbib.com/bibliography/describe499.html#TT106502"}

@inproceedings{bb109830,
        AUTHOR = "Ji, X.Z. and Hu, X.B. and Xu, Z.H. and Zhu, J.W. and Lin, C. and He, Q. and Zhang, J.N. and Luo, D.H. and Chen, Y. and Lin, Q. and Lu, Q.L. and Wang, C.J.",
        TITLE = "Sonic: Shifting Focus to Global Audio Perception in Portrait
Animation",
        BOOKTITLE = CVPR25,
        YEAR = "2025",
        PAGES = "193--203",
        BIBSOURCE = "http://www.visionbib.com/bibliography/describe499.html#TT106503"}

@inproceedings{bb109831,
        AUTHOR = "Lai, P. and Zhong, W.Z. and Qin, Y.P. and Ren, X.H. and Wang, B.Y. and Li, G.B.",
        TITLE = "{LLM}-driven Multimodal and Multi-Identity Listening Head Generation",
        BOOKTITLE = CVPR25,
        YEAR = "2025",
        PAGES = "10656--10666",
        BIBSOURCE = "http://www.visionbib.com/bibliography/describe499.html#TT106504"}

% NOTE(review): same author/title/booktitle/year/pages as bb109827 (duplicate
% record). Key kept because it may be cited; consider merging.
@inproceedings{bb109832,
        AUTHOR = "Li, H. and Dai, J. and Zhao, X. and Zhou, F. and Pan, J.J. and Li, L.",
        TITLE = "{Wav2Sem}: Plug-and-Play Audio Semantic Decoupling for {3D} Speech-Driven
Facial Animation",
        BOOKTITLE = CVPR25,
        YEAR = "2025",
        PAGES = "183--192",
        BIBSOURCE = "http://www.visionbib.com/bibliography/describe499.html#TT106505"}

@inproceedings{bb109833,
        AUTHOR = "Zhen, D.C. and Yin, S. and Qin, S. and Yi, H. and Zhang, Z.W. and Liu, S.Y. and Qi, G. and Tao, M.",
        TITLE = "Teller: Real-Time Streaming Audio-Driven Portrait Animation with
Autoregressive Motion Generation",
        BOOKTITLE = CVPR25,
        YEAR = "2025",
        PAGES = "21075--21085",
        BIBSOURCE = "http://www.visionbib.com/bibliography/describe499.html#TT106506"}

@inproceedings{bb109834,
        AUTHOR = "Li, X. and Wang, J.Y. and Cheng, Y.H. and Zeng, Y.K. and Ren, X.Y. and Zhu, W.H. and Zhao, W.M. and Yan, Y.C.",
        TITLE = "Towards High-fidelity {3D} Talking Avatar with Personalized Dynamic
Texture",
        BOOKTITLE = CVPR25,
        YEAR = "2025",
        PAGES = "204--214",
        BIBSOURCE = "http://www.visionbib.com/bibliography/describe499.html#TT106507"}

@inproceedings{bb109835,
        AUTHOR = "Zhong, T.Y. and Liang, C. and Jiang, J.W. and Lin, G. and Yang, J.Q. and Zhao, Z.",
        TITLE = "{FADA}: Fast Diffusion Avatar Synthesis with Mixed-Supervised {Multi-CFG}
Distillation",
        BOOKTITLE = CVPR25,
        YEAR = "2025",
        PAGES = "3101--3110",
        BIBSOURCE = "http://www.visionbib.com/bibliography/describe499.html#TT106508"}

@inproceedings{bb109836,
        AUTHOR = "Gong, S.J. and Li, H.J. and Tang, J.P. and Hu, D.M. and Huang, S. and Chen, H. and Chen, T.S. and Liu, Z.",
        TITLE = "Monocular and Generalizable {Gaussian} Talking Head Animation",
        BOOKTITLE = CVPR25,
        YEAR = "2025",
        PAGES = "5523--5534",
        BIBSOURCE = "http://www.visionbib.com/bibliography/describe499.html#TT106509"}

@inproceedings{bb109837,
        AUTHOR = "Li, J. and Zhang, J.W. and Bai, X. and Zheng, J. and Zhou, J. and Gu, L.",
        TITLE = "{InsTaG}: Learning Personalized {3D} Talking Head from Few-Second Video",
        BOOKTITLE = CVPR25,
        YEAR = "2025",
        PAGES = "10690--10700",
        BIBSOURCE = "http://www.visionbib.com/bibliography/describe499.html#TT106510"}

@inproceedings{bb109838,
        AUTHOR = "Chen, J.C. and Hu, J. and Wang, G. and Jiang, Z.H. and Zhou, T. and Chen, Z.W. and Lv, C.F.",
        TITLE = "{TaoAvatar}: Real-Time Lifelike Full-Body Talking Avatars for Augmented
Reality via {3D} {Gaussian} Splatting",
        BOOKTITLE = CVPR25,
        YEAR = "2025",
        PAGES = "10723--10734",
        BIBSOURCE = "http://www.visionbib.com/bibliography/describe499.html#TT106511"}

@inproceedings{bb109839,
        AUTHOR = "Gan, Y. and Miao, J.X. and Wang, Y.Z. and Yang, Y.",
        TITLE = "Silence is Golden: Leveraging Adversarial Examples to Nullify Audio
Control in {LDM}-based Talking-Head Generation",
        BOOKTITLE = CVPR25,
        YEAR = "2025",
        PAGES = "13434--13444",
        BIBSOURCE = "http://www.visionbib.com/bibliography/describe499.html#TT106512"}

@inproceedings{bb109840,
        AUTHOR = "Peng, Z.Q. and Fan, Y.B. and Wu, H.Y. and Wang, X. and Liu, H.Y. and He, J. and Fan, Z.X.",
        TITLE = "{DualTalk}: Dual-Speaker Interaction for {3D} Talking Head Conversations",
        BOOKTITLE = CVPR25,
        YEAR = "2025",
        PAGES = "21055--21064",
        BIBSOURCE = "http://www.visionbib.com/bibliography/describe499.html#TT106513"}

% NOTE(review): the first four authors were stored with the given name in the
% surname slot ("Chae Yeon, L." etc.). Surnames restored from the published
% author list (Lee Chae-Yeon, Oh Hyun-Bin, Han EunGi, Kim Sung-Bin) -- confirm.
@inproceedings{bb109841,
        AUTHOR = "Lee, Chae Yeon and Oh, Hyun Bin and Han, EunGi and Kim, Sung Bin and Nam, S. and Oh, T.H.",
        TITLE = "Perceptually Accurate {3D} Talking Head Generation: New Definitions,
Speech-Mesh Representation, and Evaluation Metrics",
        BOOKTITLE = CVPR25,
        YEAR = "2025",
        PAGES = "21065--21074",
        BIBSOURCE = "http://www.visionbib.com/bibliography/describe499.html#TT106514"}

@inproceedings{bb109842,
        AUTHOR = "Li, Y. and Bai, Z.Q. and Tan, F. and Cui, Z.P. and Fanello, S. and Zhang, Y.",
        TITLE = "{IM-Portrait}: Learning {3D}-aware Video Diffusion for Photorealistic
Talking Heads from Monocular Videos",
        BOOKTITLE = CVPR25,
        YEAR = "2025",
        PAGES = "21107--21116",
        BIBSOURCE = "http://www.visionbib.com/bibliography/describe499.html#TT106515"}

@inproceedings{bb109843,
        AUTHOR = "Zhao, S. and Hong, F.T. and Huang, X.S. and Xu, D.",
        TITLE = "Synergizing Motion and Appearance: Multi-Scale Compensatory Codebooks
for Talking Head Video Generation",
        BOOKTITLE = CVPR25,
        YEAR = "2025",
        PAGES = "26232--26241",
        BIBSOURCE = "http://www.visionbib.com/bibliography/describe499.html#TT106516"}

@inproceedings{bb109844,
        AUTHOR = "Wang, H.T. and Weng, Y.Z. and Li, Y.Y. and Guo, Z.L. and Du, J. and Niu, S.T. and Ma, J.F. and He, S. and Wu, X.Y. and Hu, Q.M. and Yin, B. and Liu, C. and Liu, Q.F.",
        TITLE = "{EmotiveTalk}: Expressive Talking Head Generation through Audio
Information Decoupling and Emotional Video Diffusion",
        BOOKTITLE = CVPR25,
        YEAR = "2025",
        PAGES = "26212--26221",
        BIBSOURCE = "http://www.visionbib.com/bibliography/describe499.html#TT106517"}

@inproceedings{bb109845,
        AUTHOR = "Khungurn, P.",
        TITLE = "Talking Head Anime 4: Distillation for Real-Time Performance",
        BOOKTITLE = WACV25,
        YEAR = "2025",
        PAGES = "5018--5029",
        BIBSOURCE = "http://www.visionbib.com/bibliography/describe499.html#TT106518"}

@inproceedings{bb109846,
        AUTHOR = "Hogue, S. and Zhang, C.X. and Tian, Y.P. and Guo, X.",
        TITLE = "Joint Co-Speech Gesture and Expressive Talking Face Generation Using
Diffusion with Adapters",
        BOOKTITLE = WACV25,
        YEAR = "2025",
        PAGES = "4163--4172",
        BIBSOURCE = "http://www.visionbib.com/bibliography/describe499.html#TT106519"}

@inproceedings{bb109847,
        AUTHOR = "Diao, X.J. and Cheng, M. and Barrios, W. and Jin, S.",
        TITLE = "{FT2TF}: First-Person Statement Text-to-Talking Face Generation",
        BOOKTITLE = WACV25,
        YEAR = "2025",
        PAGES = "4821--4830",
        BIBSOURCE = "http://www.visionbib.com/bibliography/describe499.html#TT106520"}

@inproceedings{bb109848,
        AUTHOR = "Ki, T. and Min, D. and Chae, G.",
        TITLE = "Learning to Generate Conditional Tri-plane for {3D}-aware Expression
Controllable Portrait Animation",
        BOOKTITLE = ECCV24,
        YEAR = "2024",
        PAGES = "I: 476--493",
        BIBSOURCE = "http://www.visionbib.com/bibliography/describe499.html#TT106521"}

@inproceedings{bb109849,
        AUTHOR = "Tian, L. and Wang, Q. and Zhang, B. and Bo, L.",
        TITLE = "{EMO}: Emote Portrait Alive Generating Expressive Portrait Videos with
{Audio2Video} Diffusion Model Under Weak Conditions",
        BOOKTITLE = ECCV24,
        YEAR = "2024",
        PAGES = "LXXXIII: 244--260",
        BIBSOURCE = "http://www.visionbib.com/bibliography/describe499.html#TT106522"}

@inproceedings{bb109850,
        AUTHOR = "Fan, X.Y. and Li, J.Q. and Lin, Z.Q. and Xiao, W.Y. and Yang, L.",
        TITLE = "{UniTalker}: Scaling up Audio-driven {3D} Facial Animation Through A
Unified Model",
        BOOKTITLE = ECCV24,
        YEAR = "2024",
        PAGES = "XLI: 204--221",
        BIBSOURCE = "http://www.visionbib.com/bibliography/describe499.html#TT106523"}

@inproceedings{bb109851,
        AUTHOR = "Deng, Y. and Wang, D. and Wang, B.Y.",
        TITLE = "{Portrait4D-V2}: Pseudo Multi-view Data Creates Better {4D} Head
Synthesizer",
        BOOKTITLE = ECCV24,
        YEAR = "2024",
        PAGES = "XVII: 316--333",
        BIBSOURCE = "http://www.visionbib.com/bibliography/describe499.html#TT106524"}

@inproceedings{bb109852,
        AUTHOR = "Xu, Z.H. and Gong, S.J. and Tang, J.P. and Liang, L.Y. and Huang, Y. and Li, H.J. and Huang, S.P.",
        TITLE = "{KMTalk}: Speech-driven {3D} Facial Animation with Key Motion Embedding",
        BOOKTITLE = ECCV24,
        YEAR = "2024",
        PAGES = "LVI: 236--253",
        BIBSOURCE = "http://www.visionbib.com/bibliography/describe499.html#TT106525"}

@inproceedings{bb109853,
        AUTHOR = "Nocentini, F. and Besnier, T. and Ferrari, C. and Arguillere, S. and Berretti, S. and Daoudi, M.",
        TITLE = "{ScanTalk}: {3D} Talking Heads from Unregistered Scans",
        BOOKTITLE = ECCV24,
        YEAR = "2024",
        PAGES = "XXIX: 19--36",
        BIBSOURCE = "http://www.visionbib.com/bibliography/describe499.html#TT106526"}

@inproceedings{bb109854,
        AUTHOR = "Prashnani, E. and Nagano, K. and de Mello, S. and Luebke, D. and Gallo, O.",
        TITLE = "Avatar Fingerprinting for Authorized Use of Synthetic Talking-head
Videos",
        BOOKTITLE = ECCV24,
        YEAR = "2024",
        PAGES = "XV: 209--228",
        BIBSOURCE = "http://www.visionbib.com/bibliography/describe499.html#TT106527"}

@inproceedings{bb109855,
        AUTHOR = "Li, D.Z. and Zhao, K. and Wang, W. and Ma, Y.F. and Peng, B. and Zhang, Y.Y. and Dong, J.",
        TITLE = "{S$^3$D-NeRF}: Single-shot Speech-driven Neural Radiance Field for High
Fidelity Talking Head Synthesis",
        BOOKTITLE = ECCV24,
        YEAR = "2024",
        PAGES = "X: 365--382",
        BIBSOURCE = "http://www.visionbib.com/bibliography/describe499.html#TT106528"}

@inproceedings{bb109856,
        AUTHOR = "Wu, X.Z. and Sun, Y.T. and Chen, H. and Zhou, H. and Wang, J.D. and Liu, Z.Z. and Qi, X.J.",
        TITLE = "{3D}-Aware Text-Driven Talking Avatar Generation",
        BOOKTITLE = ECCV24,
        YEAR = "2024",
        PAGES = "LXXXVIII: 416--433",
        BIBSOURCE = "http://www.visionbib.com/bibliography/describe499.html#TT106529"}

@inproceedings{bb109857,
        AUTHOR = "Zhang, W.X. and Zhu, C.G. and Gao, J.N. and Yan, Y.C. and Zhai, G.T. and Yang, X.K.",
        TITLE = "A Comparative Study of Perceptual Quality Metrics For Audio-Driven
Talking Head Videos",
        BOOKTITLE = ICIP24,
        YEAR = "2024",
        PAGES = "1218--1224",
        BIBSOURCE = "http://www.visionbib.com/bibliography/describe499.html#TT106530"}

@inproceedings{bb109858,
        AUTHOR = "Lei, H. and Bie, Z. and Jing, Z. and Bie, H.X.",
        TITLE = "Talking-Head Video Compression With Motion Semantic Enhancement Model",
        BOOKTITLE = ICIP24,
        YEAR = "2024",
        PAGES = "1980--1986",
        BIBSOURCE = "http://www.visionbib.com/bibliography/describe499.html#TT106531"}

@inproceedings{bb109859,
        AUTHOR = "Xing, Y.Z. and He, Y.Q. and Tian, Z. and Wang, X.T. and Chen, Q.F.",
        TITLE = "Seeing and Hearing: Open-domain Visual-Audio Generation with
Diffusion Latent Aligners",
        BOOKTITLE = CVPR24,
        YEAR = "2024",
        PAGES = "7151--7161",
        BIBSOURCE = "http://www.visionbib.com/bibliography/describe499.html#TT106532"}

@inproceedings{bb109860,
        AUTHOR = "Mughal, M.H. and Dabral, R. and Habibie, I. and Donatelli, L. and Habermann, M. and Theobalt, C.",
        TITLE = "{ConvoFusion}: Multi-Modal Conversational Diffusion for Co-Speech
Gesture Synthesis",
        BOOKTITLE = CVPR24,
        YEAR = "2024",
        PAGES = "1388--1398",
        BIBSOURCE = "http://www.visionbib.com/bibliography/describe499.html#TT106533"}

@inproceedings{bb109861,
        AUTHOR = "Mehta, S. and Deichler, A. and O'Regan, J. and Moell, B. and Beskow, J. and Henter, G.E. and Alexanderson, S.",
        TITLE = "Fake it to make it: Using synthetic data to remedy the data shortage
in joint multi-modal speech-and-gesture synthesis",
        BOOKTITLE = HUMOGen24,
        YEAR = "2024",
        PAGES = "1952--1964",
        BIBSOURCE = "http://www.visionbib.com/bibliography/describe499.html#TT106534"}

@inproceedings{bb109862,
        AUTHOR = "Zhang, Q. and Xiao, T. and Habeeb, H. and Laich, L. and Bouaziz, S. and Snape, P. and Zhang, W.J. and Cioffi, M. and Zhang, P.Z. and Pidlypenskyi, P. and Lin, W. and Ma, L. and Wang, M.J. and Li, K.P. and Long, C.J. and Song, S. and Prazak, M. and Sjoholm, A. and Deogade, A. and Lee, J. and Mangas, J.D. and Aubel, A.",
        TITLE = "{REFA}: Real-time Egocentric Facial Animations for Virtual Reality",
        BOOKTITLE = ABAW24,
        YEAR = "2024",
        PAGES = "4793--4802",
        BIBSOURCE = "http://www.visionbib.com/bibliography/describe499.html#TT106535"}

@inproceedings{bb109863,
        AUTHOR = "Yang, K.D. and Ranjan, A. and Chang, J.H.R. and Vemulapalli, R. and Tuzel, O.",
        TITLE = "Probabilistic Speech-Driven {3D} Facial Motion Synthesis: New
Benchmarks, Methods, and Applications",
        BOOKTITLE = CVPR24,
        YEAR = "2024",
        PAGES = "27284--27293",
        BIBSOURCE = "http://www.visionbib.com/bibliography/describe499.html#TT106536"}

@inproceedings{bb109864,
        AUTHOR = "Liu, Y.F. and Cao, Q. and Wen, Y.D. and Jiang, H. and Ding, C.X.",
        TITLE = "Towards Variable and Coordinated Holistic Co-Speech Motion Generation",
        BOOKTITLE = CVPR24,
        YEAR = "2024",
        PAGES = "1566--1576",
        BIBSOURCE = "http://www.visionbib.com/bibliography/describe499.html#TT106537"}

@inproceedings{bb109865,
        AUTHOR = "Ng, E. and Romero, J. and Bagautdinov, T. and Bai, S.J. and Darrell, T.J. and Kanazawa, A. and Richard, A.",
        TITLE = "From Audio to Photoreal Embodiment:
Synthesizing Humans in Conversations",
        BOOKTITLE = CVPR24,
        YEAR = "2024",
        PAGES = "1001--1010",
        BIBSOURCE = "http://www.visionbib.com/bibliography/describe499.html#TT106538"}

@inproceedings{bb109866,
        AUTHOR = "Zhang, Z.C. and Zheng, R. and Li, B. and Han, C.Y. and Li, T.Q. and Wang, M. and Guo, T.D. and Chen, J.D. and Liu, Z.W. and Yang, M.",
        TITLE = "Learning Dynamic Tetrahedra for High-Quality Talking Head Synthesis",
        BOOKTITLE = CVPR24,
        YEAR = "2024",
        PAGES = "5209--5219",
        BIBSOURCE = "http://www.visionbib.com/bibliography/describe499.html#TT106539"}

@inproceedings{bb109867,
        AUTHOR = "Jang, Y.J. and Kim, J.H. and Ahn, J. and Kwak, D. and Yang, H.S. and Ju, Y.C. and Kim, I.H. and Kim, B.Y. and Chung, J.S.",
        TITLE = "Faces that Speak: Jointly Synthesising Talking Face and Speech from
Text",
        BOOKTITLE = CVPR24,
        YEAR = "2024",
        PAGES = "8818--8828",
        BIBSOURCE = "http://www.visionbib.com/bibliography/describe499.html#TT106540"}

@inproceedings{bb109868,
        AUTHOR = "Aneja, S. and Thies, J. and Dai, A. and Niessner, M.",
        TITLE = "{FaceTalk}: Audio-Driven Motion Diffusion for Neural Parametric Head
Models",
        BOOKTITLE = CVPR24,
        YEAR = "2024",
        PAGES = "21263--21273",
        BIBSOURCE = "http://www.visionbib.com/bibliography/describe499.html#TT106541"}

@inproceedings{bb109869,
        AUTHOR = "Hogue, S. and Zhang, C.X. and Daruger, H. and Tian, Y.P. and Guo, X.H.",
        TITLE = "{DiffTED}: One-shot Audio-driven {TED} Talk Video Generation with
Diffusion-based Co-speech Gestures",
        BOOKTITLE = HUMOGen24,
        YEAR = "2024",
        PAGES = "1922--1931",
        BIBSOURCE = "http://www.visionbib.com/bibliography/describe499.html#TT106542"}

@inproceedings{bb109870,
        AUTHOR = "Yaman, D. and Eyiokur, F.I. and Barmann, L. and Akti, S. and Ekenel, H.K. and Waibel, A.",
        TITLE = "Audio-Visual Speech Representation Expert for Enhanced Talking Face
Video Generation and Evaluation",
        BOOKTITLE = NTIRE24,
        YEAR = "2024",
        PAGES = "6003--6013",
        BIBSOURCE = "http://www.visionbib.com/bibliography/describe499.html#TT106543"}

@inproceedings{bb109871,
        AUTHOR = "Pham, T.T. and Do, T. and Le, N. and Le, N. and Nguyen, H. and Tjiputra, E. and Tran, Q. and Nguyen, A.",
        TITLE = "Style Transfer for {2D} Talking Head Generation",
        BOOKTITLE = GCV24,
        YEAR = "2024",
        PAGES = "7500--7509",
        BIBSOURCE = "http://www.visionbib.com/bibliography/describe499.html#TT106544"}

@inproceedings{bb109872,
        AUTHOR = "Xu, C. and Liu, Y. and Xing, J.Z. and Wang, W. and Sun, M.Z. and Dan, J. and Huang, T.X. and Li, S.Y. and Cheng, Z.Q. and Tai, Y. and Sun, B.",
        TITLE = "{FaceChain-ImagineID}: Freely Crafting High-Fidelity Diverse Talking
Faces from Disentangled Audio",
        BOOKTITLE = CVPR24,
        YEAR = "2024",
        PAGES = "1292--1302",
        BIBSOURCE = "http://www.visionbib.com/bibliography/describe499.html#TT106545"}

@inproceedings{bb109873,
        AUTHOR = "Stypulkowski, M. and Vougioukas, K. and He, S. and Zieba, M. and Petridis, S. and Pantic, M.",
        TITLE = "Diffused Heads: Diffusion Models Beat {GANs} on Talking-Face Generation",
        BOOKTITLE = WACV24,
        YEAR = "2024",
        PAGES = "5089--5098",
        BIBSOURCE = "http://www.visionbib.com/bibliography/describe499.html#TT106546"}

@inproceedings{bb109874,
        AUTHOR = "Ni, H. M. and Liu, J. C. and Xue, Y. and Huang, S. X.",
        TITLE = "{3D}-Aware Talking-Head Video Motion Transfer",
        BOOKTITLE = WACV24,
        YEAR = "2024",
        PAGES = "4942--4952",
        BIBSOURCE = "http://www.visionbib.com/bibliography/describe499.html#TT106547"}

@inproceedings{bb109875,
        AUTHOR = "Zhao, L. and Li, H. X. and Ning, X. F. and Jiang, X.",
        TITLE = "{THInImg}: Cross-modal Steganography for Presenting Talking Heads in Images",
        BOOKTITLE = WACV24,
        YEAR = "2024",
        PAGES = "5541--5550",
        BIBSOURCE = "http://www.visionbib.com/bibliography/describe499.html#TT106548"}

@inproceedings{bb109876,
        AUTHOR = "Liu, Y. F. and Lin, L. J. and Yu, F. and Zhou, C. Y. and Li, Y.",
        TITLE = "{MODA}: Mapping-Once Audio-driven Portrait Animation with Dual Attentions",
        BOOKTITLE = ICCV23,
        YEAR = "2023",
        PAGES = "22963--22972",
        BIBSOURCE = "http://www.visionbib.com/bibliography/describe499.html#TT106549"}

@inproceedings{bb109877,
        AUTHOR = "Zheng, J. L. and Jang, Y. and Papaioannou, A. and Kampouris, C. and Potamias, R. A. and Papantoniou, F. P. and Galanakis, E. and Leonardis, A. and Zafeiriou, S.",
        TITLE = "{ILSH}: The {Imperial} Light-Stage Head Dataset for Human Head View Synthesis",
        BOOKTITLE = RHWC23,
        YEAR = "2023",
        PAGES = "1104--1112",
        BIBSOURCE = "http://www.visionbib.com/bibliography/describe499.html#TT106550"}

@inproceedings{bb109878,
        AUTHOR = "Muaz, U. and Jang, W. and Tripathi, R. and Mani, S. and Ouyang, W. B. and Gadde, R. T. and Gecer, B. and Elizondo, S. and Madad, R. and Nair, N.",
        TITLE = "{SIDGAN}: High-Resolution Dubbed Video Generation via Shift-Invariant Learning",
        BOOKTITLE = ICCV23,
        YEAR = "2023",
        PAGES = "7799--7808",
        BIBSOURCE = "http://www.visionbib.com/bibliography/describe499.html#TT106551"}

@inproceedings{bb109879,
        AUTHOR = "Li, W. C. and Zhang, L. H. and Wang, D. and Zhao, B. and Wang, Z. G. and Chen, M. and Zhang, B. and Wang, Z. J. and Bo, L. and Li, X. L.",
        TITLE = "One-Shot High-Fidelity Talking-Head Synthesis with Deformable Neural Radiance Field",
        BOOKTITLE = CVPR23,
        YEAR = "2023",
        PAGES = "17969--17978",
        BIBSOURCE = "http://www.visionbib.com/bibliography/describe499.html#TT106552"}

@inproceedings{bb109880,
        AUTHOR = "Jeong, Y. J. and Ryoo, W. and Lee, S. H. and Seo, D. and Byeon, W. and Kim, S. and Kim, J.",
        TITLE = "The Power of Sound ({TPoS}): Audio Reactive Video Generation with {Stable Diffusion}",
        BOOKTITLE = ICCV23,
        YEAR = "2023",
        PAGES = "7788--7798",
        BIBSOURCE = "http://www.visionbib.com/bibliography/describe499.html#TT106553"}

@inproceedings{bb109881,
        AUTHOR = "Gururani, S. and Mallya, A. and Wang, T. C. and Valle, R. and Liu, M. Y.",
        TITLE = "{SPACE}: Speech-driven Portrait Animation with Controllable Expression",
        BOOKTITLE = ICCV23,
        YEAR = "2023",
        PAGES = "20857--20866",
        BIBSOURCE = "http://www.visionbib.com/bibliography/describe499.html#TT106554"}

@inproceedings{bb109882,
        AUTHOR = "Thambiraja, B. and Habibie, I. and Aliakbarian, S. and Cosker, D. and Theobalt, C. and Thies, J.",
        TITLE = "Imitator: Personalized Speech-driven {3D} Facial Animation",
        BOOKTITLE = ICCV23,
        YEAR = "2023",
        PAGES = "20564--20574",
        BIBSOURCE = "http://www.visionbib.com/bibliography/describe499.html#TT106555"}

@inproceedings{bb109883,
        AUTHOR = "Yang, P. and Wei, H. and Zhong, Y. C. and Wang, Z. S.",
        TITLE = "Semi-supervised Speech-driven {3D} Facial Animation via Cross-modal Encoding",
        BOOKTITLE = ICCV23,
        YEAR = "2023",
        PAGES = "20975--20984",
        BIBSOURCE = "http://www.visionbib.com/bibliography/describe499.html#TT106556"}

@inproceedings{bb109884,
        AUTHOR = "Wu, X. Z. and Hu, P. F. and Wu, Y. and Lyu, X. Y. and Cao, Y. P. and Shan, Y. and Yang, W. M. and Sun, Z. Q. and Qi, X. J.",
        TITLE = "{Speech2Lip}: High-fidelity Speech to Lip Generation by Learning from a Short Video",
        BOOKTITLE = ICCV23,
        YEAR = "2023",
        PAGES = "22111--22120",
        BIBSOURCE = "http://www.visionbib.com/bibliography/describe499.html#TT106557"}

@inproceedings{bb109885,
        AUTHOR = "He, S. and He, H. N. and Yang, S. and Wu, X. Y. and Xia, P. C. and Yin, B. and Liu, C. and Dai, L. R. and Xu, C.",
        TITLE = "{Speech4Mesh}: Speech-Assisted Monocular {3D} Facial Reconstruction for Speech-Driven {3D} Facial Animation",
        BOOKTITLE = ICCV23,
        YEAR = "2023",
        PAGES = "14146--14156",
        BIBSOURCE = "http://www.visionbib.com/bibliography/describe499.html#TT106558"}

@inproceedings{bb109886,
        AUTHOR = "Choi, J. and Hong, J. and Ro, Y. M.",
        TITLE = "{DiffV2S}: Diffusion-based Video-to-Speech Synthesis with Vision-guided Speaker Embedding",
        BOOKTITLE = ICCV23,
        YEAR = "2023",
        PAGES = "7778--7787",
        BIBSOURCE = "http://www.visionbib.com/bibliography/describe499.html#TT106559"}

@inproceedings{bb109887,
        AUTHOR = "Gong, Y. and Zhang, Y. and Cun, X. D. and Yin, F. and Fan, Y. B. and Wang, X. and Wu, B. Y. and Yang, Y.",
        TITLE = "{ToonTalker}: Cross-Domain Face Reenactment",
        BOOKTITLE = ICCV23,
        YEAR = "2023",
        PAGES = "7656--7666",
        BIBSOURCE = "http://www.visionbib.com/bibliography/describe499.html#TT106560"}

@inproceedings{bb109888,
        AUTHOR = "Yu, Z. T. and Yin, Z. X. and Zhou, D. Y. and Wang, D. and Wong, F. and Wang, B. Y.",
        TITLE = "Talking Head Generation with Probabilistic Audio-to-Visual Diffusion Priors",
        BOOKTITLE = ICCV23,
        YEAR = "2023",
        PAGES = "7611--7621",
        BIBSOURCE = "http://www.visionbib.com/bibliography/describe499.html#TT106561"}

@inproceedings{bb109889,
        AUTHOR = "Oorloff, T. and Yacoob, Y.",
        TITLE = "Expressive Talking Head Video Encoding in {StyleGAN2} Latent Space",
        BOOKTITLE = CVEU23,
        YEAR = "2023",
        PAGES = "2990--2999",
        BIBSOURCE = "http://www.visionbib.com/bibliography/describe499.html#TT106562"}

@inproceedings{bb109890,
        AUTHOR = "Chen, L. Y. and Wu, Z. Y. and Li, R. and Bao, W. H. and Ling, J. and Tan, X. and Zhao, S.",
        TITLE = "{VAST}: Vivify Your Talking Avatar via Zero-Shot Expressive Facial Style Transfer",
        BOOKTITLE = CVEU23,
        YEAR = "2023",
        PAGES = "2969--2979",
        BIBSOURCE = "http://www.visionbib.com/bibliography/describe499.html#TT106563"}

@inproceedings{bb109891,
        AUTHOR = "Hong, F. T. and Xu, D.",
        TITLE = "Implicit Identity Representation Conditioned Memory Compensation Network for Talking Head Video Generation",
        BOOKTITLE = ICCV23,
        YEAR = "2023",
        PAGES = "23005--23015",
        BIBSOURCE = "http://www.visionbib.com/bibliography/describe499.html#TT106564"}

@inproceedings{bb109892,
        AUTHOR = "Nocentini, F. and Ferrari, C. and Berretti, S.",
        TITLE = "Learning Landmarks Motion from Speech for Speaker-agnostic {3D} Talking Heads Generation",
        BOOKTITLE = CIAP23,
        YEAR = "2023",
        PAGES = "I:340--351",
        BIBSOURCE = "http://www.visionbib.com/bibliography/describe499.html#TT106565"}

@inproceedings{bb109893,
        AUTHOR = "Wang, Q. and Li, D. and Liao, L. and Song, H. and Li, W. and Xiao, J.",
        TITLE = "{ASVFI}: Audio-Driven Speaker Video Frame Interpolation",
        BOOKTITLE = ICIP23,
        YEAR = "2023",
        PAGES = "3200--3204",
        BIBSOURCE = "http://www.visionbib.com/bibliography/describe499.html#TT106566"}

@inproceedings{bb109894,
        AUTHOR = "Zeng, B. and Liu, X. H. and Gao, S. C. and Liu, B. and Li, H. and Liu, J. Z. and Zhang, B. C.",
        TITLE = "Face Animation with an Attribute-Guided Diffusion Model",
        BOOKTITLE = GCV23,
        YEAR = "2023",
        PAGES = "628--637",
        BIBSOURCE = "http://www.visionbib.com/bibliography/describe499.html#TT106567"}

@inproceedings{bb109895,
        AUTHOR = "Shen, S. and Zhao, W. L. and Meng, Z. and Li, W. and Zhu, Z. and Zhou, J. and Lu, J. W.",
        TITLE = "{DiffTalk}: Crafting Diffusion Models for Generalized Audio-Driven Portraits Animation",
        BOOKTITLE = CVPR23,
        YEAR = "2023",
        PAGES = "1982--1991",
        BIBSOURCE = "http://www.visionbib.com/bibliography/describe499.html#TT106568"}

@inproceedings{bb109896,
        AUTHOR = "Zhang, B. and Qi, C. Y. and Zhang, P. and Zhang, B. and Wu, H. T. and Chen, D. and Chen, Q. F. and Wang, Y. and Wen, F.",
        TITLE = "{MetaPortrait}: Identity-Preserving Talking Head Generation with Fast Personalized Adaptation",
        BOOKTITLE = CVPR23,
        YEAR = "2023",
        PAGES = "22096--22105",
        BIBSOURCE = "http://www.visionbib.com/bibliography/describe499.html#TT106569"}

@inproceedings{bb109897,
        AUTHOR = "Vahdati, D. S. and Nguyen, T. D. and Stamm, M. C.",
        TITLE = "Defending Low-Bandwidth Talking Head Videoconferencing Systems From Real-Time Puppeteering Attacks",
        BOOKTITLE = WMF23,
        YEAR = "2023",
        PAGES = "983--992",
        BIBSOURCE = "http://www.visionbib.com/bibliography/describe499.html#TT106570"}

@inproceedings{bb109898,
        AUTHOR = "Wang, D. and Deng, Y. and Yin, Z. X. and Shum, H. Y. and Wang, B. Y.",
        TITLE = "Progressive Disentangled Representation Learning for Fine-Grained Controllable Talking Head Synthesis",
        BOOKTITLE = CVPR23,
        YEAR = "2023",
        PAGES = "17979--17989",
        BIBSOURCE = "http://www.visionbib.com/bibliography/describe499.html#TT106571"}

@inproceedings{bb109899,
        AUTHOR = "Wang, J. Y. and Zhao, K. and Zhang, S. W. and Zhang, Y. Y. and Shen, Y. J. and Zhao, D. L. and Zhou, J.",
        TITLE = "{LipFormer}: High-fidelity and Generalizable Talking Face Generation with A Pre-learned Facial Codebook",
        BOOKTITLE = CVPR23,
        YEAR = "2023",
        PAGES = "13844--13853",
        BIBSOURCE = "http://www.visionbib.com/bibliography/describe499.html#TT106572"}

Last update:Feb 26, 2026 at 10:58:24