@article{bb375600,
        AUTHOR = "Wang, H. and Yang, Y. F. and Liu, S. and Li, J. and Meng, L. and Liu, Y. Q. and Zhou, J. M. and Sun, H. Q. and Lu, Y. and Qin, Y.",
        TITLE = "{StreamMel}: Real-Time Zero-Shot Text-to-Speech Via Interleaved
Continuous Autoregressive Modeling",
        JOURNAL = SPLetters,
        VOLUME = "32",
        YEAR = "2025",
        PAGES = "3530--3534",
        BIBSOURCE = "http://www.visionbib.com/bibliography/other1024ss1.html#TT369703"}

@article{bb375601,
        AUTHOR = "Li, L. and Cong, G. X. and Qi, Y. K. and Zha, Z. J. and Wu, Q. and Sheng, Q. Z. and Huang, Q. M. and Yang, M. H.",
        TITLE = "Dubbing Movies via Hierarchical Phoneme Modeling and Acoustic
Diffusion Denoising",
        JOURNAL = PAMI,
        VOLUME = "47",
        YEAR = "2025",
        NUMBER = "11",
        MONTH = nov,
        PAGES = "10361--10377",
        BIBSOURCE = "http://www.visionbib.com/bibliography/other1024ss1.html#TT369704"}

@article{bb375602,
        AUTHOR = "Gao, X. X. and Zhang, H. and Chen, N. F.",
        TITLE = "Prompt-Unseen-Emotion: Mixed Emotional Speech Synthesis With
Prompt-{LLM} Contextual Knowledge",
        JOURNAL = SPLetters,
        VOLUME = "32",
        YEAR = "2025",
        PAGES = "4259--4263",
        BIBSOURCE = "http://www.visionbib.com/bibliography/other1024ss1.html#TT369705"}

@article{bb375603,
        AUTHOR = "Lee, K. and Hong, S. and Chun, S. Y.",
        TITLE = "Robust watermarks for audio diffusion models by quadrature amplitude
modulation",
        JOURNAL = PRL,
        VOLUME = "198",
        YEAR = "2025",
        PAGES = "22--28",
        BIBSOURCE = "http://www.visionbib.com/bibliography/other1024ss1.html#TT369706"}

@article{bb375604,
        AUTHOR = "Inoue, S. and Zhou, K. and Wang, S. and Li, H. Z.",
        TITLE = "Hierarchical Control of Emotion Rendering in Speech Synthesis",
        JOURNAL = AffCom,
        VOLUME = "16",
        YEAR = "2025",
        NUMBER = "4",
        MONTH = oct,
        PAGES = "3316--3328",
        BIBSOURCE = "http://www.visionbib.com/bibliography/other1024ss1.html#TT369707"}

@article{bb375605,
        AUTHOR = "Cha, H. and Um, S. and Kim, M. and Kim, C. and Lee, S. and Kang, H. G.",
        TITLE = "Content-Aware Style Augmentation for Zero-Shot Voice Conversion With
Short Target Speech",
        JOURNAL = SPLetters,
        VOLUME = "33",
        YEAR = "2026",
        PAGES = "66--70",
        BIBSOURCE = "http://www.visionbib.com/bibliography/other1024ss1.html#TT369708"}

@inproceedings{bb375606,
        AUTHOR = "Liu, J. and Geddes, J. and Guo, Z. Y. and Jiang, H. and Nandwana, M. K.",
        TITLE = "Smooth Cache: A Universal Inference Acceleration Technique for
Diffusion Transformers",
        BOOKTITLE = LargeVM25,
        YEAR = "2025",
        PAGES = "3220--3229",
        BIBSOURCE = "http://www.visionbib.com/bibliography/other1024ss1.html#TT369709"}

@inproceedings{bb375607,
        AUTHOR = "Kushwaha, S. S. and Tian, Y. P.",
        TITLE = "{VinTAGe}: Joint Video and Text Conditioning for Holistic Audio
Generation",
        BOOKTITLE = CVPR25,
        YEAR = "2025",
        PAGES = "13529--13539",
        BIBSOURCE = "http://www.visionbib.com/bibliography/other1024ss1.html#TT369710"}

@inproceedings{bb375608,
        AUTHOR = "Kim, J. H. and Choi, J. and Kim, J. H. and Jung, C. and Chung, J. S.",
        TITLE = "From Faces to Voices: Learning Hierarchical Representations for
High-quality Video-to-Speech",
        BOOKTITLE = CVPR25,
        YEAR = "2025",
        PAGES = "15874--15884",
        BIBSOURCE = "http://www.visionbib.com/bibliography/other1024ss1.html#TT369711"}

@inproceedings{bb375609,
        AUTHOR = "Cong, G. X. and Pan, J. and Li, L. and Qi, Y. K. and Peng, Y. X. and van den Hengel, A. J. and Yang, J. and Huang, Q. M.",
        TITLE = "{EmoDubber}: Towards High Quality and Emotion Controllable Movie
Dubbing",
        BOOKTITLE = CVPR25,
        YEAR = "2025",
        PAGES = "15863--15873",
        BIBSOURCE = "http://www.visionbib.com/bibliography/other1024ss1.html#TT369712"}

@inproceedings{bb375610,
        AUTHOR = "Zhang, Z. D. and Li, L. and Yan, C. G. and Liu, C. S. and van den Hengel, A. J. and Qi, Y. K.",
        TITLE = "Prosody-Enhanced Acoustic Pre-training and Acoustic-Disentangled
Prosody Adapting for Movie Dubbing",
        BOOKTITLE = CVPR25,
        YEAR = "2025",
        PAGES = "172--182",
        BIBSOURCE = "http://www.visionbib.com/bibliography/other1024ss1.html#TT369713"}

@inproceedings{bb375611,
        AUTHOR = "Rai, A. and Sridhar, S.",
        TITLE = "{EgoSonics}: Generating Synchronized Audio for Silent Egocentric Videos",
        BOOKTITLE = WACV25,
        YEAR = "2025",
        PAGES = "4935--4946",
        BIBSOURCE = "http://www.visionbib.com/bibliography/other1024ss1.html#TT369714"}

@inproceedings{bb375612,
        AUTHOR = "Yadav, A. K. S. and Bhagtani, K. and Salvi, D. and Bestagini, P. and Delp, E. J.",
        TITLE = "{FairSSD}: Understanding Bias in Synthetic Speech Detectors",
        BOOKTITLE = WMF24,
        YEAR = "2024",
        PAGES = "4418--4428",
        BIBSOURCE = "http://www.visionbib.com/bibliography/other1024ss1.html#TT369715"}

@inproceedings{bb375613,
        AUTHOR = "Cuccovillo, L. and Gerhardt, M. and Aichroth, P.",
        TITLE = "Audio Transformer for Synthetic Speech Detection via Multi-Formant
Analysis",
        BOOKTITLE = WMF24,
        YEAR = "2024",
        PAGES = "4409--4417",
        BIBSOURCE = "http://www.visionbib.com/bibliography/other1024ss1.html#TT369716"}

@inproceedings{bb375614,
        AUTHOR = "Cong, G. X. and Li, L. and Qi, Y. K. and Zha, Z. J. and Wu, Q. and Wang, W. Y. and Jiang, B. and Yang, M. H. and Huang, Q. M.",
        TITLE = "Learning to Dub Movies via Hierarchical Prosody Models",
        BOOKTITLE = CVPR23,
        YEAR = "2023",
        PAGES = "14687--14697",
        BIBSOURCE = "http://www.visionbib.com/bibliography/other1024ss1.html#TT369717"}

@inproceedings{bb375615,
        AUTHOR = "Hsu, W. N. and Remez, T. and Shi, B. and Donley, J. and Adi, Y.",
        TITLE = "{ReVISE}: Self-Supervised Speech Resynthesis with Visual Input for
Universal and Generalized Speech Regeneration",
        BOOKTITLE = CVPR23,
        YEAR = "2023",
        PAGES = "18796--18806",
        BIBSOURCE = "http://www.visionbib.com/bibliography/other1024ss1.html#TT369718"}

@inproceedings{bb375616,
        AUTHOR = "Sun, C. Z. and Jia, S. and Hou, S. W. and Lyu, S. W.",
        TITLE = "{AI}-Synthesized Voice Detection Using Neural Vocoder Artifacts",
        BOOKTITLE = WMF23,
        YEAR = "2023",
        PAGES = "904--912",
        BIBSOURCE = "http://www.visionbib.com/bibliography/other1024ss1.html#TT369719"}

@inproceedings{bb375617,
        AUTHOR = "Noufi, C. and May, L. and Berger, J.",
        TITLE = "The Role of Vocal Persona in Natural and Synthesized Speech",
        BOOKTITLE = FG23,
        YEAR = "2023",
        PAGES = "1--4",
        BIBSOURCE = "http://www.visionbib.com/bibliography/other1024ss1.html#TT369720"}

@inproceedings{bb375618,
        AUTHOR = "Hwang, I. S. and Lee, S. H. and Lee, S. W.",
        TITLE = "{StyleVC}: Non-Parallel Voice Conversion with Adversarial Style
Generalization",
        BOOKTITLE = "ICPR22",
        YEAR = "2022",
        PAGES = "23--30",
        BIBSOURCE = "http://www.visionbib.com/bibliography/other1024ss1.html#TT369721"}

@inproceedings{bb375619,
        AUTHOR = "Wang, W. B. and Song, Y. and Jha, S.",
        TITLE = "Autolv: Automatic Lecture Video Generator",
        BOOKTITLE = ICIP22,
        YEAR = "2022",
        PAGES = "1086--1090",
        BIBSOURCE = "http://www.visionbib.com/bibliography/other1024ss1.html#TT369722"}

@inproceedings{bb375620,
        AUTHOR = "Borzi, S. and Giudice, O. and Stanco, F. and Allegra, D.",
        TITLE = "Is synthetic voice detection research going into the right direction?",
        BOOKTITLE = WMF22,
        YEAR = "2022",
        PAGES = "71--80",
        BIBSOURCE = "http://www.visionbib.com/bibliography/other1024ss1.html#TT369723"}

@inproceedings{bb375621,
        AUTHOR = "Hassid, M. and Ramanovich, M. T. and Shillingford, B. and Wang, M. and Jia, Y. and Remez, T.",
        TITLE = "More than Words: In-the-Wild Visually-Driven Prosody for
Text-to-Speech",
        BOOKTITLE = CVPR22,
        YEAR = "2022",
        PAGES = "10577--10587",
        BIBSOURCE = "http://www.visionbib.com/bibliography/other1024ss1.html#TT369724"}

@inproceedings{bb375622,
        AUTHOR = "Kwak, I. Y. and Kwag, S. and Lee, J. and Huh, J. H. and Lee, C. H. and Jeon, Y. B. and Hwang, J. H. and Yoon, J. W.",
        TITLE = "{ResMax}: Detecting Voice Spoofing Attacks with Residual Network and
Max Feature Map",
        BOOKTITLE = ICPR21,
        YEAR = "2021",
        PAGES = "4837--4844",
        BIBSOURCE = "http://www.visionbib.com/bibliography/other1024ss1.html#TT369725"}

@inproceedings{bb375623,
        AUTHOR = "Wang, D. H. and Wang, R. and Dong, L. and Yan, D. and Ren, Y. M.",
        TITLE = "Efficient Generation of Speech Adversarial Examples with Generative
Model",
        BOOKTITLE = IWDW20,
        YEAR = "2020",
        PAGES = "251--264",
        BIBSOURCE = "http://www.visionbib.com/bibliography/other1024ss1.html#TT369726"}

@inproceedings{bb375624,
        AUTHOR = "Zhou, H. and Liu, Z. and Xu, X. and Luo, P. and Wang, X.",
        TITLE = "Vision-Infused Deep Audio Inpainting",
        BOOKTITLE = ICCV19,
        YEAR = "2019",
        PAGES = "283--292",
        BIBSOURCE = "http://www.visionbib.com/bibliography/other1024ss1.html#TT369727"}

@inproceedings{bb375625,
        AUTHOR = "Bailer, W. and Wijnants, M. and Lievens, H. and Claes, S.",
        TITLE = "Multimedia Analytics Challenges and Opportunities for Creating
Interactive Radio Content",
        BOOKTITLE = MMMod20,
        VOLUME = "II",
        YEAR = "2020",
        PAGES = "375--387",
        BIBSOURCE = "http://www.visionbib.com/bibliography/other1024ss1.html#TT369728"}

@inproceedings{bb375626,
        AUTHOR = "Huang, T. and Wang, H. X. and Chen, Y. and He, P. S.",
        TITLE = "{GRU-SVM} Model for Synthetic Speech Detection",
        BOOKTITLE = IWDW19,
        YEAR = "2019",
        PAGES = "115--125",
        BIBSOURCE = "http://www.visionbib.com/bibliography/other1024ss1.html#TT369729"}

@inproceedings{bb375627,
        AUTHOR = "Wong, A. and Xu, A. and Dudek, G.",
        TITLE = "Investigating Trust Factors in Human-Robot Shared Control:
Implicit Gender Bias Around Robot Voice",
        BOOKTITLE = CRV19,
        YEAR = "2019",
        PAGES = "195--200",
        BIBSOURCE = "http://www.visionbib.com/bibliography/other1024ss1.html#TT369730"}

@inproceedings{bb375628,
        AUTHOR = "Xiao, L. and Wang, Z.",
        TITLE = "Dense Convolutional Recurrent Neural Network for Generalized Speech
Animation",
        BOOKTITLE = ICPR18,
        YEAR = "2018",
        PAGES = "633--638",
        BIBSOURCE = "http://www.visionbib.com/bibliography/other1024ss1.html#TT369731"}

@inproceedings{bb375629,
        AUTHOR = "Shah, N. J. and Patil, H. A.",
        TITLE = "Analysis of Features and Metrics for Alignment in Text-Dependent Voice
Conversion",
        BOOKTITLE = PReMI17,
        YEAR = "2017",
        PAGES = "299--307",
        BIBSOURCE = "http://www.visionbib.com/bibliography/other1024ss1.html#TT369732"}

@inproceedings{bb375630,
        AUTHOR = "Rybarova, R. and Drozd, I. and Rozinaj, G.",
        TITLE = "{GUI} for interactive speech synthesis",
        BOOKTITLE = WSSIP16,
        YEAR = "2016",
        PAGES = "1--4",
        BIBSOURCE = "http://www.visionbib.com/bibliography/other1024ss1.html#TT369733"}

@inproceedings{bb375631,
        AUTHOR = "Coto Jimenez, M. and Goddard Close, J.",
        TITLE = "{LSTM} Deep Neural Networks Postfiltering for Improving the Quality of
Synthetic Voices",
        BOOKTITLE = MCPR16,
        YEAR = "2016",
        PAGES = "280--289",
        BIBSOURCE = "http://www.visionbib.com/bibliography/other1024ss1.html#TT369734"}

@inproceedings{bb375632,
        AUTHOR = "Vasek, M. and Rozinaj, G. and Rybarova, R.",
        TITLE = "Letter-To-Sound conversion for speech synthesizer",
        BOOKTITLE = WSSIP16,
        YEAR = "2016",
        PAGES = "1--4",
        BIBSOURCE = "http://www.visionbib.com/bibliography/other1024ss1.html#TT369735"}

@inproceedings{bb375633,
        AUTHOR = "Rybarova, R. and del Corral, G. and Rozinaj, G.",
        TITLE = "Diphone {Spanish} text-to-speech synthesizer",
        BOOKTITLE = WSSIP15,
        YEAR = "2015",
        PAGES = "121--124",
        BIBSOURCE = "http://www.visionbib.com/bibliography/other1024ss1.html#TT369736"}

@inproceedings{bb375634,
        AUTHOR = "Verma, R. and Sarkar, P. and Rao, K. S.",
        TITLE = "Conversion of neutral speech to storytelling style speech",
        BOOKTITLE = ICAPR15,
        YEAR = "2015",
        PAGES = "1--6",
        BIBSOURCE = "http://www.visionbib.com/bibliography/other1024ss1.html#TT369737"}

@inproceedings{bb375635,
        AUTHOR = "Narendra, N. P. and Rao, K. S.",
        TITLE = "Optimal residual frame based source modeling for {HMM}-based speech
synthesis",
        BOOKTITLE = ICAPR15,
        YEAR = "2015",
        PAGES = "1--5",
        BIBSOURCE = "http://www.visionbib.com/bibliography/other1024ss1.html#TT369738"}

@inproceedings{bb375636,
        AUTHOR = "Wang, Y. and Tao, J. H. and Yang, M. H. and Li, Y.",
        TITLE = "Extended Decision Tree with or Relationship for {HMM}-Based Speech
Synthesis",
        BOOKTITLE = ACPR13,
        YEAR = "2013",
        PAGES = "225--229",
        BIBSOURCE = "http://www.visionbib.com/bibliography/other1024ss1.html#TT369739"}

@inproceedings{bb375637,
        AUTHOR = "Gao, L. and Yu, H. Z. and Zhang, J. H. and Fang, H. P.",
        TITLE = "Research on {HMM}\_based speech synthesis for {Lhasa} dialect",
        BOOKTITLE = IASP11,
        YEAR = "2011",
        PAGES = "429--433",
        BIBSOURCE = "http://www.visionbib.com/bibliography/other1024ss1.html#TT369740"}

@inproceedings{bb375638,
        AUTHOR = "Chakraborty, R. and Garain, U.",
        TITLE = "Role of Synthetically Generated Samples on Speech Recognition in a
Resource-Scarce Language",
        BOOKTITLE = ICPR10,
        YEAR = "2010",
        PAGES = "1618--1621",
        BIBSOURCE = "http://www.visionbib.com/bibliography/other1024ss1.html#TT369741"}

@inproceedings{bb375639,
        AUTHOR = "Rao, K. S. and Maity, S. and Taru, A. and Koolagudi, S. G.",
        TITLE = "Unit Selection Using Linguistic, Prosodic and Spectral Distance for
Developing Text-to-Speech System in {Hindi}",
        BOOKTITLE = PReMI09,
        YEAR = "2009",
        PAGES = "531--536",
        BIBSOURCE = "http://www.visionbib.com/bibliography/other1024ss1.html#TT369742"}

@inproceedings{bb375640,
        AUTHOR = "Bahrampour, A. and Barkhoda, W. and Azami, B. Z.",
        TITLE = "Implementation of Three Text to Speech Systems for {Kurdish} Language",
        BOOKTITLE = CIARP09,
        YEAR = "2009",
        PAGES = "321--328",
        BIBSOURCE = "http://www.visionbib.com/bibliography/other1024ss1.html#TT369743"}

@inproceedings{bb375641,
        AUTHOR = "Shirbahadurkar, S. D. and Bormane, D. S.",
        TITLE = "Marathi Language Speech Synthesizer Using Concatenative Synthesis
Strategy (Spoken in {Maharashtra}, {India})",
        BOOKTITLE = ICMV09,
        YEAR = "2009",
        PAGES = "181--185",
        BIBSOURCE = "http://www.visionbib.com/bibliography/other1024ss1.html#TT369744"}

@inproceedings{bb375642,
        AUTHOR = "Tuckova, J. and Holub, J. and Dubeda, T.",
        TITLE = "Technical and Phonetic Aspects of Speech Quality Assessment:
The Case of Prosody Synthesis",
        BOOKTITLE = COST08,
        YEAR = "2008",
        PAGES = "126--132",
        BIBSOURCE = "http://www.visionbib.com/bibliography/other1024ss1.html#TT369745"}

@inproceedings{bb375643,
        AUTHOR = "Bauer, D. and Kannampuzha, J. and Kroger, B. J.",
        TITLE = "Articulatory Speech Re-synthesis:
Profiting from Natural Acoustic Speech Data",
        BOOKTITLE = COST08,
        YEAR = "2008",
        PAGES = "344--355",
        BIBSOURCE = "http://www.visionbib.com/bibliography/other1024ss1.html#TT369746"}

@inproceedings{bb375644,
        AUTHOR = "Gu, H. Y. and Cai, C. L. and Cai, S. F.",
        TITLE = "An {HNM}-Based Speaker-Nonspecific Timbre Transformation Scheme for
Speech Synthesis",
        BOOKTITLE = CISP09,
        YEAR = "2009",
        PAGES = "1--5",
        BIBSOURCE = "http://www.visionbib.com/bibliography/other1024ss1.html#TT369747"}

@article{bb375645,
        AUTHOR = "Lung, S. Y. and Chen, C. C. T.",
        TITLE = "A new approach for text-independent speaker recognition",
        JOURNAL = PR,
        VOLUME = "33",
        YEAR = "2000",
        NUMBER = "8",
        MONTH = aug,
        PAGES = "1401--1403",
        BIBSOURCE = "http://www.visionbib.com/bibliography/other1024.html#TT369748"}

@article{bb375646,
        AUTHOR = "Lung, S. Y.",
        TITLE = "Multi-resolution form of {SVD} for text-independent speaker recognition",
        JOURNAL = PR,
        VOLUME = "35",
        YEAR = "2002",
        NUMBER = "7",
        MONTH = jul,
        PAGES = "1637--1639",
        BIBSOURCE = "http://www.visionbib.com/bibliography/other1024.html#TT369749"}

@article{bb375647,
        AUTHOR = "Lung, S. Y.",
        TITLE = "Further reduced form of wavelet feature for text independent speaker
recognition",
        JOURNAL = PR,
        VOLUME = "37",
        YEAR = "2004",
        NUMBER = "7",
        MONTH = jul,
        PAGES = "1565--1566",
        BIBSOURCE = "http://www.visionbib.com/bibliography/other1024.html#TT369750"}

@article{bb375648,
        AUTHOR = "Lung, S. Y.",
        TITLE = "Feature extracted from wavelet eigenfunction estimation for
text-independent speaker recognition",
        JOURNAL = PR,
        VOLUME = "37",
        YEAR = "2004",
        NUMBER = "7",
        MONTH = jul,
        PAGES = "1543--1544",
        BIBSOURCE = "http://www.visionbib.com/bibliography/other1024.html#TT369751"}

@article{bb375649,
        AUTHOR = "Lung, S. Y.",
        TITLE = "Wavelet feature domain adaptive noise reduction using learning
algorithm for text-independent speaker recognition",
        JOURNAL = PR,
        VOLUME = "40",
        YEAR = "2007",
        NUMBER = "9",
        MONTH = sep,
        PAGES = "2603--2606",
        BIBSOURCE = "http://www.visionbib.com/bibliography/other1024.html#TT369752"}

@article{bb375650,
        AUTHOR = "Lung, S. Y.",
        TITLE = "Efficient text independent speaker recognition with wavelet feature
selection based multilayered neural network using supervised learning
algorithm",
        JOURNAL = PR,
        VOLUME = "40",
        YEAR = "2007",
        NUMBER = "12",
        MONTH = dec,
        PAGES = "3616--3620",
        BIBSOURCE = "http://www.visionbib.com/bibliography/other1024.html#TT369753"}

@article{bb375651,
        AUTHOR = "Lung, S. Y.",
        TITLE = "Distributed genetic algorithm for {Gaussian} mixture model based speaker
identification",
        JOURNAL = PR,
        VOLUME = "36",
        YEAR = "2003",
        NUMBER = "10",
        MONTH = oct,
        PAGES = "2479--2481",
        BIBSOURCE = "http://www.visionbib.com/bibliography/other1024.html#TT369754"}

@article{bb375652,
        AUTHOR = "Lung, S. Y.",
        TITLE = "Adaptive fuzzy wavelet algorithm for text-independent speaker
recognition",
        JOURNAL = PR,
        VOLUME = "37",
        YEAR = "2004",
        NUMBER = "10",
        MONTH = oct,
        PAGES = "2095--2096",
        BIBSOURCE = "http://www.visionbib.com/bibliography/other1024.html#TT369755"}

@article{bb375653,
        AUTHOR = "Lung, S. Y.",
        TITLE = "Wavelet feature selection based neural networks with application to the
text independent speaker identification",
        JOURNAL = PR,
        VOLUME = "39",
        YEAR = "2006",
        NUMBER = "8",
        MONTH = aug,
        PAGES = "1518--1521",
        BIBSOURCE = "http://www.visionbib.com/bibliography/other1024.html#TT369756"}

@article{bb375654,
        AUTHOR = "Lung, S. Y.",
        TITLE = "Feature extracted from wavelet decomposition using biorthogonal {Riesz}
basis for text-independent speaker recognition",
        JOURNAL = PR,
        VOLUME = "41",
        YEAR = "2008",
        NUMBER = "10",
        MONTH = oct,
        PAGES = "3068--3070",
        BIBSOURCE = "http://www.visionbib.com/bibliography/other1024.html#TT369757"}

@article{bb375655,
        AUTHOR = "Chen, K. and Wu, T. Y. and Zhang, H. J.",
        TITLE = "On the use of nearest feature line for speaker identification",
        JOURNAL = PRL,
        VOLUME = "23",
        YEAR = "2002",
        NUMBER = "14",
        MONTH = dec,
        PAGES = "1735--1746",
        BIBSOURCE = "http://www.visionbib.com/bibliography/other1024.html#TT369758"}

@article{bb375656,
        AUTHOR = "Ramachandran, R. P. and Farrell, K. R. and Ramachandran, R. and Mammone, R. J.",
        TITLE = "Speaker recognition:
general classifier approaches and data fusion methods",
        JOURNAL = PR,
        VOLUME = "35",
        YEAR = "2002",
        NUMBER = "12",
        MONTH = dec,
        PAGES = "2801--2821",
        BIBSOURCE = "http://www.visionbib.com/bibliography/other1024.html#TT369759"}

@article{bb375657,
        AUTHOR = "Chen, K.",
        TITLE = "Towards better making a decision in speaker verification",
        JOURNAL = PR,
        VOLUME = "36",
        YEAR = "2003",
        NUMBER = "2",
        MONTH = feb,
        PAGES = "329--346",
        BIBSOURCE = "http://www.visionbib.com/bibliography/other1024.html#TT369760"}

@article{bb375658,
        AUTHOR = "Rodriguez Linares, L. and Garcia Mateo, C. and Alba Castro, J. L.",
        TITLE = "On combining classifiers for speaker authentication",
        JOURNAL = PR,
        VOLUME = "36",
        YEAR = "2003",
        NUMBER = "2",
        MONTH = feb,
        PAGES = "347--359",
        BIBSOURCE = "http://www.visionbib.com/bibliography/other1024.html#TT369761"}

@article{bb375659,
        AUTHOR = "Damper, R. I. and Higgins, J. E.",
        TITLE = "Improving speaker identification in noise by subband processing and
decision fusion",
        JOURNAL = PRL,
        VOLUME = "24",
        YEAR = "2003",
        NUMBER = "13",
        MONTH = sep,
        PAGES = "2167--2173",
        BIBSOURCE = "http://www.visionbib.com/bibliography/other1024.html#TT369762"}

@article{bb375660,
        AUTHOR = "Besacier, L. and Mayorga, P. and Bonastre, J. F. and Fredouille, C. and Meignier, S.",
        TITLE = "Overview of compression and packet loss effects in speech biometrics",
        JOURNAL = VISP,
        VOLUME = "150",
        YEAR = "2003",
        NUMBER = "6",
        MONTH = dec,
        PAGES = "372--376",
        BIBSOURCE = "http://www.visionbib.com/bibliography/other1024.html#TT369763"}

@inproceedings{bb375661,
        AUTHOR = "Besacier, L. and Bonastre, J. F.",
        TITLE = "Time and frequency pruning for speaker identification",
        BOOKTITLE = ICPR98,
        VOLUME = "II",
        YEAR = "1998",
        PAGES = "1619--1621",
        BIBSOURCE = "http://www.visionbib.com/bibliography/other1024.html#TT369764"}

@article{bb375662,
        AUTHOR = "Rodriguez Linares, L. and Garcia Mateo, C.",
        TITLE = "Application of fusion techniques to speaker authentication over {IP}
networks",
        JOURNAL = VISP,
        VOLUME = "150",
        YEAR = "2003",
        NUMBER = "6",
        MONTH = dec,
        PAGES = "377--382",
        BIBSOURCE = "http://www.visionbib.com/bibliography/other1024.html#TT369765"}

@article{bb375663,
        AUTHOR = "Chen, C. C. T. and Chen, C. T. and Hou, C. K.",
        TITLE = "Speaker identification using hybrid {Karhunen-Loeve} transform and
{Gaussian} mixture model approach",
        JOURNAL = PR,
        VOLUME = "37",
        YEAR = "2004",
        NUMBER = "5",
        MONTH = may,
        PAGES = "1073--1075",
        BIBSOURCE = "http://www.visionbib.com/bibliography/other1024.html#TT369766"}

@article{bb375664,
        AUTHOR = "Lee, K. Y.",
        TITLE = "Local fuzzy {PCA} based {GMM} with dimension reduction on speaker
identification",
        JOURNAL = PRL,
        VOLUME = "25",
        YEAR = "2004",
        NUMBER = "16",
        MONTH = dec,
        PAGES = "1811--1817",
        BIBSOURCE = "http://www.visionbib.com/bibliography/other1024.html#TT369767"}

@article{bb375665,
        AUTHOR = "Mashao, D. J. and Skosan, M.",
        TITLE = "Combining classifier decisions for robust speaker identification",
        JOURNAL = PR,
        VOLUME = "39",
        YEAR = "2006",
        NUMBER = "1",
        MONTH = jan,
        PAGES = "147--155",
        BIBSOURCE = "http://www.visionbib.com/bibliography/other1024.html#TT369768"}

@article{bb375666,
        AUTHOR = "Skosan, M. and Mashao, D. J.",
        TITLE = "Modified Segmental Histogram Equalization for robust speaker
verification",
        JOURNAL = PRL,
        VOLUME = "27",
        YEAR = "2006",
        NUMBER = "5",
        MONTH = apr,
        PAGES = "479--486",
        BIBSOURCE = "http://www.visionbib.com/bibliography/other1024.html#TT369769"}

@article{bb375667,
        AUTHOR = "Ariyaeeinia, A. M. and Fortuna, J. and Sivakumaran, P. and Malegaonkar, A.",
        TITLE = "Verification effectiveness in open-set speaker identification",
        JOURNAL = VISP,
        VOLUME = "153",
        YEAR = "2006",
        NUMBER = "5",
        MONTH = oct,
        PAGES = "618--624",
        BIBSOURCE = "http://www.visionbib.com/bibliography/other1024.html#TT369770"}

@article{bb375668,
        AUTHOR = "Zhou, G. and Mikhael, W. B.",
        TITLE = "Speaker identification based on adaptive discriminative vector
quantisation",
        JOURNAL = VISP,
        VOLUME = "153",
        YEAR = "2006",
        NUMBER = "6",
        MONTH = dec,
        PAGES = "754--760",
        BIBSOURCE = "http://www.visionbib.com/bibliography/other1024.html#TT369771"}

@article{bb375669,
        AUTHOR = "Park, C. M. and Thapa, D. and Wang, G. N.",
        TITLE = "Speech authentication system using digital watermarking and pattern
recovery",
        JOURNAL = PRL,
        VOLUME = "28",
        YEAR = "2007",
        NUMBER = "8",
        MONTH = jun,
        PAGES = "931--938",
        BIBSOURCE = "http://www.visionbib.com/bibliography/other1024.html#TT369772"}

@article{bb375670,
        AUTHOR = "Faundez Zanuy, M. and Hagmuller, M. and Kubin, G.",
        TITLE = "Speaker identification security improvement by means of speech
watermarking",
        JOURNAL = PR,
        VOLUME = "40",
        YEAR = "2007",
        NUMBER = "11",
        MONTH = nov,
        PAGES = "3027--3034",
        BIBSOURCE = "http://www.visionbib.com/bibliography/other1024.html#TT369773"}

@article{bb375671,
        AUTHOR = "Chetouani, M. and Faundez Zanuy, M. and Gas, B. and Zarader, J. L.",
        TITLE = "Investigation on {LP}-residual representations for speaker identification",
        JOURNAL = PR,
        VOLUME = "42",
        YEAR = "2009",
        NUMBER = "3",
        MONTH = mar,
        PAGES = "487--494",
        BIBSOURCE = "http://www.visionbib.com/bibliography/other1024.html#TT369774"}

@article{bb375672,
        AUTHOR = "Kinnunen, T. and Saastamoinen, J. and Hautamaki, V. and Vinni, M. and Franti, P.",
        TITLE = "Comparative evaluation of maximum a Posteriori vector quantization and
{Gaussian} mixture models in speaker verification",
        JOURNAL = PRL,
        VOLUME = "30",
        YEAR = "2009",
        NUMBER = "4",
        MONTH = mar,
        PAGES = "341--347",
        BIBSOURCE = "http://www.visionbib.com/bibliography/other1024.html#TT369775"}

@article{bb375673,
        AUTHOR = "Chao, Y. H. and Tsai, W. H. and Wang, H. M. and Chang, R. C.",
        TITLE = "Improving the characterization of the alternative hypothesis via
minimum verification error training with applications to speaker
verification",
        JOURNAL = PR,
        VOLUME = "42",
        YEAR = "2009",
        NUMBER = "7",
        MONTH = jul,
        PAGES = "1351--1360",
        BIBSOURCE = "http://www.visionbib.com/bibliography/other1024.html#TT369776"}

@article{bb375674,
        AUTHOR = "Temko, A. and Nadeu, C.",
        TITLE = "Acoustic event detection in meeting-room environments",
        JOURNAL = PRL,
        VOLUME = "30",
        YEAR = "2009",
        NUMBER = "14",
        MONTH = oct,
        PAGES = "1281--1288",
        BIBSOURCE = "http://www.visionbib.com/bibliography/other1024.html#TT369777"}

@article{bb375675,
        AUTHOR = "Kim, S. and Ji, M. Y. and Kim, H.",
        TITLE = "Robust speaker recognition based on filtering in autocorrelation domain
and sub-band feature recombination",
        JOURNAL = PRL,
        VOLUME = "31",
        YEAR = "2010",
        NUMBER = "7",
        MONTH = may,
        PAGES = "593--599",
        BIBSOURCE = "http://www.visionbib.com/bibliography/other1024.html#TT369778"}

@article{bb375676,
        AUTHOR = "Li, H. and Ma, B. and Lee, K. A.",
        TITLE = "Spoken Language Recognition: From Fundamentals to Practice",
        JOURNAL = PIEEE,
        VOLUME = "101",
        YEAR = "2013",
        NUMBER = "5",
        MONTH = may,
        PAGES = "1136--1159",
        BIBSOURCE = "http://www.visionbib.com/bibliography/other1024.html#TT369779"}

@article{bb375677,
        AUTHOR = "Li, H. and Ma, B.",
        TITLE = "{TechWare}: Speaker and Spoken Language Recognition Resources",
        JOURNAL = SPMag,
        VOLUME = "27",
        YEAR = "2010",
        NUMBER = "6",
        PAGES = "139--142",
        BIBSOURCE = "http://www.visionbib.com/bibliography/other1024.html#TT369780"}

@article{bb375678,
        AUTHOR = "Ajmera, P. K. and Jadhav, D. V. and Holambe, R. S.",
        TITLE = "Text-independent speaker identification using {Radon} and discrete cosine
transforms based features from speech spectrogram",
        JOURNAL = PR,
        VOLUME = "44",
        YEAR = "2011",
        NUMBER = "10--11",
        MONTH = oct,
        PAGES = "2749--2759",
        BIBSOURCE = "http://www.visionbib.com/bibliography/other1024.html#TT369781"}

@article{bb375679,
        AUTHOR = "Kinnunen, T. and Sidoroff, I. and Tuononen, M. and Franti, P.",
        TITLE = "Comparison of clustering methods:
A case study of text-independent speaker modeling",
        JOURNAL = PRL,
        VOLUME = "32",
        YEAR = "2011",
        NUMBER = "13",
        MONTH = oct,
        PAGES = "1604--1617",
        BIBSOURCE = "http://www.visionbib.com/bibliography/other1024.html#TT369782"}

@inproceedings{bb375680,
        AUTHOR = "Kinnunen, T. and Karpov, E. and Franti, P.",
        TITLE = "A Speaker Pruning Algorithm for Real-Time Speaker Identification",
        BOOKTITLE = AVBPA03,
        YEAR = "2003",
        PAGES = "639--646",
        BIBSOURCE = "http://www.visionbib.com/bibliography/other1024.html#TT369783"}

@inproceedings{bb375681,
        AUTHOR = "Kinnunen, T. and Franti, P.",
        TITLE = "Speaker Discriminative Weighting Method for {VQ}-Based Speaker
Identification",
        BOOKTITLE = AVBPA01,
        YEAR = "2001",
        PAGES = "150",
        BIBSOURCE = "http://www.visionbib.com/bibliography/other1024.html#TT369784"}

@article{bb375682,
        AUTHOR = "Zao, L. and Coelho, R.",
        TITLE = "Colored Noise Based Multicondition Training Technique for Robust
Speaker Identification",
        JOURNAL = SPLetters,
        VOLUME = "18",
        YEAR = "2011",
        NUMBER = "11",
        MONTH = nov,
        PAGES = "675--678",
        BIBSOURCE = "http://www.visionbib.com/bibliography/other1024.html#TT369785"}

@article{bb375683,
  author    = {Hanilci, C. and Kinnunen, T. and Ertas, F. and Saeidi, R. and Pohjalainen, J. and Alku, P.},
  title     = {Regularized All-Pole Models for Speaker Verification Under Noisy Environments},
  journal   = SPLetters,
  volume    = {19},
  number    = {3},
  pages     = {163-166},
  month     = {March},
  year      = {2012},
  bibsource = {http://www.visionbib.com/bibliography/other1024.html#TT369786},
}

@article{bb375684,
  author    = {Salamin, H. and Vinciarelli, A.},
  title     = {Automatic Role Recognition in Multiparty Conversations: An Approach Based on Turn Organization, Prosody, and Conditional Random Fields},
  journal   = MultMed,
  volume    = {14},
  number    = {2},
  pages     = {338-345},
  year      = {2012},
  bibsource = {http://www.visionbib.com/bibliography/other1024.html#TT369787},
}

@article{bb375685,
        AUTHOR = "Tang, H. and Chu, S. and Hasegawa Johnson, M. and Huang, T. S.",
        TITLE = "Partially Supervised Speaker Clustering",
        JOURNAL = PAMI,
        VOLUME = "34",
        YEAR = "2012",
        NUMBER = "5",
        MONTH = "May",
        PAGES = "959-971",
        BIBSOURCE = "http://www.visionbib.com/bibliography/other1024.html#TT369788"}

@article{bb375686,
        AUTHOR = "Montalvao, J. and Araujo, M. R. R.",
        TITLE = "Is masking a relevant aspect lacking in {MFCC}? A speaker verification
perspective",
        JOURNAL = PRL,
        VOLUME = "33",
        YEAR = "2012",
        NUMBER = "16",
        MONTH = "December",
        PAGES = "2156-2165",
        BIBSOURCE = "http://www.visionbib.com/bibliography/other1024.html#TT369789"}

@article{bb375687,
        AUTHOR = "Garimella, S. and Mallidi, S. H. and Hermansky, H.",
        TITLE = "Regularized Auto-Associative Neural Networks for Speaker Verification",
        JOURNAL = SPLetters,
        VOLUME = "19",
        YEAR = "2012",
        NUMBER = "12",
        MONTH = "December",
        PAGES = "841-844",
        BIBSOURCE = "http://www.visionbib.com/bibliography/other1024.html#TT369790"}

@article{bb375688,
        AUTHOR = "Sahidullah, M. and Saha, G.",
        TITLE = "A Novel Windowing Technique for Efficient Computation of {MFCC} for
Speaker Recognition",
        JOURNAL = SPLetters,
        VOLUME = "20",
        YEAR = "2013",
        NUMBER = "2",
        MONTH = "February",
        PAGES = "149-152",
        BIBSOURCE = "http://www.visionbib.com/bibliography/other1024.html#TT369791"}

@article{bb375689,
        AUTHOR = "Vallet, F. and Essid, S. and Carrive, J.",
        TITLE = "A Multimodal Approach to Speaker Diarization on {TV} Talk-Shows",
        JOURNAL = MultMed,
        VOLUME = "15",
        YEAR = "2013",
        NUMBER = "3",
        PAGES = "509-520",
        BIBSOURCE = "http://www.visionbib.com/bibliography/other1024.html#TT369792"}

@article{bb375690,
  author    = {Inthavisas, K. and Lopresti, D.},
  title     = {Secure speech biometric templates for user authentication},
  journal   = IET-Bio,
  volume    = {1},
  number    = {1},
  pages     = {46-54},
  month     = {March},
  year      = {2012},
  bibsource = {http://www.visionbib.com/bibliography/other1024.html#TT369793},
}

@article{bb375691,
  author    = {Pillay, S. and Ariyaeeinia, A. and Sivakumaran, P. and Pawlewski, M.},
  title     = {Effective speaker verification via dynamic mismatch compensation},
  journal   = IET-Bio,
  volume    = {1},
  number    = {2},
  pages     = {130-135},
  month     = {June},
  year      = {2012},
  bibsource = {http://www.visionbib.com/bibliography/other1024.html#TT369794},
}

@article{bb375692,
        AUTHOR = "Bhardwaj, S. and Srivastava, S. and Hanmandlu, M. and Gupta, J. R. P.",
        TITLE = "{GFM}-Based Methods for Speaker Identification",
        JOURNAL = Cyber,
        VOLUME = "43",
        YEAR = "2013",
        NUMBER = "3",
        PAGES = "1047-1058",
        BIBSOURCE = "http://www.visionbib.com/bibliography/other1024.html#TT369795"}

@article{bb375693,
  author    = {Pekhovsky, T. and Sizov, A.},
  title     = {Comparison between supervised and unsupervised learning of probabilistic linear discriminant analysis mixture models for speaker verification},
  journal   = PRL,
  volume    = {34},
  number    = {11},
  pages     = {1307-1313},
  month     = {August},
  year      = {2013},
  bibsource = {http://www.visionbib.com/bibliography/other1024.html#TT369796},
}

@article{bb375694,
  author    = {Yaman, S. and Pelecanos, J.},
  title     = {Using Polynomial Kernel Support Vector Machines for Speaker Verification},
  journal   = SPLetters,
  volume    = {20},
  number    = {9},
  pages     = {901-904},
  year      = {2013},
  bibsource = {http://www.visionbib.com/bibliography/other1024.html#TT369797},
}

@article{bb375695,
        AUTHOR = "Bin Amin, T. and Marziliano, P. and German, J. S.",
        TITLE = "Glottal and Vocal Tract Characteristics of Voice Impersonators",
        JOURNAL = MultMed,
        VOLUME = "16",
        YEAR = "2014",
        NUMBER = "3",
        MONTH = "April",
        PAGES = "668-678",
        BIBSOURCE = "http://www.visionbib.com/bibliography/other1024.html#TT369798"}

@article{bb375696,
        AUTHOR = "Sarkar, A. K. and Do, C. T. and Le, V. B. and Barras, C.",
        TITLE = "Combination of Cepstral and Phonetically Discriminative Features for
Speaker Verification",
        JOURNAL = SPLetters,
        VOLUME = "21",
        YEAR = "2014",
        NUMBER = "9",
        MONTH = "September",
        PAGES = "1040-1044",
        BIBSOURCE = "http://www.visionbib.com/bibliography/other1024.html#TT369799"}

@article{bb375697,
        AUTHOR = "Yang, H. and Xu, Y. and Huang, H. and Zhou, R. and Yan, Y.",
        TITLE = "Voice biometrics using linear {Gaussian} model",
        JOURNAL = IET-Bio,
        VOLUME = "3",
        YEAR = "2014",
        NUMBER = "1",
        MONTH = "March",
        PAGES = "9-15",
        BIBSOURCE = "http://www.visionbib.com/bibliography/other1024.html#TT369800"}

@article{bb375698,
        AUTHOR = "Ribas Gonzalez, D. and {Calvo de Lara}, J. R.",
        TITLE = "Feature classification criterion for missing features mask estimation
in robust speaker recognition",
        JOURNAL = SIViP,
        VOLUME = "8",
        YEAR = "2014",
        NUMBER = "2",
        MONTH = "February",
        PAGES = "365-375",
        BIBSOURCE = "http://www.visionbib.com/bibliography/other1024.html#TT369801"}

@article{bb375699,
        AUTHOR = "Hernandez Sierra, G. and Calvo, J. R. and Bonastre, J. F. and Bousquet, P. M.",
        TITLE = "Session compensation using binary speech representation for speaker
recognition",
        JOURNAL = PRL,
        VOLUME = "49",
        YEAR = "2014",
        NUMBER = "1",
        PAGES = "17-23",
        BIBSOURCE = "http://www.visionbib.com/bibliography/other1024.html#TT369802"}

Last update: Feb 17, 2026 at 20:06:16