@article{bb378300,
        AUTHOR = "Haji Ali, M. and Menapace, W. and Siarohin, A. and Balakrishnan, G. and Ordonez, V.",
        TITLE = "Taming Data and Transformers for Audio Generation",
        JOURNAL = IJCV,
        VOLUME = "134",
        YEAR = "2026",
        NUMBER = "1",
        MONTH = jan,
        PAGES = "87",
        BIBSOURCE = "http://www.visionbib.com/bibliography/other1024ss1.html#TT372395"}

@inproceedings{bb378301,
        AUTHOR = "Liu, J. and Geddes, J. and Guo, Z.Y. and Jiang, H. and Nandwana, M.K.",
        TITLE = "Smooth Cache: A Universal Inference Acceleration Technique for
Diffusion Transformers",
        BOOKTITLE = LargeVM25,
        YEAR = "2025",
        PAGES = "3220--3229",
        BIBSOURCE = "http://www.visionbib.com/bibliography/other1024ss1.html#TT372396"}

@inproceedings{bb378302,
        AUTHOR = "Kushwaha, S.S. and Tian, Y.P.",
        TITLE = "{VinTAGe}: Joint Video and Text Conditioning for Holistic Audio
Generation",
        BOOKTITLE = CVPR25,
        YEAR = "2025",
        PAGES = "13529--13539",
        BIBSOURCE = "http://www.visionbib.com/bibliography/other1024ss1.html#TT372397"}

@inproceedings{bb378303,
        AUTHOR = "Kim, J.H. and Choi, J. and Kim, J.H. and Jung, C. and Chung, J.S.",
        TITLE = "From Faces to Voices: Learning Hierarchical Representations for
High-quality Video-to-Speech",
        BOOKTITLE = CVPR25,
        YEAR = "2025",
        PAGES = "15874--15884",
        BIBSOURCE = "http://www.visionbib.com/bibliography/other1024ss1.html#TT372398"}

@inproceedings{bb378304,
        AUTHOR = "Cong, G.X. and Pan, J. and Li, L. and Qi, Y.K. and Peng, Y.X. and van den Hengel, A.J. and Yang, J. and Huang, Q.M.",
        TITLE = "{EmoDubber}: Towards High Quality and Emotion Controllable Movie
Dubbing",
        BOOKTITLE = CVPR25,
        YEAR = "2025",
        PAGES = "15863--15873",
        BIBSOURCE = "http://www.visionbib.com/bibliography/other1024ss1.html#TT372399"}

@inproceedings{bb378305,
        AUTHOR = "Zhang, Z.D. and Li, L. and Yan, C.G. and Liu, C.S. and van den Hengel, A.J. and Qi, Y.K.",
        TITLE = "Prosody-Enhanced Acoustic Pre-training and Acoustic-Disentangled
Prosody Adapting for Movie Dubbing",
        BOOKTITLE = CVPR25,
        YEAR = "2025",
        PAGES = "172--182",
        BIBSOURCE = "http://www.visionbib.com/bibliography/other1024ss1.html#TT372400"}

@inproceedings{bb378306,
        AUTHOR = "Rai, A. and Sridhar, S.",
        TITLE = "{EgoSonics}: Generating Synchronized Audio for Silent Egocentric Videos",
        BOOKTITLE = WACV25,
        YEAR = "2025",
        PAGES = "4935--4946",
        BIBSOURCE = "http://www.visionbib.com/bibliography/other1024ss1.html#TT372401"}

@inproceedings{bb378307,
        AUTHOR = "Yadav, A.K.S. and Bhagtani, K. and Salvi, D. and Bestagini, P. and Delp, E.J.",
        TITLE = "{FairSSD}: Understanding Bias in Synthetic Speech Detectors",
        BOOKTITLE = WMF24,
        YEAR = "2024",
        PAGES = "4418--4428",
        BIBSOURCE = "http://www.visionbib.com/bibliography/other1024ss1.html#TT372402"}

@inproceedings{bb378308,
        AUTHOR = "Cuccovillo, L. and Gerhardt, M. and Aichroth, P.",
        TITLE = "Audio Transformer for Synthetic Speech Detection via Multi-Formant
Analysis",
        BOOKTITLE = WMF24,
        YEAR = "2024",
        PAGES = "4409--4417",
        BIBSOURCE = "http://www.visionbib.com/bibliography/other1024ss1.html#TT372403"}

@inproceedings{bb378309,
        AUTHOR = "Cong, G.X. and Li, L. and Qi, Y.K. and Zha, Z.J. and Wu, Q. and Wang, W.Y. and Jiang, B. and Yang, M.H. and Huang, Q.M.",
        TITLE = "Learning to Dub Movies via Hierarchical Prosody Models",
        BOOKTITLE = CVPR23,
        YEAR = "2023",
        PAGES = "14687--14697",
        BIBSOURCE = "http://www.visionbib.com/bibliography/other1024ss1.html#TT372404"}

@inproceedings{bb378310,
        AUTHOR = "Hsu, W.N. and Remez, T. and Shi, B. and Donley, J. and Adi, Y.",
        TITLE = "{ReVISE}: Self-Supervised Speech Resynthesis with Visual Input for
Universal and Generalized Speech Regeneration",
        BOOKTITLE = CVPR23,
        YEAR = "2023",
        PAGES = "18796--18806",
        BIBSOURCE = "http://www.visionbib.com/bibliography/other1024ss1.html#TT372405"}

@inproceedings{bb378311,
        AUTHOR = "Sun, C.Z. and Jia, S. and Hou, S.W. and Lyu, S.W.",
        TITLE = "{AI}-Synthesized Voice Detection Using Neural Vocoder Artifacts",
        BOOKTITLE = WMF23,
        YEAR = "2023",
        PAGES = "904--912",
        BIBSOURCE = "http://www.visionbib.com/bibliography/other1024ss1.html#TT372406"}

@inproceedings{bb378312,
        AUTHOR = "Noufi, C. and May, L. and Berger, J.",
        TITLE = "The Role of Vocal Persona in Natural and Synthesized Speech",
        BOOKTITLE = FG23,
        YEAR = "2023",
        PAGES = "1--4",
        BIBSOURCE = "http://www.visionbib.com/bibliography/other1024ss1.html#TT372407"}

% NOTE(review): BOOKTITLE was the quoted literal "ICPR22"; every other entry
% here references an unquoted string macro (ICPR21, ICPR18, ...). Assumes the
% ICPR22 macro is defined alongside those -- confirm in the strings file.
@inproceedings{bb378313,
        AUTHOR = "Hwang, I.S. and Lee, S.H. and Lee, S.W.",
        TITLE = "{StyleVC}: Non-Parallel Voice Conversion with Adversarial Style
Generalization",
        BOOKTITLE = ICPR22,
        YEAR = "2022",
        PAGES = "23--30",
        BIBSOURCE = "http://www.visionbib.com/bibliography/other1024ss1.html#TT372408"}

% NOTE(review): "Autolv" is kept as found; the published title may use a
% different internal capitalisation -- confirm and brace-protect if so.
@inproceedings{bb378314,
        AUTHOR = "Wang, W.B. and Song, Y. and Jha, S.",
        TITLE = "Autolv: Automatic Lecture Video Generator",
        BOOKTITLE = ICIP22,
        YEAR = "2022",
        PAGES = "1086--1090",
        BIBSOURCE = "http://www.visionbib.com/bibliography/other1024ss1.html#TT372409"}

@inproceedings{bb378315,
        AUTHOR = "Borzi, S. and Giudice, O. and Stanco, F. and Allegra, D.",
        TITLE = "Is synthetic voice detection research going into the right direction?",
        BOOKTITLE = WMF22,
        YEAR = "2022",
        PAGES = "71--80",
        BIBSOURCE = "http://www.visionbib.com/bibliography/other1024ss1.html#TT372410"}

@inproceedings{bb378316,
        AUTHOR = "Hassid, M. and Ramanovich, M.T. and Shillingford, B. and Wang, M. and Jia, Y. and Remez, T.",
        TITLE = "More than Words: In-the-Wild Visually-Driven Prosody for
Text-to-Speech",
        BOOKTITLE = CVPR22,
        YEAR = "2022",
        PAGES = "10577--10587",
        BIBSOURCE = "http://www.visionbib.com/bibliography/other1024ss1.html#TT372411"}

@inproceedings{bb378317,
        AUTHOR = "Kwak, I.Y. and Kwag, S. and Lee, J. and Huh, J.H. and Lee, C.H. and Jeon, Y.B. and Hwang, J.H. and Yoon, J.W.",
        TITLE = "{ResMax}: Detecting Voice Spoofing Attacks with Residual Network and
Max Feature Map",
        BOOKTITLE = ICPR21,
        YEAR = "2021",
        PAGES = "4837--4844",
        BIBSOURCE = "http://www.visionbib.com/bibliography/other1024ss1.html#TT372412"}

@inproceedings{bb378318,
        AUTHOR = "Wang, D.H. and Wang, R. and Dong, L. and Yan, D. and Ren, Y.M.",
        TITLE = "Efficient Generation of Speech Adversarial Examples with Generative
Model",
        BOOKTITLE = IWDW20,
        YEAR = "2020",
        PAGES = "251--264",
        BIBSOURCE = "http://www.visionbib.com/bibliography/other1024ss1.html#TT372413"}

@inproceedings{bb378319,
        AUTHOR = "Zhou, H. and Liu, Z. and Xu, X. and Luo, P. and Wang, X.",
        TITLE = "Vision-Infused Deep Audio Inpainting",
        BOOKTITLE = ICCV19,
        YEAR = "2019",
        PAGES = "283--292",
        BIBSOURCE = "http://www.visionbib.com/bibliography/other1024ss1.html#TT372414"}

@inproceedings{bb378320,
        AUTHOR = "Bailer, W. and Wijnants, M. and Lievens, H. and Claes, S.",
        TITLE = "Multimedia Analytics Challenges and Opportunities for Creating
Interactive Radio Content",
        BOOKTITLE = MMMod20,
        YEAR = "2020",
        PAGES = "II:375--387",
        BIBSOURCE = "http://www.visionbib.com/bibliography/other1024ss1.html#TT372415"}

@inproceedings{bb378321,
        AUTHOR = "Huang, T. and Wang, H.X. and Chen, Y. and He, P.S.",
        TITLE = "{GRU-SVM} Model for Synthetic Speech Detection",
        BOOKTITLE = IWDW19,
        YEAR = "2019",
        PAGES = "115--125",
        BIBSOURCE = "http://www.visionbib.com/bibliography/other1024ss1.html#TT372416"}

@inproceedings{bb378322,
        AUTHOR = "Wong, A. and Xu, A. and Dudek, G.",
        TITLE = "Investigating Trust Factors in Human-Robot Shared Control:
Implicit Gender Bias Around Robot Voice",
        BOOKTITLE = CRV19,
        YEAR = "2019",
        PAGES = "195--200",
        BIBSOURCE = "http://www.visionbib.com/bibliography/other1024ss1.html#TT372417"}

@inproceedings{bb378323,
        AUTHOR = "Xiao, L. and Wang, Z.",
        TITLE = "Dense Convolutional Recurrent Neural Network for Generalized Speech
Animation",
        BOOKTITLE = ICPR18,
        YEAR = "2018",
        PAGES = "633--638",
        BIBSOURCE = "http://www.visionbib.com/bibliography/other1024ss1.html#TT372418"}

@inproceedings{bb378324,
        AUTHOR = "Shah, N.J. and Patil, H.A.",
        TITLE = "Analysis of Features and Metrics for Alignment in Text-Dependent Voice
Conversion",
        BOOKTITLE = PReMI17,
        YEAR = "2017",
        PAGES = "299--307",
        BIBSOURCE = "http://www.visionbib.com/bibliography/other1024ss1.html#TT372419"}

@inproceedings{bb378325,
        AUTHOR = "Rybarova, R. and Drozd, I. and Rozinaj, G.",
        TITLE = "{GUI} for interactive speech synthesis",
        BOOKTITLE = WSSIP16,
        YEAR = "2016",
        PAGES = "1--4",
        BIBSOURCE = "http://www.visionbib.com/bibliography/other1024ss1.html#TT372420"}

@inproceedings{bb378326,
        AUTHOR = "Coto Jimenez, M. and Goddard Close, J.",
        TITLE = "{LSTM} Deep Neural Networks Postfiltering for Improving the Quality of
Synthetic Voices",
        BOOKTITLE = MCPR16,
        YEAR = "2016",
        PAGES = "280--289",
        BIBSOURCE = "http://www.visionbib.com/bibliography/other1024ss1.html#TT372421"}

@inproceedings{bb378327,
        AUTHOR = "Vasek, M. and Rozinaj, G. and Rybarova, R.",
        TITLE = "Letter-To-Sound conversion for speech synthesizer",
        BOOKTITLE = WSSIP16,
        YEAR = "2016",
        PAGES = "1--4",
        BIBSOURCE = "http://www.visionbib.com/bibliography/other1024ss1.html#TT372422"}

@inproceedings{bb378328,
        AUTHOR = "Rybarova, R. and del Corral, G. and Rozinaj, G.",
        TITLE = "Diphone {Spanish} text-to-speech synthesizer",
        BOOKTITLE = WSSIP15,
        YEAR = "2015",
        PAGES = "121--124",
        BIBSOURCE = "http://www.visionbib.com/bibliography/other1024ss1.html#TT372423"}

@inproceedings{bb378329,
        AUTHOR = "Verma, R. and Sarkar, P. and Rao, K.S.",
        TITLE = "Conversion of neutral speech to storytelling style speech",
        BOOKTITLE = ICAPR15,
        YEAR = "2015",
        PAGES = "1--6",
        BIBSOURCE = "http://www.visionbib.com/bibliography/other1024ss1.html#TT372424"}

@inproceedings{bb378330,
        AUTHOR = "Narendra, N.P. and Rao, K.S.",
        TITLE = "Optimal residual frame based source modeling for {HMM}-based speech
synthesis",
        BOOKTITLE = ICAPR15,
        YEAR = "2015",
        PAGES = "1--5",
        BIBSOURCE = "http://www.visionbib.com/bibliography/other1024ss1.html#TT372425"}

% NOTE(review): "with or Relationship" read as the logical operator and
% restored to a protected "OR" -- confirm against the published title.
@inproceedings{bb378331,
        AUTHOR = "Wang, Y. and Tao, J.H. and Yang, M.H. and Li, Y.",
        TITLE = "Extended Decision Tree with {OR} Relationship for {HMM}-Based Speech
Synthesis",
        BOOKTITLE = ACPR13,
        YEAR = "2013",
        PAGES = "225--229",
        BIBSOURCE = "http://www.visionbib.com/bibliography/other1024ss1.html#TT372426"}

% The underscore in the title is escaped: a bare "_" in text mode is a LaTeX
% error when the bibliography is typeset.
@inproceedings{bb378332,
        AUTHOR = "Gao, L. and Yu, H.Z. and Zhang, J.H. and Fang, H.P.",
        TITLE = "Research on {HMM}\_based speech synthesis for {Lhasa} dialect",
        BOOKTITLE = IASP11,
        YEAR = "2011",
        PAGES = "429--433",
        BIBSOURCE = "http://www.visionbib.com/bibliography/other1024ss1.html#TT372427"}

@inproceedings{bb378333,
        AUTHOR = "Chakraborty, R. and Garain, U.",
        TITLE = "Role of Synthetically Generated Samples on Speech Recognition in a
Resource-Scarce Language",
        BOOKTITLE = ICPR10,
        YEAR = "2010",
        PAGES = "1618--1621",
        BIBSOURCE = "http://www.visionbib.com/bibliography/other1024ss1.html#TT372428"}

@inproceedings{bb378334,
        AUTHOR = "Rao, K.S. and Maity, S. and Taru, A. and Koolagudi, S.G.",
        TITLE = "Unit Selection Using Linguistic, Prosodic and Spectral Distance for
Developing Text-to-Speech System in {Hindi}",
        BOOKTITLE = PReMI09,
        YEAR = "2009",
        PAGES = "531--536",
        BIBSOURCE = "http://www.visionbib.com/bibliography/other1024ss1.html#TT372429"}

@inproceedings{bb378335,
        AUTHOR = "Bahrampour, A. and Barkhoda, W. and Azami, B.Z.",
        TITLE = "Implementation of Three Text to Speech Systems for {Kurdish} Language",
        BOOKTITLE = CIARP09,
        YEAR = "2009",
        PAGES = "321--328",
        BIBSOURCE = "http://www.visionbib.com/bibliography/other1024ss1.html#TT372430"}

@inproceedings{bb378336,
        AUTHOR = "Shirbahadurkar, S.D. and Bormane, D.S.",
        TITLE = "{Marathi} Language Speech Synthesizer Using Concatenative Synthesis
Strategy (Spoken in {Maharashtra}, {India})",
        BOOKTITLE = ICMV09,
        YEAR = "2009",
        PAGES = "181--185",
        BIBSOURCE = "http://www.visionbib.com/bibliography/other1024ss1.html#TT372431"}

@inproceedings{bb378337,
        AUTHOR = "Tuckova, J. and Holub, J. and Dubeda, T.",
        TITLE = "Technical and Phonetic Aspects of Speech Quality Assessment:
The Case of Prosody Synthesis",
        BOOKTITLE = COST08,
        YEAR = "2008",
        PAGES = "126--132",
        BIBSOURCE = "http://www.visionbib.com/bibliography/other1024ss1.html#TT372432"}

@inproceedings{bb378338,
        AUTHOR = "Bauer, D. and Kannampuzha, J. and Kroger, B.J.",
        TITLE = "Articulatory Speech Re-synthesis:
Profiting from Natural Acoustic Speech Data",
        BOOKTITLE = COST08,
        YEAR = "2008",
        PAGES = "344--355",
        BIBSOURCE = "http://www.visionbib.com/bibliography/other1024ss1.html#TT372433"}

@inproceedings{bb378339,
        AUTHOR = "Gu, H.Y. and Cai, C.L. and Cai, S.F.",
        TITLE = "An {HNM}-Based Speaker-Nonspecific Timbre Transformation Scheme for
Speech Synthesis",
        BOOKTITLE = CISP09,
        YEAR = "2009",
        PAGES = "1--5",
        BIBSOURCE = "http://www.visionbib.com/bibliography/other1024ss1.html#TT372434"}

@article{bb378340,
        AUTHOR = "Lung, S.Y. and Chen, C.C.T.",
        TITLE = "A new approach for text-independent speaker recognition",
        JOURNAL = PR,
        VOLUME = "33",
        YEAR = "2000",
        NUMBER = "8",
        MONTH = aug,
        PAGES = "1401--1403",
        BIBSOURCE = "http://www.visionbib.com/bibliography/other1024.html#TT372435"}

@article{bb378341,
        AUTHOR = "Lung, S.Y.",
        TITLE = "Multi-resolution form of {SVD} for text-independent speaker recognition",
        JOURNAL = PR,
        VOLUME = "35",
        YEAR = "2002",
        NUMBER = "7",
        MONTH = jul,
        PAGES = "1637--1639",
        BIBSOURCE = "http://www.visionbib.com/bibliography/other1024.html#TT372436"}

@article{bb378342,
        AUTHOR = "Lung, S.Y.",
        TITLE = "Further reduced form of wavelet feature for text independent speaker
recognition",
        JOURNAL = PR,
        VOLUME = "37",
        YEAR = "2004",
        NUMBER = "7",
        MONTH = jul,
        PAGES = "1565--1566",
        BIBSOURCE = "http://www.visionbib.com/bibliography/other1024.html#TT372437"}

@article{bb378343,
        AUTHOR = "Lung, S.Y.",
        TITLE = "Feature extracted from wavelet eigenfunction estimation for
text-independent speaker recognition",
        JOURNAL = PR,
        VOLUME = "37",
        YEAR = "2004",
        NUMBER = "7",
        MONTH = jul,
        PAGES = "1543--1544",
        BIBSOURCE = "http://www.visionbib.com/bibliography/other1024.html#TT372438"}

@article{bb378344,
        AUTHOR = "Lung, S.Y.",
        TITLE = "Wavelet feature domain adaptive noise reduction using learning
algorithm for text-independent speaker recognition",
        JOURNAL = PR,
        VOLUME = "40",
        YEAR = "2007",
        NUMBER = "9",
        MONTH = sep,
        PAGES = "2603--2606",
        BIBSOURCE = "http://www.visionbib.com/bibliography/other1024.html#TT372439"}

@article{bb378345,
        AUTHOR = "Lung, S.Y.",
        TITLE = "Efficient text independent speaker recognition with wavelet feature
selection based multilayered neural network using supervised learning
algorithm",
        JOURNAL = PR,
        VOLUME = "40",
        YEAR = "2007",
        NUMBER = "12",
        MONTH = dec,
        PAGES = "3616--3620",
        BIBSOURCE = "http://www.visionbib.com/bibliography/other1024.html#TT372440"}

@article{bb378346,
        AUTHOR = "Lung, S.Y.",
        TITLE = "Distributed genetic algorithm for {Gaussian} mixture model based speaker
identification",
        JOURNAL = PR,
        VOLUME = "36",
        YEAR = "2003",
        NUMBER = "10",
        MONTH = oct,
        PAGES = "2479--2481",
        BIBSOURCE = "http://www.visionbib.com/bibliography/other1024.html#TT372441"}

@article{bb378347,
        AUTHOR = "Lung, S.Y.",
        TITLE = "Adaptive fuzzy wavelet algorithm for text-independent speaker
recognition",
        JOURNAL = PR,
        VOLUME = "37",
        YEAR = "2004",
        NUMBER = "10",
        MONTH = oct,
        PAGES = "2095--2096",
        BIBSOURCE = "http://www.visionbib.com/bibliography/other1024.html#TT372442"}

@article{bb378348,
        AUTHOR = "Lung, S.Y.",
        TITLE = "Wavelet feature selection based neural networks with application to the
text independent speaker identification",
        JOURNAL = PR,
        VOLUME = "39",
        YEAR = "2006",
        NUMBER = "8",
        MONTH = aug,
        PAGES = "1518--1521",
        BIBSOURCE = "http://www.visionbib.com/bibliography/other1024.html#TT372443"}

@article{bb378349,
        AUTHOR = "Lung, S.Y.",
        TITLE = "Feature extracted from wavelet decomposition using biorthogonal {Riesz}
basis for text-independent speaker recognition",
        JOURNAL = PR,
        VOLUME = "41",
        YEAR = "2008",
        NUMBER = "10",
        MONTH = oct,
        PAGES = "3068--3070",
        BIBSOURCE = "http://www.visionbib.com/bibliography/other1024.html#TT372444"}

@article{bb378350,
        AUTHOR = "Chen, K. and Wu, T.Y. and Zhang, H.J.",
        TITLE = "On the use of nearest feature line for speaker identification",
        JOURNAL = PRL,
        VOLUME = "23",
        YEAR = "2002",
        NUMBER = "14",
        MONTH = dec,
        PAGES = "1735--1746",
        BIBSOURCE = "http://www.visionbib.com/bibliography/other1024.html#TT372445"}

@article{bb378351,
        AUTHOR = "Ramachandran, R.P. and Farrell, K.R. and Ramachandran, R. and Mammone, R.J.",
        TITLE = "Speaker recognition:
general classifier approaches and data fusion methods",
        JOURNAL = PR,
        VOLUME = "35",
        YEAR = "2002",
        NUMBER = "12",
        MONTH = dec,
        PAGES = "2801--2821",
        BIBSOURCE = "http://www.visionbib.com/bibliography/other1024.html#TT372446"}

@article{bb378352,
        AUTHOR = "Chen, K.",
        TITLE = "Towards better making a decision in speaker verification",
        JOURNAL = PR,
        VOLUME = "36",
        YEAR = "2003",
        NUMBER = "2",
        MONTH = feb,
        PAGES = "329--346",
        BIBSOURCE = "http://www.visionbib.com/bibliography/other1024.html#TT372447"}

@article{bb378353,
        AUTHOR = "Rodriguez Linares, L. and Garcia Mateo, C. and Alba Castro, J.L.",
        TITLE = "On combining classifiers for speaker authentication",
        JOURNAL = PR,
        VOLUME = "36",
        YEAR = "2003",
        NUMBER = "2",
        MONTH = feb,
        PAGES = "347--359",
        BIBSOURCE = "http://www.visionbib.com/bibliography/other1024.html#TT372448"}

@article{bb378354,
        AUTHOR = "Damper, R.I. and Higgins, J.E.",
        TITLE = "Improving speaker identification in noise by subband processing and
decision fusion",
        JOURNAL = PRL,
        VOLUME = "24",
        YEAR = "2003",
        NUMBER = "13",
        MONTH = sep,
        PAGES = "2167--2173",
        BIBSOURCE = "http://www.visionbib.com/bibliography/other1024.html#TT372449"}

@article{bb378355,
        AUTHOR = "Besacier, L. and Mayorga, P. and Bonastre, J.F. and Fredouille, C. and Meignier, S.",
        TITLE = "Overview of compression and packet loss effects in speech biometrics",
        JOURNAL = VISP,
        VOLUME = "150",
        YEAR = "2003",
        NUMBER = "6",
        MONTH = dec,
        PAGES = "372--376",
        BIBSOURCE = "http://www.visionbib.com/bibliography/other1024.html#TT372450"}

% PAGES previously carried a hard-coded "Vol II: " prefix; normalised to the
% "II:first--last" form that entry bb378320 uses for multi-volume proceedings.
@inproceedings{bb378356,
        AUTHOR = "Besacier, L. and Bonastre, J.F.",
        TITLE = "Time and frequency pruning for speaker identification",
        BOOKTITLE = ICPR98,
        YEAR = "1998",
        PAGES = "II:1619--1621",
        BIBSOURCE = "http://www.visionbib.com/bibliography/other1024.html#TT372451"}

@article{bb378357,
        AUTHOR = "Rodriguez Linares, L. and Garcia Mateo, C.",
        TITLE = "Application of fusion techniques to speaker authentication over {IP}
networks",
        JOURNAL = VISP,
        VOLUME = "150",
        YEAR = "2003",
        NUMBER = "6",
        MONTH = dec,
        PAGES = "377--382",
        BIBSOURCE = "http://www.visionbib.com/bibliography/other1024.html#TT372452"}

@article{bb378358,
        AUTHOR = "Chen, C.C.T. and Chen, C.T. and Hou, C.K.",
        TITLE = "Speaker identification using hybrid {Karhunen-Loeve} transform and
{Gaussian} mixture model approach",
        JOURNAL = PR,
        VOLUME = "37",
        YEAR = "2004",
        NUMBER = "5",
        MONTH = may,
        PAGES = "1073--1075",
        BIBSOURCE = "http://www.visionbib.com/bibliography/other1024.html#TT372453"}

@article{bb378359,
        AUTHOR = "Lee, K.Y.",
        TITLE = "Local fuzzy {PCA} based {GMM} with dimension reduction on speaker
identification",
        JOURNAL = PRL,
        VOLUME = "25",
        YEAR = "2004",
        NUMBER = "16",
        MONTH = dec,
        PAGES = "1811--1817",
        BIBSOURCE = "http://www.visionbib.com/bibliography/other1024.html#TT372454"}

@article{bb378360,
        AUTHOR = "Mashao, D.J. and Skosan, M.",
        TITLE = "Combining classifier decisions for robust speaker identification",
        JOURNAL = PR,
        VOLUME = "39",
        YEAR = "2006",
        NUMBER = "1",
        MONTH = jan,
        PAGES = "147--155",
        BIBSOURCE = "http://www.visionbib.com/bibliography/other1024.html#TT372455"}

@article{bb378361,
        AUTHOR = "Skosan, M. and Mashao, D.J.",
        TITLE = "Modified Segmental Histogram Equalization for robust speaker
verification",
        JOURNAL = PRL,
        VOLUME = "27",
        YEAR = "2006",
        NUMBER = "5",
        MONTH = apr,
        PAGES = "479--486",
        BIBSOURCE = "http://www.visionbib.com/bibliography/other1024.html#TT372456"}

@article{bb378362,
        AUTHOR = "Ariyaeeinia, A.M. and Fortuna, J. and Sivakumaran, P. and Malegaonkar, A.",
        TITLE = "Verification effectiveness in open-set speaker identification",
        JOURNAL = VISP,
        VOLUME = "153",
        YEAR = "2006",
        NUMBER = "5",
        MONTH = oct,
        PAGES = "618--624",
        BIBSOURCE = "http://www.visionbib.com/bibliography/other1024.html#TT372457"}

@article{bb378363,
        AUTHOR = "Zhou, G. and Mikhael, W.B.",
        TITLE = "Speaker identification based on adaptive discriminative vector
quantisation",
        JOURNAL = VISP,
        VOLUME = "153",
        YEAR = "2006",
        NUMBER = "6",
        MONTH = dec,
        PAGES = "754--760",
        BIBSOURCE = "http://www.visionbib.com/bibliography/other1024.html#TT372458"}

@article{bb378364,
        AUTHOR = "Park, C.M. and Thapa, D. and Wang, G.N.",
        TITLE = "Speech authentication system using digital watermarking and pattern
recovery",
        JOURNAL = PRL,
        VOLUME = "28",
        YEAR = "2007",
        NUMBER = "8",
        MONTH = jun,
        PAGES = "931--938",
        BIBSOURCE = "http://www.visionbib.com/bibliography/other1024.html#TT372459"}

@article{bb378365,
        AUTHOR = "Faundez Zanuy, M. and Hagmuller, M. and Kubin, G.",
        TITLE = "Speaker identification security improvement by means of speech
watermarking",
        JOURNAL = PR,
        VOLUME = "40",
        YEAR = "2007",
        NUMBER = "11",
        MONTH = nov,
        PAGES = "3027--3034",
        BIBSOURCE = "http://www.visionbib.com/bibliography/other1024.html#TT372460"}

@article{bb378366,
        AUTHOR = "Chetouani, M. and Faundez Zanuy, M. and Gas, B. and Zarader, J.L.",
        TITLE = "Investigation on {LP}-residual representations for speaker identification",
        JOURNAL = PR,
        VOLUME = "42",
        YEAR = "2009",
        NUMBER = "3",
        MONTH = mar,
        PAGES = "487--494",
        BIBSOURCE = "http://www.visionbib.com/bibliography/other1024.html#TT372461"}

@article{bb378367,
        AUTHOR = "Kinnunen, T. and Saastamoinen, J. and Hautamaki, V. and Vinni, M. and Franti, P.",
        TITLE = "Comparative evaluation of maximum a Posteriori vector quantization and
{Gaussian} mixture models in speaker verification",
        JOURNAL = PRL,
        VOLUME = "30",
        YEAR = "2009",
        NUMBER = "4",
        MONTH = mar,
        PAGES = "341--347",
        BIBSOURCE = "http://www.visionbib.com/bibliography/other1024.html#TT372462"}

@article{bb378368,
        AUTHOR = "Chao, Y.H. and Tsai, W.H. and Wang, H.M. and Chang, R.C.",
        TITLE = "Improving the characterization of the alternative hypothesis via
minimum verification error training with applications to speaker
verification",
        JOURNAL = PR,
        VOLUME = "42",
        YEAR = "2009",
        NUMBER = "7",
        MONTH = jul,
        PAGES = "1351--1360",
        BIBSOURCE = "http://www.visionbib.com/bibliography/other1024.html#TT372463"}

@article{bb378369,
        AUTHOR = "Temko, A. and Nadeu, C.",
        TITLE = "Acoustic event detection in meeting-room environments",
        JOURNAL = PRL,
        VOLUME = "30",
        YEAR = "2009",
        NUMBER = "14",
        MONTH = oct,
        PAGES = "1281--1288",
        BIBSOURCE = "http://www.visionbib.com/bibliography/other1024.html#TT372464"}

@article{bb378370,
        AUTHOR = "Kim, S. and Ji, M.Y. and Kim, H.",
        TITLE = "Robust speaker recognition based on filtering in autocorrelation domain
and sub-band feature recombination",
        JOURNAL = PRL,
        VOLUME = "31",
        YEAR = "2010",
        NUMBER = "7",
        MONTH = may,
        PAGES = "593--599",
        BIBSOURCE = "http://www.visionbib.com/bibliography/other1024.html#TT372465"}

% NOTE(review): VOLUME "100" paired with YEAR "2013" looks inconsistent for
% this journal -- verify volume and year against the publisher record.
@article{bb378371,
        AUTHOR = "Li, H. and Ma, B. and Lee, K.A.",
        TITLE = "Spoken Language Recognition: From Fundamentals to Practice",
        JOURNAL = PIEEE,
        VOLUME = "100",
        YEAR = "2013",
        NUMBER = "5",
        MONTH = may,
        PAGES = "1136--1159",
        BIBSOURCE = "http://www.visionbib.com/bibliography/other1024.html#TT372466"}

@article{bb378372,
        AUTHOR = "Li, H. and Ma, B.",
        TITLE = "{TechWare}: Speaker and Spoken Language Recognition Resources",
        JOURNAL = SPMag,
        VOLUME = "27",
        YEAR = "2010",
        NUMBER = "6",
        PAGES = "139--142",
        BIBSOURCE = "http://www.visionbib.com/bibliography/other1024.html#TT372467"}

@article{bb378373,
        AUTHOR = "Ajmera, P.K. and Jadhav, D.V. and Holambe, R.S.",
        TITLE = "Text-independent speaker identification using {Radon} and discrete cosine
transforms based features from speech spectrogram",
        JOURNAL = PR,
        VOLUME = "44",
        YEAR = "2011",
        NUMBER = "10-11",
        MONTH = oct,
        PAGES = "2749--2759",
        BIBSOURCE = "http://www.visionbib.com/bibliography/other1024.html#TT372468"}

@article{bb378374,
        AUTHOR = "Kinnunen, T. and Sidoroff, I. and Tuononen, M. and Franti, P.",
        TITLE = "Comparison of clustering methods:
A case study of text-independent speaker modeling",
        JOURNAL = PRL,
        VOLUME = "32",
        YEAR = "2011",
        NUMBER = "13",
        MONTH = oct,
        PAGES = "1604--1617",
        BIBSOURCE = "http://www.visionbib.com/bibliography/other1024.html#TT372469"}

@inproceedings{bb378375,
        AUTHOR = "Kinnunen, T. and Karpov, E. and Franti, P.",
        TITLE = "A Speaker Pruning Algorithm for Real-Time Speaker Identification",
        BOOKTITLE = AVBPA03,
        YEAR = "2003",
        PAGES = "639--646",
        BIBSOURCE = "http://www.visionbib.com/bibliography/other1024.html#TT372470"}

@inproceedings{bb378376,
        AUTHOR = "Kinnunen, T. and Franti, P.",
        TITLE = "Speaker Discriminative Weighting Method for {VQ}-Based Speaker
Identification",
        BOOKTITLE = AVBPA01,
        YEAR = "2001",
        PAGES = "150",
        BIBSOURCE = "http://www.visionbib.com/bibliography/other1024.html#TT372471"}

@article{bb378377,
        AUTHOR = "Zao, L. and Coelho, R.",
        TITLE = "Colored Noise Based Multicondition Training Technique for Robust
Speaker Identification",
        JOURNAL = SPLetters,
        VOLUME = "18",
        YEAR = "2011",
        NUMBER = "11",
        MONTH = nov,
        PAGES = "675--678",
        BIBSOURCE = "http://www.visionbib.com/bibliography/other1024.html#TT372472"}

@article{bb378378,
        AUTHOR = "Hanilci, C. and Kinnunen, T. and Ertas, F. and Saeidi, R. and Pohjalainen, J. and Alku, P.",
        TITLE = "Regularized All-Pole Models for Speaker Verification Under Noisy
Environments",
        JOURNAL = SPLetters,
        VOLUME = "19",
        YEAR = "2012",
        NUMBER = "3",
        MONTH = mar,
        PAGES = "163--166",
        BIBSOURCE = "http://www.visionbib.com/bibliography/other1024.html#TT372473"}

@article{bb378379,
        AUTHOR = "Salamin, H. and Vinciarelli, A.",
        TITLE = "Automatic Role Recognition in Multiparty Conversations: An Approach
Based on Turn Organization, Prosody, and Conditional Random Fields",
        JOURNAL = MultMed,
        VOLUME = "14",
        YEAR = "2012",
        NUMBER = "2",
        PAGES = "338--345",
        BIBSOURCE = "http://www.visionbib.com/bibliography/other1024.html#TT372474"}

@article{bb378380,
        AUTHOR = "Tang, H. and Chu, S. and Hasegawa Johnson, M. and Huang, T.S.",
        TITLE = "Partially Supervised Speaker Clustering",
        JOURNAL = PAMI,
        VOLUME = "34",
        YEAR = "2012",
        NUMBER = "5",
        MONTH = may,
        PAGES = "959--971",
        BIBSOURCE = "http://www.visionbib.com/bibliography/other1024.html#TT372475"}

@article{bb378381,
        AUTHOR = "Montalvao, J. and Araujo, M.R.R.",
        TITLE = "Is masking a relevant aspect lacking in {MFCC}? A speaker verification
perspective",
        JOURNAL = PRL,
        VOLUME = "33",
        YEAR = "2012",
        NUMBER = "16",
        MONTH = dec,
        PAGES = "2156--2165",
        BIBSOURCE = "http://www.visionbib.com/bibliography/other1024.html#TT372476"}

@article{bb378382,
        AUTHOR = "Garimella, S. and Mallidi, S.H. and Hermansky, H.",
        TITLE = "Regularized Auto-Associative Neural Networks for Speaker Verification",
        JOURNAL = SPLetters,
        VOLUME = "19",
        YEAR = "2012",
        NUMBER = "12",
        MONTH = dec,
        PAGES = "841--844",
        BIBSOURCE = "http://www.visionbib.com/bibliography/other1024.html#TT372477"}

% Title braces: keep the acronym MFCC capitalised under styles that
% sentence-case article titles.
@article{bb378383,
        AUTHOR = "Sahidullah, M. and Saha, G.",
        TITLE = "A Novel Windowing Technique for Efficient Computation of {MFCC} for
Speaker Recognition",
        JOURNAL = SPLetters,
        VOLUME = "20",
        YEAR = "2013",
        NUMBER = "2",
        MONTH = "February",
        PAGES = "149-152",
        BIBSOURCE = "http://www.visionbib.com/bibliography/other1024.html#TT372478"}

% Title braces: keep the acronym TV capitalised under styles that
% sentence-case article titles.
@article{bb378384,
        AUTHOR = "Vallet, F. and Essid, S. and Carrive, J.",
        TITLE = "A Multimodal Approach to Speaker Diarization on {TV} Talk-Shows",
        JOURNAL = MultMed,
        VOLUME = "15",
        YEAR = "2013",
        NUMBER = "3",
        PAGES = "509-520",
        BIBSOURCE = "http://www.visionbib.com/bibliography/other1024.html#TT372479"}

@article{bb378385,
  author    = {Inthavisas, K. and Lopresti, D.},
  title     = {Secure speech biometric templates for user authentication},
  journal   = IET-Bio,
  volume    = {1},
  number    = {1},
  month     = {March},
  year      = {2012},
  pages     = {46-54},
  bibsource = {http://www.visionbib.com/bibliography/other1024.html#TT372480}
}

@article{bb378386,
  author    = {Pillay, S. and Ariyaeeinia, A. and Sivakumaran, P. and Pawlewski, M.},
  title     = {Effective speaker verification via dynamic mismatch compensation},
  journal   = IET-Bio,
  volume    = {1},
  number    = {2},
  month     = {June},
  year      = {2012},
  pages     = {130-135},
  bibsource = {http://www.visionbib.com/bibliography/other1024.html#TT372481}
}

% Title braces: keep the acronym GFM fully capitalised; without them a
% sentence-casing style preserves only the first letter of the title.
@article{bb378387,
        AUTHOR = "Bhardwaj, S. and Srivastava, S. and Hanmandlu, M. and Gupta, J.R.P.",
        TITLE = "{GFM}-Based Methods for Speaker Identification",
        JOURNAL = Cyber,
        VOLUME = "43",
        YEAR = "2013",
        NUMBER = "3",
        PAGES = "1047-1058",
        BIBSOURCE = "http://www.visionbib.com/bibliography/other1024.html#TT372482"}

@article{bb378388,
  author    = {Pekhovsky, T. and Sizov, A.},
  title     = {Comparison between supervised and unsupervised learning of probabilistic linear discriminant analysis mixture models for speaker verification},
  journal   = PRL,
  volume    = {34},
  number    = {11},
  month     = {August},
  year      = {2013},
  pages     = {1307-1313},
  bibsource = {http://www.visionbib.com/bibliography/other1024.html#TT372483}
}

@article{bb378389,
  author    = {Yaman, S. and Pelecanos, J.},
  title     = {Using Polynomial Kernel Support Vector Machines for Speaker Verification},
  journal   = SPLetters,
  volume    = {20},
  number    = {9},
  year      = {2013},
  pages     = {901-904},
  bibsource = {http://www.visionbib.com/bibliography/other1024.html#TT372484}
}

@article{bb378390,
  author    = {Bin Amin, T. and Marziliano, P. and German, J.S.},
  title     = {Glottal and Vocal Tract Characteristics of Voice Impersonators},
  journal   = MultMed,
  volume    = {16},
  number    = {3},
  month     = {April},
  year      = {2014},
  pages     = {668-678},
  bibsource = {http://www.visionbib.com/bibliography/other1024.html#TT372485}
}

@article{bb378391,
  author    = {Sarkar, A.K. and Do, C.T. and Le, V.B. and Barras, C.},
  title     = {Combination of Cepstral and Phonetically Discriminative Features for Speaker Verification},
  journal   = SPLetters,
  volume    = {21},
  number    = {9},
  month     = {September},
  year      = {2014},
  pages     = {1040-1044},
  bibsource = {http://www.visionbib.com/bibliography/other1024.html#TT372486}
}

% Title braces: keep the proper adjective Gaussian capitalised under styles
% that sentence-case article titles.
@article{bb378392,
        AUTHOR = "Yang, H. and Xu, Y. and Huang, H. and Zhou, R. and Yan, Y.",
        TITLE = "Voice biometrics using linear {Gaussian} model",
        JOURNAL = IET-Bio,
        VOLUME = "3",
        YEAR = "2014",
        NUMBER = "1",
        MONTH = "March",
        PAGES = "9-15",
        BIBSOURCE = "http://www.visionbib.com/bibliography/other1024.html#TT372487"}

@article{bb378393,
  author    = {Ribas Gonzalez, D. and Calvo de Lara, J.R.},
  title     = {Feature classification criterion for missing features mask estimation in robust speaker recognition},
  journal   = SIViP,
  volume    = {8},
  number    = {2},
  month     = {February},
  year      = {2014},
  pages     = {365-375},
  bibsource = {http://www.visionbib.com/bibliography/other1024.html#TT372488}
}

@article{bb378394,
  author    = {Hernandez Sierra, G. and Calvo, J.R. and Bonastre, J.F. and Bousquet, P.M.},
  title     = {Session compensation using binary speech representation for speaker recognition},
  journal   = PRL,
  volume    = {49},
  number    = {1},
  year      = {2014},
  pages     = {17-23},
  bibsource = {http://www.visionbib.com/bibliography/other1024.html#TT372489}
}

% Author names: the second and fifth authors are written with the same
% compound surnames used by neighbouring entries in this file
% (Ribas Gonzalez, D.; Calvo de Lara, J.R.) so that they sort and index
% together. NOTE(review): the remaining three names may have the same
% surname/initial mis-split; verify against the proceedings before changing.
@inproceedings{bb378395,
        AUTHOR = "Lainez, J.E.G. and Ribas Gonzalez, D. and Artiaga, A.M. and Solano, E.L. and Calvo de Lara, J.R.",
        TITLE = "Beam-search Formant Tracking Algorithm Based on Trajectory Functions
for Continuous Speech",
        BOOKTITLE = CIARP12,
        YEAR = "2012",
        PAGES = "749-756",
        BIBSOURCE = "http://www.visionbib.com/bibliography/other1024.html#TT372490"}

@inproceedings{bb378396,
  author    = {Reyes Diaz, F.J. and Calvo de Lara, J.R. and Hernandez Sierra, G.},
  title     = {Gaussian Selection for Speaker Recognition Using Cumulative Vectors},
  booktitle = CIARP12,
  year      = {2012},
  pages     = {724-731},
  bibsource = {http://www.visionbib.com/bibliography/other1024.html#TT372491}
}

@inproceedings{bb378397,
  author    = {Hernandez Sierra, G. and Calvo de Lara, J.R. and Bonastre, J.F.},
  title     = {Temporal Information in a Binary Framework for Speaker Recognition},
  booktitle = CIARP14,
  year      = {2014},
  pages     = {207-213},
  bibsource = {http://www.visionbib.com/bibliography/other1024.html#TT372492}
}

@inproceedings{bb378398,
  author    = {Hernandez Sierra, G. and Bonastre, J.F. and Calvo de Lara, J.R.},
  title     = {Speaker Recognition Using a Binary Representation and Specificities Models},
  booktitle = CIARP12,
  year      = {2012},
  pages     = {732-739},
  bibsource = {http://www.visionbib.com/bibliography/other1024.html#TT372493}
}

@article{bb378399,
  author    = {Pohjalainen, J. and Hanilci, C. and Kinnunen, T. and Alku, P.},
  title     = {Mixture Linear Prediction in Speaker Verification Under Vocal Effort Mismatch},
  journal   = SPLetters,
  volume    = {21},
  number    = {12},
  month     = {December},
  year      = {2014},
  pages     = {1516-1520},
  bibsource = {http://www.visionbib.com/bibliography/other1024.html#TT372494}
}

Last update: Apr 6, 2026 at 11:28:57