@article{bb378300,
AUTHOR = "Haji Ali, M. and Menapace, W. and Siarohin, A. and Balakrishnan, G. and Ordonez, V.",
TITLE = "Taming Data and Transformers for Audio Generation",
JOURNAL = IJCV,
VOLUME = "134",
YEAR = "2026",
NUMBER = "1",
MONTH = jan,
PAGES = "87",
BIBSOURCE = "http://www.visionbib.com/bibliography/other1024ss1.html#TT372395"}
@inproceedings{bb378301,
AUTHOR = "Liu, J. and Geddes, J. and Guo, Z. Y. and Jiang, H. and Nandwana, M. K.",
TITLE = "{Smooth Cache}: A Universal Inference Acceleration Technique for
Diffusion Transformers",
BOOKTITLE = LargeVM25,
YEAR = "2025",
PAGES = "3220--3229",
BIBSOURCE = "http://www.visionbib.com/bibliography/other1024ss1.html#TT372396"}
@inproceedings{bb378302,
AUTHOR = "Kushwaha, S. S. and Tian, Y. P.",
TITLE = "{VinTAGe}: Joint Video and Text Conditioning for Holistic Audio
Generation",
BOOKTITLE = CVPR25,
YEAR = "2025",
PAGES = "13529--13539",
BIBSOURCE = "http://www.visionbib.com/bibliography/other1024ss1.html#TT372397"}
@inproceedings{bb378303,
AUTHOR = "Kim, J. H. and Choi, J. and Kim, J. H. and Jung, C. and Chung, J. S.",
TITLE = "From Faces to Voices: Learning Hierarchical Representations for
High-quality Video-to-Speech",
BOOKTITLE = CVPR25,
YEAR = "2025",
PAGES = "15874--15884",
BIBSOURCE = "http://www.visionbib.com/bibliography/other1024ss1.html#TT372398"}
@inproceedings{bb378304,
AUTHOR = "Cong, G. X. and Pan, J. and Li, L. and Qi, Y. K. and Peng, Y. X. and van den Hengel, A. J. and Yang, J. and Huang, Q. M.",
TITLE = "{EmoDubber}: Towards High Quality and Emotion Controllable Movie
Dubbing",
BOOKTITLE = CVPR25,
YEAR = "2025",
PAGES = "15863--15873",
BIBSOURCE = "http://www.visionbib.com/bibliography/other1024ss1.html#TT372399"}
@inproceedings{bb378305,
AUTHOR = "Zhang, Z. D. and Li, L. and Yan, C. G. and Liu, C. S. and van den Hengel, A. J. and Qi, Y. K.",
TITLE = "Prosody-Enhanced Acoustic Pre-training and Acoustic-Disentangled
Prosody Adapting for Movie Dubbing",
BOOKTITLE = CVPR25,
YEAR = "2025",
PAGES = "172--182",
BIBSOURCE = "http://www.visionbib.com/bibliography/other1024ss1.html#TT372400"}
@inproceedings{bb378306,
AUTHOR = "Rai, A. and Sridhar, S.",
TITLE = "{EgoSonics}: Generating Synchronized Audio for Silent Egocentric Videos",
BOOKTITLE = WACV25,
YEAR = "2025",
PAGES = "4935--4946",
BIBSOURCE = "http://www.visionbib.com/bibliography/other1024ss1.html#TT372401"}
@inproceedings{bb378307,
AUTHOR = "Yadav, A. K. S. and Bhagtani, K. and Salvi, D. and Bestagini, P. and Delp, E. J.",
TITLE = "{FairSSD}: Understanding Bias in Synthetic Speech Detectors",
BOOKTITLE = WMF24,
YEAR = "2024",
PAGES = "4418--4428",
BIBSOURCE = "http://www.visionbib.com/bibliography/other1024ss1.html#TT372402"}
@inproceedings{bb378308,
AUTHOR = "Cuccovillo, L. and Gerhardt, M. and Aichroth, P.",
TITLE = "Audio Transformer for Synthetic Speech Detection via Multi-Formant
Analysis",
BOOKTITLE = WMF24,
YEAR = "2024",
PAGES = "4409--4417",
BIBSOURCE = "http://www.visionbib.com/bibliography/other1024ss1.html#TT372403"}
@inproceedings{bb378309,
AUTHOR = "Cong, G. X. and Li, L. and Qi, Y. K. and Zha, Z. J. and Wu, Q. and Wang, W. Y. and Jiang, B. and Yang, M. H. and Huang, Q. M.",
TITLE = "Learning to Dub Movies via Hierarchical Prosody Models",
BOOKTITLE = CVPR23,
YEAR = "2023",
PAGES = "14687--14697",
BIBSOURCE = "http://www.visionbib.com/bibliography/other1024ss1.html#TT372404"}
@inproceedings{bb378310,
AUTHOR = "Hsu, W. N. and Remez, T. and Shi, B. and Donley, J. and Adi, Y.",
TITLE = "{ReVISE}: Self-Supervised Speech Resynthesis with Visual Input for
Universal and Generalized Speech Regeneration",
BOOKTITLE = CVPR23,
YEAR = "2023",
PAGES = "18796--18806",
BIBSOURCE = "http://www.visionbib.com/bibliography/other1024ss1.html#TT372405"}
@inproceedings{bb378311,
AUTHOR = "Sun, C. Z. and Jia, S. and Hou, S. W. and Lyu, S. W.",
TITLE = "{AI}-Synthesized Voice Detection Using Neural Vocoder Artifacts",
BOOKTITLE = WMF23,
YEAR = "2023",
PAGES = "904--912",
BIBSOURCE = "http://www.visionbib.com/bibliography/other1024ss1.html#TT372406"}
@inproceedings{bb378312,
AUTHOR = "Noufi, C. and May, L. and Berger, J.",
TITLE = "The Role of Vocal Persona in Natural and Synthesized Speech",
BOOKTITLE = FG23,
YEAR = "2023",
PAGES = "1--4",
BIBSOURCE = "http://www.visionbib.com/bibliography/other1024ss1.html#TT372407"}
@inproceedings{bb378313,
AUTHOR = "Hwang, I. S. and Lee, S. H. and Lee, S. W.",
TITLE = "{StyleVC}: Non-Parallel Voice Conversion with Adversarial Style
Generalization",
BOOKTITLE = "ICPR22",
YEAR = "2022",
PAGES = "23--30",
BIBSOURCE = "http://www.visionbib.com/bibliography/other1024ss1.html#TT372408"}
@inproceedings{bb378314,
AUTHOR = "Wang, W. B. and Song, Y. and Jha, S.",
TITLE = "Autolv: Automatic Lecture Video Generator",
BOOKTITLE = ICIP22,
YEAR = "2022",
PAGES = "1086--1090",
BIBSOURCE = "http://www.visionbib.com/bibliography/other1024ss1.html#TT372409"}
@inproceedings{bb378315,
AUTHOR = "Borzi, S. and Giudice, O. and Stanco, F. and Allegra, D.",
TITLE = "Is synthetic voice detection research going into the right direction?",
BOOKTITLE = WMF22,
YEAR = "2022",
PAGES = "71--80",
BIBSOURCE = "http://www.visionbib.com/bibliography/other1024ss1.html#TT372410"}
@inproceedings{bb378316,
AUTHOR = "Hassid, M. and Ramanovich, M. T. and Shillingford, B. and Wang, M. and Jia, Y. and Remez, T.",
TITLE = "More than Words: In-the-Wild Visually-Driven Prosody for
Text-to-Speech",
BOOKTITLE = CVPR22,
YEAR = "2022",
PAGES = "10577--10587",
BIBSOURCE = "http://www.visionbib.com/bibliography/other1024ss1.html#TT372411"}
@inproceedings{bb378317,
AUTHOR = "Kwak, I. Y. and Kwag, S. and Lee, J. and Huh, J. H. and Lee, C. H. and Jeon, Y. B. and Hwang, J. H. and Yoon, J. W.",
TITLE = "{ResMax}: Detecting Voice Spoofing Attacks with Residual Network and
Max Feature Map",
BOOKTITLE = ICPR21,
YEAR = "2021",
PAGES = "4837--4844",
BIBSOURCE = "http://www.visionbib.com/bibliography/other1024ss1.html#TT372412"}
@inproceedings{bb378318,
AUTHOR = "Wang, D. H. and Wang, R. and Dong, L. and Yan, D. and Ren, Y. M.",
TITLE = "Efficient Generation of Speech Adversarial Examples with Generative
Model",
BOOKTITLE = IWDW20,
YEAR = "2020",
PAGES = "251--264",
BIBSOURCE = "http://www.visionbib.com/bibliography/other1024ss1.html#TT372413"}
@inproceedings{bb378319,
AUTHOR = "Zhou, H. and Liu, Z. and Xu, X. and Luo, P. and Wang, X.",
TITLE = "Vision-Infused Deep Audio Inpainting",
BOOKTITLE = ICCV19,
YEAR = "2019",
PAGES = "283--292",
BIBSOURCE = "http://www.visionbib.com/bibliography/other1024ss1.html#TT372414"}
@inproceedings{bb378320,
AUTHOR = "Bailer, W. and Wijnants, M. and Lievens, H. and Claes, S.",
TITLE = "Multimedia Analytics Challenges and Opportunities for Creating
Interactive Radio Content",
BOOKTITLE = MMMod20,
VOLUME = "II",
YEAR = "2020",
PAGES = "375--387",
BIBSOURCE = "http://www.visionbib.com/bibliography/other1024ss1.html#TT372415"}
@inproceedings{bb378321,
AUTHOR = "Huang, T. and Wang, H. X. and Chen, Y. and He, P. S.",
TITLE = "{GRU-SVM} Model for Synthetic Speech Detection",
BOOKTITLE = IWDW19,
YEAR = "2019",
PAGES = "115--125",
BIBSOURCE = "http://www.visionbib.com/bibliography/other1024ss1.html#TT372416"}
@inproceedings{bb378322,
AUTHOR = "Wong, A. and Xu, A. and Dudek, G.",
TITLE = "Investigating Trust Factors in Human-Robot Shared Control:
Implicit Gender Bias Around Robot Voice",
BOOKTITLE = CRV19,
YEAR = "2019",
PAGES = "195--200",
BIBSOURCE = "http://www.visionbib.com/bibliography/other1024ss1.html#TT372417"}
@inproceedings{bb378323,
AUTHOR = "Xiao, L. and Wang, Z.",
TITLE = "Dense Convolutional Recurrent Neural Network for Generalized Speech
Animation",
BOOKTITLE = ICPR18,
YEAR = "2018",
PAGES = "633--638",
BIBSOURCE = "http://www.visionbib.com/bibliography/other1024ss1.html#TT372418"}
@inproceedings{bb378324,
AUTHOR = "Shah, N. J. and Patil, H. A.",
TITLE = "Analysis of Features and Metrics for Alignment in Text-Dependent Voice
Conversion",
BOOKTITLE = PReMI17,
YEAR = "2017",
PAGES = "299--307",
BIBSOURCE = "http://www.visionbib.com/bibliography/other1024ss1.html#TT372419"}
@inproceedings{bb378325,
AUTHOR = "Rybarova, R. and Drozd, I. and Rozinaj, G.",
TITLE = "{GUI} for interactive speech synthesis",
BOOKTITLE = WSSIP16,
YEAR = "2016",
PAGES = "1--4",
BIBSOURCE = "http://www.visionbib.com/bibliography/other1024ss1.html#TT372420"}
@inproceedings{bb378326,
AUTHOR = "Coto Jimenez, M. and Goddard Close, J.",
TITLE = "{LSTM} Deep Neural Networks Postfiltering for Improving the Quality of
Synthetic Voices",
BOOKTITLE = MCPR16,
YEAR = "2016",
PAGES = "280--289",
BIBSOURCE = "http://www.visionbib.com/bibliography/other1024ss1.html#TT372421"}
@inproceedings{bb378327,
AUTHOR = "Vasek, M. and Rozinaj, G. and Rybarova, R.",
TITLE = "Letter-To-Sound conversion for speech synthesizer",
BOOKTITLE = WSSIP16,
YEAR = "2016",
PAGES = "1--4",
BIBSOURCE = "http://www.visionbib.com/bibliography/other1024ss1.html#TT372422"}
@inproceedings{bb378328,
AUTHOR = "Rybarova, R. and del Corral, G. and Rozinaj, G.",
TITLE = "Diphone {Spanish} text-to-speech synthesizer",
BOOKTITLE = WSSIP15,
YEAR = "2015",
PAGES = "121--124",
BIBSOURCE = "http://www.visionbib.com/bibliography/other1024ss1.html#TT372423"}
@inproceedings{bb378329,
AUTHOR = "Verma, R. and Sarkar, P. and Rao, K. S.",
TITLE = "Conversion of neutral speech to storytelling style speech",
BOOKTITLE = ICAPR15,
YEAR = "2015",
PAGES = "1--6",
BIBSOURCE = "http://www.visionbib.com/bibliography/other1024ss1.html#TT372424"}
@inproceedings{bb378330,
AUTHOR = "Narendra, N. P. and Rao, K. S.",
TITLE = "Optimal residual frame based source modeling for {HMM}-based speech
synthesis",
BOOKTITLE = ICAPR15,
YEAR = "2015",
PAGES = "1--5",
BIBSOURCE = "http://www.visionbib.com/bibliography/other1024ss1.html#TT372425"}
@inproceedings{bb378331,
AUTHOR = "Wang, Y. and Tao, J. H. and Yang, M. H. and Li, Y.",
TITLE = "Extended Decision Tree with or Relationship for {HMM}-Based Speech
Synthesis",
BOOKTITLE = ACPR13,
YEAR = "2013",
PAGES = "225--229",
BIBSOURCE = "http://www.visionbib.com/bibliography/other1024ss1.html#TT372426"}
@inproceedings{bb378332,
AUTHOR = "Gao, L. and Yu, H. Z. and Zhang, J. H. and Fang, H. P.",
TITLE = "Research on {HMM}\_based speech synthesis for {Lhasa} dialect",
BOOKTITLE = IASP11,
YEAR = "2011",
PAGES = "429--433",
BIBSOURCE = "http://www.visionbib.com/bibliography/other1024ss1.html#TT372427"}
@inproceedings{bb378333,
AUTHOR = "Chakraborty, R. and Garain, U.",
TITLE = "Role of Synthetically Generated Samples on Speech Recognition in a
Resource-Scarce Language",
BOOKTITLE = ICPR10,
YEAR = "2010",
PAGES = "1618--1621",
BIBSOURCE = "http://www.visionbib.com/bibliography/other1024ss1.html#TT372428"}
@inproceedings{bb378334,
AUTHOR = "Rao, K. S. and Maity, S. and Taru, A. and Koolagudi, S. G.",
TITLE = "Unit Selection Using Linguistic, Prosodic and Spectral Distance for
Developing Text-to-Speech System in {Hindi}",
BOOKTITLE = PReMI09,
YEAR = "2009",
PAGES = "531--536",
BIBSOURCE = "http://www.visionbib.com/bibliography/other1024ss1.html#TT372429"}
@inproceedings{bb378335,
AUTHOR = "Bahrampour, A. and Barkhoda, W. and Azami, B. Z.",
TITLE = "Implementation of Three Text to Speech Systems for {Kurdish} Language",
BOOKTITLE = CIARP09,
YEAR = "2009",
PAGES = "321--328",
BIBSOURCE = "http://www.visionbib.com/bibliography/other1024ss1.html#TT372430"}
@inproceedings{bb378336,
AUTHOR = "Shirbahadurkar, S. D. and Bormane, D. S.",
TITLE = "{Marathi} Language Speech Synthesizer Using Concatenative Synthesis
Strategy (Spoken in {Maharashtra}, {India})",
BOOKTITLE = ICMV09,
YEAR = "2009",
PAGES = "181--185",
BIBSOURCE = "http://www.visionbib.com/bibliography/other1024ss1.html#TT372431"}
@inproceedings{bb378337,
AUTHOR = "Tuckova, J. and Holub, J. and Dubeda, T.",
TITLE = "Technical and Phonetic Aspects of Speech Quality Assessment:
The Case of Prosody Synthesis",
BOOKTITLE = COST08,
YEAR = "2008",
PAGES = "126--132",
BIBSOURCE = "http://www.visionbib.com/bibliography/other1024ss1.html#TT372432"}
@inproceedings{bb378338,
AUTHOR = "Bauer, D. and Kannampuzha, J. and Kroger, B. J.",
TITLE = "Articulatory Speech Re-synthesis:
Profiting from Natural Acoustic Speech Data",
BOOKTITLE = COST08,
YEAR = "2008",
PAGES = "344--355",
BIBSOURCE = "http://www.visionbib.com/bibliography/other1024ss1.html#TT372433"}
@inproceedings{bb378339,
AUTHOR = "Gu, H. Y. and Cai, C. L. and Cai, S. F.",
TITLE = "An {HNM}-Based Speaker-Nonspecific Timbre Transformation Scheme for
Speech Synthesis",
BOOKTITLE = CISP09,
YEAR = "2009",
PAGES = "1--5",
BIBSOURCE = "http://www.visionbib.com/bibliography/other1024ss1.html#TT372434"}
@article{bb378340,
AUTHOR = "Lung, S. Y. and Chen, C. C. T.",
TITLE = "A new approach for text-independent speaker recognition",
JOURNAL = PR,
VOLUME = "33",
YEAR = "2000",
NUMBER = "8",
MONTH = aug,
PAGES = "1401--1403",
BIBSOURCE = "http://www.visionbib.com/bibliography/other1024.html#TT372435"}
@article{bb378341,
AUTHOR = "Lung, S. Y.",
TITLE = "Multi-resolution form of {SVD} for text-independent speaker recognition",
JOURNAL = PR,
VOLUME = "35",
YEAR = "2002",
NUMBER = "7",
MONTH = jul,
PAGES = "1637--1639",
BIBSOURCE = "http://www.visionbib.com/bibliography/other1024.html#TT372436"}
@article{bb378342,
AUTHOR = "Lung, S. Y.",
TITLE = "Further reduced form of wavelet feature for text independent speaker
recognition",
JOURNAL = PR,
VOLUME = "37",
YEAR = "2004",
NUMBER = "7",
MONTH = jul,
PAGES = "1565--1566",
BIBSOURCE = "http://www.visionbib.com/bibliography/other1024.html#TT372437"}
@article{bb378343,
AUTHOR = "Lung, S. Y.",
TITLE = "Feature extracted from wavelet eigenfunction estimation for
text-independent speaker recognition",
JOURNAL = PR,
VOLUME = "37",
YEAR = "2004",
NUMBER = "7",
MONTH = jul,
PAGES = "1543--1544",
BIBSOURCE = "http://www.visionbib.com/bibliography/other1024.html#TT372438"}
@article{bb378344,
AUTHOR = "Lung, S. Y.",
TITLE = "Wavelet feature domain adaptive noise reduction using learning
algorithm for text-independent speaker recognition",
JOURNAL = PR,
VOLUME = "40",
YEAR = "2007",
NUMBER = "9",
MONTH = sep,
PAGES = "2603--2606",
BIBSOURCE = "http://www.visionbib.com/bibliography/other1024.html#TT372439"}
@article{bb378345,
AUTHOR = "Lung, S. Y.",
TITLE = "Efficient text independent speaker recognition with wavelet feature
selection based multilayered neural network using supervised learning
algorithm",
JOURNAL = PR,
VOLUME = "40",
YEAR = "2007",
NUMBER = "12",
MONTH = dec,
PAGES = "3616--3620",
BIBSOURCE = "http://www.visionbib.com/bibliography/other1024.html#TT372440"}
@article{bb378346,
AUTHOR = "Lung, S. Y.",
TITLE = "Distributed genetic algorithm for {Gaussian} mixture model based speaker
identification",
JOURNAL = PR,
VOLUME = "36",
YEAR = "2003",
NUMBER = "10",
MONTH = oct,
PAGES = "2479--2481",
BIBSOURCE = "http://www.visionbib.com/bibliography/other1024.html#TT372441"}
@article{bb378347,
AUTHOR = "Lung, S. Y.",
TITLE = "Adaptive fuzzy wavelet algorithm for text-independent speaker
recognition",
JOURNAL = PR,
VOLUME = "37",
YEAR = "2004",
NUMBER = "10",
MONTH = oct,
PAGES = "2095--2096",
BIBSOURCE = "http://www.visionbib.com/bibliography/other1024.html#TT372442"}
@article{bb378348,
AUTHOR = "Lung, S. Y.",
TITLE = "Wavelet feature selection based neural networks with application to the
text independent speaker identification",
JOURNAL = PR,
VOLUME = "39",
YEAR = "2006",
NUMBER = "8",
MONTH = aug,
PAGES = "1518--1521",
BIBSOURCE = "http://www.visionbib.com/bibliography/other1024.html#TT372443"}
@article{bb378349,
AUTHOR = "Lung, S. Y.",
TITLE = "Feature extracted from wavelet decomposition using biorthogonal {Riesz}
basis for text-independent speaker recognition",
JOURNAL = PR,
VOLUME = "41",
YEAR = "2008",
NUMBER = "10",
MONTH = oct,
PAGES = "3068--3070",
BIBSOURCE = "http://www.visionbib.com/bibliography/other1024.html#TT372444"}
@article{bb378350,
AUTHOR = "Chen, K. and Wu, T. Y. and Zhang, H. J.",
TITLE = "On the use of nearest feature line for speaker identification",
JOURNAL = PRL,
VOLUME = "23",
YEAR = "2002",
NUMBER = "14",
MONTH = dec,
PAGES = "1735--1746",
BIBSOURCE = "http://www.visionbib.com/bibliography/other1024.html#TT372445"}
@article{bb378351,
AUTHOR = "Ramachandran, R. P. and Farrell, K. R. and Ramachandran, R. and Mammone, R. J.",
TITLE = "Speaker recognition:
general classifier approaches and data fusion methods",
JOURNAL = PR,
VOLUME = "35",
YEAR = "2002",
NUMBER = "12",
MONTH = dec,
PAGES = "2801--2821",
BIBSOURCE = "http://www.visionbib.com/bibliography/other1024.html#TT372446"}
@article{bb378352,
AUTHOR = "Chen, K.",
TITLE = "Towards better making a decision in speaker verification",
JOURNAL = PR,
VOLUME = "36",
YEAR = "2003",
NUMBER = "2",
MONTH = feb,
PAGES = "329--346",
BIBSOURCE = "http://www.visionbib.com/bibliography/other1024.html#TT372447"}
@article{bb378353,
AUTHOR = "Rodriguez Linares, L. and Garcia Mateo, C. and Alba Castro, J. L.",
TITLE = "On combining classifiers for speaker authentication",
JOURNAL = PR,
VOLUME = "36",
YEAR = "2003",
NUMBER = "2",
MONTH = feb,
PAGES = "347--359",
BIBSOURCE = "http://www.visionbib.com/bibliography/other1024.html#TT372448"}
@article{bb378354,
AUTHOR = "Damper, R. I. and Higgins, J. E.",
TITLE = "Improving speaker identification in noise by subband processing and
decision fusion",
JOURNAL = PRL,
VOLUME = "24",
YEAR = "2003",
NUMBER = "13",
MONTH = sep,
PAGES = "2167--2173",
BIBSOURCE = "http://www.visionbib.com/bibliography/other1024.html#TT372449"}
@article{bb378355,
AUTHOR = "Besacier, L. and Mayorga, P. and Bonastre, J. F. and Fredouille, C. and Meignier, S.",
TITLE = "Overview of compression and packet loss effects in speech biometrics",
JOURNAL = VISP,
VOLUME = "150",
YEAR = "2003",
NUMBER = "6",
MONTH = dec,
PAGES = "372--376",
BIBSOURCE = "http://www.visionbib.com/bibliography/other1024.html#TT372450"}
@inproceedings{bb378356,
AUTHOR = "Besacier, L. and Bonastre, J. F.",
TITLE = "Time and frequency pruning for speaker identification",
BOOKTITLE = ICPR98,
VOLUME = "II",
YEAR = "1998",
PAGES = "1619--1621",
BIBSOURCE = "http://www.visionbib.com/bibliography/other1024.html#TT372451"}
@article{bb378357,
AUTHOR = "Rodriguez Linares, L. and Garcia Mateo, C.",
TITLE = "Application of fusion techniques to speaker authentication over {IP}
networks",
JOURNAL = VISP,
VOLUME = "150",
YEAR = "2003",
NUMBER = "6",
MONTH = dec,
PAGES = "377--382",
BIBSOURCE = "http://www.visionbib.com/bibliography/other1024.html#TT372452"}
@article{bb378358,
AUTHOR = "Chen, C. C. T. and Chen, C. T. and Hou, C. K.",
TITLE = "Speaker identification using hybrid {Karhunen-Loeve} transform and
{Gaussian} mixture model approach",
JOURNAL = PR,
VOLUME = "37",
YEAR = "2004",
NUMBER = "5",
MONTH = may,
PAGES = "1073--1075",
BIBSOURCE = "http://www.visionbib.com/bibliography/other1024.html#TT372453"}
@article{bb378359,
AUTHOR = "Lee, K. Y.",
TITLE = "Local fuzzy {PCA} based {GMM} with dimension reduction on speaker
identification",
JOURNAL = PRL,
VOLUME = "25",
YEAR = "2004",
NUMBER = "16",
MONTH = dec,
PAGES = "1811--1817",
BIBSOURCE = "http://www.visionbib.com/bibliography/other1024.html#TT372454"}
@article{bb378360,
AUTHOR = "Mashao, D. J. and Skosan, M.",
TITLE = "Combining classifier decisions for robust speaker identification",
JOURNAL = PR,
VOLUME = "39",
YEAR = "2006",
NUMBER = "1",
MONTH = jan,
PAGES = "147--155",
BIBSOURCE = "http://www.visionbib.com/bibliography/other1024.html#TT372455"}
@article{bb378361,
AUTHOR = "Skosan, M. and Mashao, D. J.",
TITLE = "Modified Segmental Histogram Equalization for robust speaker
verification",
JOURNAL = PRL,
VOLUME = "27",
YEAR = "2006",
NUMBER = "5",
MONTH = apr,
PAGES = "479--486",
BIBSOURCE = "http://www.visionbib.com/bibliography/other1024.html#TT372456"}
@article{bb378362,
AUTHOR = "Ariyaeeinia, A. M. and Fortuna, J. and Sivakumaran, P. and Malegaonkar, A.",
TITLE = "Verification effectiveness in open-set speaker identification",
JOURNAL = VISP,
VOLUME = "153",
YEAR = "2006",
NUMBER = "5",
MONTH = oct,
PAGES = "618--624",
BIBSOURCE = "http://www.visionbib.com/bibliography/other1024.html#TT372457"}
@article{bb378363,
AUTHOR = "Zhou, G. and Mikhael, W. B.",
TITLE = "Speaker identification based on adaptive discriminative vector
quantisation",
JOURNAL = VISP,
VOLUME = "153",
YEAR = "2006",
NUMBER = "6",
MONTH = dec,
PAGES = "754--760",
BIBSOURCE = "http://www.visionbib.com/bibliography/other1024.html#TT372458"}
@article{bb378364,
AUTHOR = "Park, C. M. and Thapa, D. and Wang, G. N.",
TITLE = "Speech authentication system using digital watermarking and pattern
recovery",
JOURNAL = PRL,
VOLUME = "28",
YEAR = "2007",
NUMBER = "8",
MONTH = jun,
PAGES = "931--938",
BIBSOURCE = "http://www.visionbib.com/bibliography/other1024.html#TT372459"}
@article{bb378365,
AUTHOR = "Faundez Zanuy, M. and Hagmuller, M. and Kubin, G.",
TITLE = "Speaker identification security improvement by means of speech
watermarking",
JOURNAL = PR,
VOLUME = "40",
YEAR = "2007",
NUMBER = "11",
MONTH = nov,
PAGES = "3027--3034",
BIBSOURCE = "http://www.visionbib.com/bibliography/other1024.html#TT372460"}
@article{bb378366,
AUTHOR = "Chetouani, M. and Faundez Zanuy, M. and Gas, B. and Zarader, J. L.",
TITLE = "Investigation on {LP}-residual representations for speaker identification",
JOURNAL = PR,
VOLUME = "42",
YEAR = "2009",
NUMBER = "3",
MONTH = mar,
PAGES = "487--494",
BIBSOURCE = "http://www.visionbib.com/bibliography/other1024.html#TT372461"}
@article{bb378367,
AUTHOR = "Kinnunen, T. and Saastamoinen, J. and Hautamaki, V. and Vinni, M. and Franti, P.",
TITLE = "Comparative evaluation of maximum a Posteriori vector quantization and
{Gaussian} mixture models in speaker verification",
JOURNAL = PRL,
VOLUME = "30",
YEAR = "2009",
NUMBER = "4",
MONTH = mar,
PAGES = "341--347",
BIBSOURCE = "http://www.visionbib.com/bibliography/other1024.html#TT372462"}
@article{bb378368,
AUTHOR = "Chao, Y. H. and Tsai, W. H. and Wang, H. M. and Chang, R. C.",
TITLE = "Improving the characterization of the alternative hypothesis via
minimum verification error training with applications to speaker
verification",
JOURNAL = PR,
VOLUME = "42",
YEAR = "2009",
NUMBER = "7",
MONTH = jul,
PAGES = "1351--1360",
BIBSOURCE = "http://www.visionbib.com/bibliography/other1024.html#TT372463"}
@article{bb378369,
AUTHOR = "Temko, A. and Nadeu, C.",
TITLE = "Acoustic event detection in meeting-room environments",
JOURNAL = PRL,
VOLUME = "30",
YEAR = "2009",
NUMBER = "14",
MONTH = oct,
PAGES = "1281--1288",
BIBSOURCE = "http://www.visionbib.com/bibliography/other1024.html#TT372464"}
@article{bb378370,
AUTHOR = "Kim, S. and Ji, M. Y. and Kim, H.",
TITLE = "Robust speaker recognition based on filtering in autocorrelation domain
and sub-band feature recombination",
JOURNAL = PRL,
VOLUME = "31",
YEAR = "2010",
NUMBER = "7",
MONTH = may,
PAGES = "593--599",
BIBSOURCE = "http://www.visionbib.com/bibliography/other1024.html#TT372465"}
@article{bb378371,
AUTHOR = "Li, H. and Ma, B. and Lee, K. A.",
TITLE = "Spoken Language Recognition: From Fundamentals to Practice",
JOURNAL = PIEEE,
VOLUME = "100",
YEAR = "2013",
NUMBER = "5",
MONTH = may,
PAGES = "1136--1159",
BIBSOURCE = "http://www.visionbib.com/bibliography/other1024.html#TT372466"}
@article{bb378372,
AUTHOR = "Li, H. and Ma, B.",
TITLE = "{TechWare}: Speaker and Spoken Language Recognition Resources",
JOURNAL = SPMag,
VOLUME = "27",
YEAR = "2010",
NUMBER = "6",
PAGES = "139--142",
BIBSOURCE = "http://www.visionbib.com/bibliography/other1024.html#TT372467"}
@article{bb378373,
AUTHOR = "Ajmera, P. K. and Jadhav, D. V. and Holambe, R. S.",
TITLE = "Text-independent speaker identification using {Radon} and discrete cosine
transforms based features from speech spectrogram",
JOURNAL = PR,
VOLUME = "44",
YEAR = "2011",
NUMBER = "10--11",
MONTH = oct,
PAGES = "2749--2759",
BIBSOURCE = "http://www.visionbib.com/bibliography/other1024.html#TT372468"}
@article{bb378374,
AUTHOR = "Kinnunen, T. and Sidoroff, I. and Tuononen, M. and Franti, P.",
TITLE = "Comparison of clustering methods:
A case study of text-independent speaker modeling",
JOURNAL = PRL,
VOLUME = "32",
YEAR = "2011",
NUMBER = "13",
MONTH = oct,
PAGES = "1604--1617",
BIBSOURCE = "http://www.visionbib.com/bibliography/other1024.html#TT372469"}
@inproceedings{bb378375,
AUTHOR = "Kinnunen, T. and Karpov, E. and Franti, P.",
TITLE = "A Speaker Pruning Algorithm for Real-Time Speaker Identification",
BOOKTITLE = AVBPA03,
YEAR = "2003",
PAGES = "639--646",
BIBSOURCE = "http://www.visionbib.com/bibliography/other1024.html#TT372470"}
@inproceedings{bb378376,
AUTHOR = "Kinnunen, T. and Franti, P.",
TITLE = "Speaker Discriminative Weighting Method for {VQ}-Based Speaker
Identification",
BOOKTITLE = AVBPA01,
YEAR = "2001",
PAGES = "150",
BIBSOURCE = "http://www.visionbib.com/bibliography/other1024.html#TT372471"}
@article{bb378377,
AUTHOR = "Zao, L. and Coelho, R.",
TITLE = "Colored Noise Based Multicondition Training Technique for Robust
Speaker Identification",
JOURNAL = SPLetters,
VOLUME = "18",
YEAR = "2011",
NUMBER = "11",
MONTH = nov,
PAGES = "675--678",
BIBSOURCE = "http://www.visionbib.com/bibliography/other1024.html#TT372472"}
@article{bb378378,
AUTHOR = "Hanilci, C. and Kinnunen, T. and Ertas, F. and Saeidi, R. and Pohjalainen, J. and Alku, P.",
TITLE = "Regularized All-Pole Models for Speaker Verification Under Noisy
Environments",
JOURNAL = SPLetters,
VOLUME = "19",
YEAR = "2012",
NUMBER = "3",
MONTH = mar,
PAGES = "163--166",
BIBSOURCE = "http://www.visionbib.com/bibliography/other1024.html#TT372473"}
@article{bb378379,
AUTHOR = "Salamin, H. and Vinciarelli, A.",
TITLE = "Automatic Role Recognition in Multiparty Conversations: An Approach
Based on Turn Organization, Prosody, and Conditional Random Fields",
JOURNAL = MultMed,
VOLUME = "14",
YEAR = "2012",
NUMBER = "2",
PAGES = "338--345",
BIBSOURCE = "http://www.visionbib.com/bibliography/other1024.html#TT372474"}
@article{bb378380,
AUTHOR = "Tang, H. and Chu, S. and Hasegawa Johnson, M. and Huang, T. S.",
TITLE = "Partially Supervised Speaker Clustering",
JOURNAL = PAMI,
VOLUME = "34",
YEAR = "2012",
NUMBER = "5",
MONTH = may,
PAGES = "959--971",
BIBSOURCE = "http://www.visionbib.com/bibliography/other1024.html#TT372475"}
@article{bb378381,
AUTHOR = "Montalvao, J. and Araujo, M. R. R.",
TITLE = "Is masking a relevant aspect lacking in {MFCC}? {A} speaker verification
perspective",
JOURNAL = PRL,
VOLUME = "33",
YEAR = "2012",
NUMBER = "16",
MONTH = dec,
PAGES = "2156--2165",
BIBSOURCE = "http://www.visionbib.com/bibliography/other1024.html#TT372476"}
@article{bb378382,
AUTHOR = "Garimella, S. and Mallidi, S. H. and Hermansky, H.",
TITLE = "Regularized Auto-Associative Neural Networks for Speaker Verification",
JOURNAL = SPLetters,
VOLUME = "19",
YEAR = "2012",
NUMBER = "12",
MONTH = dec,
PAGES = "841--844",
BIBSOURCE = "http://www.visionbib.com/bibliography/other1024.html#TT372477"}
@article{bb378383,
AUTHOR = "Sahidullah, M. and Saha, G.",
TITLE = "A Novel Windowing Technique for Efficient Computation of {MFCC} for
Speaker Recognition",
JOURNAL = SPLetters,
VOLUME = "20",
YEAR = "2013",
NUMBER = "2",
MONTH = feb,
PAGES = "149--152",
BIBSOURCE = "http://www.visionbib.com/bibliography/other1024.html#TT372478"}
@article{bb378384,
AUTHOR = "Vallet, F. and Essid, S. and Carrive, J.",
TITLE = "A Multimodal Approach to Speaker Diarization on {TV} Talk-Shows",
JOURNAL = MultMed,
VOLUME = "15",
YEAR = "2013",
NUMBER = "3",
PAGES = "509--520",
BIBSOURCE = "http://www.visionbib.com/bibliography/other1024.html#TT372479"}
@article{bb378385,
AUTHOR = "Inthavisas, K. and Lopresti, D.",
TITLE = "Secure speech biometric templates for user authentication",
JOURNAL = IET-Bio,
VOLUME = "1",
YEAR = "2012",
NUMBER = "1",
MONTH = mar,
PAGES = "46--54",
BIBSOURCE = "http://www.visionbib.com/bibliography/other1024.html#TT372480"}
@article{bb378386,
AUTHOR = "Pillay, S. and Ariyaeeinia, A. and Sivakumaran, P. and Pawlewski, M.",
TITLE = "Effective speaker verification via dynamic mismatch compensation",
JOURNAL = IET-Bio,
VOLUME = "1",
YEAR = "2012",
NUMBER = "2",
MONTH = jun,
PAGES = "130--135",
BIBSOURCE = "http://www.visionbib.com/bibliography/other1024.html#TT372481"}
@article{bb378387,
AUTHOR = "Bhardwaj, S. and Srivastava, S. and Hanmandlu, M. and Gupta, J. R. P.",
TITLE = "{GFM}-Based Methods for Speaker Identification",
JOURNAL = Cyber,
VOLUME = "43",
YEAR = "2013",
NUMBER = "3",
PAGES = "1047--1058",
BIBSOURCE = "http://www.visionbib.com/bibliography/other1024.html#TT372482"}
@article{bb378388,
AUTHOR = "Pekhovsky, T. and Sizov, A.",
TITLE = "Comparison between supervised and unsupervised learning of
probabilistic linear discriminant analysis mixture models for speaker
verification",
JOURNAL = PRL,
VOLUME = "34",
YEAR = "2013",
NUMBER = "11",
MONTH = aug,
PAGES = "1307--1313",
BIBSOURCE = "http://www.visionbib.com/bibliography/other1024.html#TT372483"}
@article{bb378389,
AUTHOR = "Yaman, S. and Pelecanos, J.",
TITLE = "Using Polynomial Kernel Support Vector Machines for Speaker
Verification",
JOURNAL = SPLetters,
VOLUME = "20",
YEAR = "2013",
NUMBER = "9",
PAGES = "901--904",
BIBSOURCE = "http://www.visionbib.com/bibliography/other1024.html#TT372484"}
@article{bb378390,
AUTHOR = "Bin Amin, T. and Marziliano, P. and German, J. S.",
TITLE = "Glottal and Vocal Tract Characteristics of Voice Impersonators",
JOURNAL = MultMed,
VOLUME = "16",
YEAR = "2014",
NUMBER = "3",
MONTH = apr,
PAGES = "668--678",
BIBSOURCE = "http://www.visionbib.com/bibliography/other1024.html#TT372485"}
@article{bb378391,
AUTHOR = "Sarkar, A. K. and Do, C. T. and Le, V. B. and Barras, C.",
TITLE = "Combination of Cepstral and Phonetically Discriminative Features for
Speaker Verification",
JOURNAL = SPLetters,
VOLUME = "21",
YEAR = "2014",
NUMBER = "9",
MONTH = sep,
PAGES = "1040--1044",
BIBSOURCE = "http://www.visionbib.com/bibliography/other1024.html#TT372486"}
@article{bb378392,
AUTHOR = "Yang, H. and Xu, Y. and Huang, H. and Zhou, R. and Yan, Y.",
TITLE = "Voice biometrics using linear {Gaussian} model",
JOURNAL = IET-Bio,
VOLUME = "3",
YEAR = "2014",
NUMBER = "1",
MONTH = mar,
PAGES = "9--15",
BIBSOURCE = "http://www.visionbib.com/bibliography/other1024.html#TT372487"}
@article{bb378393,
AUTHOR = "Ribas Gonzalez, D. and Calvo de Lara, J. R.",
TITLE = "Feature classification criterion for missing features mask estimation
in robust speaker recognition",
JOURNAL = SIViP,
VOLUME = "8",
YEAR = "2014",
NUMBER = "2",
MONTH = feb,
PAGES = "365--375",
BIBSOURCE = "http://www.visionbib.com/bibliography/other1024.html#TT372488"}
@article{bb378394,
AUTHOR = "Hernandez Sierra, G. and Calvo, J. R. and Bonastre, J. F. and Bousquet, P. M.",
TITLE = "Session compensation using binary speech representation for speaker
recognition",
JOURNAL = PRL,
VOLUME = "49",
YEAR = "2014",
NUMBER = "1",
PAGES = "17--23",
BIBSOURCE = "http://www.visionbib.com/bibliography/other1024.html#TT372489"}
@inproceedings{bb378395,
AUTHOR = "Lainez, J. E. G. and Gonzalez, D. R. and Artiaga, A. M. and Solano, E. L. and de Lara, J. R. C.",
TITLE = "Beam-search Formant Tracking Algorithm Based on Trajectory Functions
for Continuous Speech",
BOOKTITLE = CIARP12,
YEAR = "2012",
PAGES = "749--756",
BIBSOURCE = "http://www.visionbib.com/bibliography/other1024.html#TT372490"}
@inproceedings{bb378396,
AUTHOR = "Reyes Diaz, F. J. and Calvo de Lara, J. R. and Hernandez Sierra, G.",
TITLE = "Gaussian Selection for Speaker Recognition Using Cumulative Vectors",
BOOKTITLE = CIARP12,
YEAR = "2012",
PAGES = "724--731",
BIBSOURCE = "http://www.visionbib.com/bibliography/other1024.html#TT372491"}
@inproceedings{bb378397,
AUTHOR = "Hernandez Sierra, G. and Calvo de Lara, J. R. and Bonastre, J. F.",
TITLE = "Temporal Information in a Binary Framework for Speaker Recognition",
BOOKTITLE = CIARP14,
YEAR = "2014",
PAGES = "207--213",
BIBSOURCE = "http://www.visionbib.com/bibliography/other1024.html#TT372492"}
@inproceedings{bb378398,
AUTHOR = "Hernandez Sierra, G. and Bonastre, J. F. and Calvo de Lara, J. R.",
TITLE = "Speaker Recognition Using a Binary Representation and Specificities
Models",
BOOKTITLE = CIARP12,
YEAR = "2012",
PAGES = "732--739",
BIBSOURCE = "http://www.visionbib.com/bibliography/other1024.html#TT372493"}
@article{bb378399,
AUTHOR = "Pohjalainen, J. and Hanilci, C. and Kinnunen, T. and Alku, P.",
TITLE = "Mixture Linear Prediction in Speaker Verification Under Vocal Effort
Mismatch",
JOURNAL = SPLetters,
VOLUME = "21",
YEAR = "2014",
NUMBER = "12",
MONTH = dec,
PAGES = "1516--1520",
BIBSOURCE = "http://www.visionbib.com/bibliography/other1024.html#TT372494"}
Last update: Apr 6, 2026 at 11:28:57