@article{bb378000,
AUTHOR = "Zhang, C. and Jiang, S.",
TITLE = "Detection of {QIM}-Based Steganography in {VoIP} Streams:
A {MobileViT}-Inspired Model",
JOURNAL = SPLetters,
VOLUME = "31",
YEAR = "2024",
PAGES = "1735--1739",
BIBSOURCE = "http://www.visionbib.com/bibliography/other1024sa1.html#TT372095"}
@article{bb378001,
AUTHOR = "Wang, Z. C. and Chen, Y. Z. and Wang, X. S. and Xie, L. and Wang, Y. P.",
TITLE = "{StreamVoice+}: Evolving Into End-to-End Streaming Zero-Shot Voice
Conversion",
JOURNAL = SPLetters,
VOLUME = "31",
YEAR = "2024",
PAGES = "3000--3004",
BIBSOURCE = "http://www.visionbib.com/bibliography/other1024sa1.html#TT372096"}
@article{bb378002,
AUTHOR = "Guo, N. and Edler, B.",
TITLE = "Frequency Domain Prediction of Tonal Signals With Time-Varying
Pitches",
JOURNAL = SPLetters,
VOLUME = "32",
YEAR = "2025",
PAGES = "31--35",
BIBSOURCE = "http://www.visionbib.com/bibliography/other1024sa1.html#TT372097"}
@article{bb378003,
AUTHOR = "Lopez Espejo, I. and Rosello, E. and Edraki, A. and Harte, N. and Jensen, J.",
TITLE = "Noise-Robust Hearing Aid Voice Control",
JOURNAL = SPLetters,
VOLUME = "32",
YEAR = "2025",
PAGES = "241--245",
BIBSOURCE = "http://www.visionbib.com/bibliography/other1024sa1.html#TT372098"}
@article{bb378004,
AUTHOR = "Xie, H. and Khorrami, K. and Rasanen, O. and Virtanen, T.",
TITLE = "Text-Based Audio Retrieval by Learning From Similarities Between
Audio Captions",
JOURNAL = SPLetters,
VOLUME = "32",
YEAR = "2025",
PAGES = "221--225",
BIBSOURCE = "http://www.visionbib.com/bibliography/other1024sa1.html#TT372099"}
@article{bb378005,
AUTHOR = "Yuan, C. S. and Chen, Y. F. and Zhou, Z. and Xia, Z. H. and Huang, Y. F.",
TITLE = "Compressed Domain Invariant Adversarial Representation Learning for
Robust Audio Deepfake Detection",
JOURNAL = SPLetters,
VOLUME = "32",
YEAR = "2025",
PAGES = "1111--1115",
BIBSOURCE = "http://www.visionbib.com/bibliography/other1024sa1.html#TT372100"}
@article{bb378006,
AUTHOR = "Unoki, M. and Li, K. and Chaiwongyen, A. and Nguyen, Q. H. and Zaman, K.",
TITLE = "Deepfake Speech Detection: Approaches from Acoustic Features to Deep
Neural Networks",
JOURNAL = IEICE,
VOLUME = "E108-D",
YEAR = "2025",
NUMBER = "4",
MONTH = apr,
PAGES = "300--310",
BIBSOURCE = "http://www.visionbib.com/bibliography/other1024sa1.html#TT372101"}
@article{bb378007,
AUTHOR = "Shin, U. H. and Ku, B. H. and Park, H. M.",
TITLE = "{TF-CorrNet}: Leveraging Spatial Correlation for Continuous Speech
Separation",
JOURNAL = SPLetters,
VOLUME = "32",
YEAR = "2025",
PAGES = "1875--1879",
BIBSOURCE = "http://www.visionbib.com/bibliography/other1024sa1.html#TT372102"}
@article{bb378008,
AUTHOR = "Ta, B. T. and Le, N. M. and Binh, H. T. T. and Do, V. H.",
TITLE = "Exploring Non-Matching Multiple References for Speech Quality
Assessment",
JOURNAL = SPLetters,
VOLUME = "32",
YEAR = "2025",
PAGES = "1610--1614",
BIBSOURCE = "http://www.visionbib.com/bibliography/other1024sa1.html#TT372103"}
@article{bb378009,
AUTHOR = "Jin, L. B. and Min, D. and Yu, C. and Shin, J. E. and Kim, E. Y.",
TITLE = "Detecting Hearing Impairment Through Localizing Abnormal Speech
Patterns",
JOURNAL = SPLetters,
VOLUME = "32",
YEAR = "2025",
PAGES = "1945--1949",
BIBSOURCE = "http://www.visionbib.com/bibliography/other1024sa1.html#TT372104"}
@article{bb378010,
AUTHOR = "Liu, D. and Zhang, T. Q. and Wei, Y. and Yi, C. and Christensen, M. G.",
TITLE = "Speech {Conv-Mamba}: Selective Structured State Space Model With
Temporal Dilated Convolution for Efficient Speech Separation",
JOURNAL = SPLetters,
VOLUME = "32",
YEAR = "2025",
PAGES = "2015--2019",
BIBSOURCE = "http://www.visionbib.com/bibliography/other1024sa1.html#TT372105"}
@article{bb378011,
AUTHOR = "Liu, F. and Ai, Y. and Ling, Z. H.",
TITLE = "Token-Prediction-Based Post-Processing for Low-Bitrate Speech Coding",
JOURNAL = SPLetters,
VOLUME = "32",
YEAR = "2025",
PAGES = "3235--3239",
BIBSOURCE = "http://www.visionbib.com/bibliography/other1024sa1.html#TT372106"}
@article{bb378012,
AUTHOR = "Zhang, Z. X. and Xu, W. X. and Dong, Z. and Wang, K. L. and Wu, Y. M. and Peng, J. and Wang, R. and Huang, D. Y.",
TITLE = "{ParaLBench}: A Large-Scale Benchmark for Computational Paralinguistics
Over Acoustic Foundation Models",
JOURNAL = AffCom,
VOLUME = "16",
YEAR = "2025",
NUMBER = "3",
MONTH = jul,
PAGES = "1290--1306",
BIBSOURCE = "http://www.visionbib.com/bibliography/other1024sa1.html#TT372107"}
@article{bb378013,
AUTHOR = "Yang, Y. and Zhou, C.",
TITLE = "{DPARNet-RSE}: Toward Angular Region-Customizable Speech Extraction",
JOURNAL = SPLetters,
VOLUME = "32",
YEAR = "2025",
PAGES = "3779--3783",
BIBSOURCE = "http://www.visionbib.com/bibliography/other1024sa1.html#TT372108"}
@article{bb378014,
AUTHOR = "Zhao, Z. Y. and Peng, Y. and Camilleri, K. and Kong, W. Z. and Cichocki, A.",
TITLE = "Imagined Speech Decoding by Learning Consensus Graph From {RKHS}-Based
Multi-View {EEG} Features",
JOURNAL = SPLetters,
VOLUME = "32",
YEAR = "2025",
PAGES = "3944--3948",
BIBSOURCE = "http://www.visionbib.com/bibliography/other1024sa1.html#TT372109"}
@article{bb378015,
AUTHOR = "Tan, Z. W. and Reju, V. G. and Tewari, R. C. and Ding, R. T. and Khong, A. W. H.",
TITLE = "Joint Enhancement and Bandwidth Extension for Radar Through-Barrier
Speech Acquisition",
JOURNAL = SPLetters,
VOLUME = "33",
YEAR = "2026",
PAGES = "176--180",
BIBSOURCE = "http://www.visionbib.com/bibliography/other1024sa1.html#TT372110"}
@article{bb378016,
AUTHOR = "Fu, R. and Tang, L. and Tian, H. and Chang, C. C.",
TITLE = "Fuzzy-Clustering-Based Domain Adaptation for Speech Steganalysis in
Dynamic Scenarios",
JOURNAL = SPLetters,
VOLUME = "33",
YEAR = "2026",
PAGES = "366--370",
BIBSOURCE = "http://www.visionbib.com/bibliography/other1024sa1.html#TT372111"}
@article{bb378017,
AUTHOR = "Wang, T. and Yi, J. Y. and Fu, R. and Qiang, C. Y. and Chong, D. and Wang, C. and Dai, D. Y. and Wen, Z. Q. and Tao, J. H.",
TITLE = "{SpeechPalette}: A Comprehensive Speech Editing Method for Text-Based
Speech Editing, One-Shot {TTS} and Attributes Editing",
JOURNAL = PAMI,
VOLUME = "48",
YEAR = "2026",
NUMBER = "3",
MONTH = mar,
PAGES = "2596--2609",
BIBSOURCE = "http://www.visionbib.com/bibliography/other1024sa1.html#TT372112"}
@article{bb378018,
AUTHOR = "Hu, H. Q. and Liao, Y. and Cai, S. Q. and Li, H. Z.",
TITLE = "The effect of speech representations on {EEG}-based auditory attention
detection",
JOURNAL = PRL,
VOLUME = "203",
YEAR = "2026",
PAGES = "146--151",
BIBSOURCE = "http://www.visionbib.com/bibliography/other1024sa1.html#TT372113"}
@inproceedings{bb378019,
AUTHOR = "Wani, T. M. and Amerini, I.",
TITLE = "Deepfakes Audio Detection Leveraging Audio Spectrogram and
Convolutional Neural Networks",
BOOKTITLE = CIAP23,
YEAR = "2023",
PAGES = "II:156--167",
BIBSOURCE = "http://www.visionbib.com/bibliography/other1024sa1.html#TT372114"}
@inproceedings{bb378020,
AUTHOR = "Choi, S. and Oh, S. and Yang, J. and Lee, Y. and Kwak, I. Y.",
TITLE = "Light-weight Frequency Information Aware Neural Network Architecture
for Voice Spoofing Detection",
BOOKTITLE = "ICPR22",
YEAR = "2022",
PAGES = "477--483",
BIBSOURCE = "http://www.visionbib.com/bibliography/other1024sa1.html#TT372115"}
@inproceedings{bb378021,
AUTHOR = "Li, X. and Hu, X. and Chen, X. and Pan, H. and Niu, K.",
TITLE = "Deep Speaker Embedding Using Hybrid Network of Multi-Feature
Aggregation and Multi-Loss Fusion for {TI-SV}",
BOOKTITLE = "ICPR22",
YEAR = "2022",
PAGES = "506--512",
BIBSOURCE = "http://www.visionbib.com/bibliography/other1024sa1.html#TT372116"}
@inproceedings{bb378022,
AUTHOR = "Zhang, B. and Sim, T.",
TITLE = "Localizing Fake Segments in Speech",
BOOKTITLE = "ICPR22",
YEAR = "2022",
PAGES = "3224--3230",
BIBSOURCE = "http://www.visionbib.com/bibliography/other1024sa1.html#TT372117"}
@inproceedings{bb378023,
AUTHOR = "Teng, Z. W. and Fu, Q. and White, J. and Powell, M. E. and Schmidt, D. C.",
TITLE = "{ARawNet}: A Lightweight Solution for Leveraging Raw Waveforms in Spoof
Speech Detection",
BOOKTITLE = "ICPR22",
YEAR = "2022",
PAGES = "692--698",
BIBSOURCE = "http://www.visionbib.com/bibliography/other1024sa1.html#TT372118"}
@inproceedings{bb378024,
AUTHOR = "Stefanov, K. and Adiban, M. and Salvi, G.",
TITLE = "Spatial Bias in Vision-Based Voice Activity Detection",
BOOKTITLE = ICPR21,
YEAR = "2021",
PAGES = "10433--10440",
BIBSOURCE = "http://www.visionbib.com/bibliography/other1024sa1.html#TT372119"}
@inproceedings{bb378025,
AUTHOR = "Barros, F. and Conde, A. and Soares, S. C. and Neves, A. J. R. and Silva, S.",
TITLE = "Understanding Public Speakers' Performance:
First Contributions to Support a Computational Approach",
BOOKTITLE = ICIAR20,
YEAR = "2020",
PAGES = "I:343--355",
BIBSOURCE = "http://www.visionbib.com/bibliography/other1024sa1.html#TT372120"}
@inproceedings{bb378026,
AUTHOR = "Bilkova, Z. and Novozamsky, A. and Dominec, A. and Gresko, S. and Zitova, B. and Paroubkova, M.",
TITLE = "Automatic Evaluation of Speech Therapy Exercises Based on Image Data",
BOOKTITLE = ICIAR19,
YEAR = "2019",
PAGES = "I:397--404",
BIBSOURCE = "http://www.visionbib.com/bibliography/other1024sa1.html#TT372121"}
@inproceedings{bb378027,
AUTHOR = "Dai, J. J. and Dixon, S.",
TITLE = "Understanding Intonation Trajectories and Patterns of Vocal Notes",
BOOKTITLE = "MMMod19",
YEAR = "2019",
PAGES = "II:243--253",
BIBSOURCE = "http://www.visionbib.com/bibliography/other1024sa1.html#TT372122"}
@inproceedings{bb378028,
AUTHOR = "Zheng, S. and Wang, J. and Xiao, J. and Hsu, W. and Glass, J.",
TITLE = "A Noise-Robust Self-Adaptive Multitarget Speaker Detection System",
BOOKTITLE = ICPR18,
YEAR = "2018",
PAGES = "1068--1072",
BIBSOURCE = "http://www.visionbib.com/bibliography/other1024sa1.html#TT372123"}
@inproceedings{bb378029,
AUTHOR = "Athanasopoulos, G. and Hagihara, K. and Cierro, A. and Guerit, R. and Chatelain, J. and Lucas, C. and Macq, B.",
TITLE = "{3D} immersive karaoke for the learning of foreign language
pronunciation",
BOOKTITLE = IC3D17,
YEAR = "2017",
PAGES = "1--8",
BIBSOURCE = "http://www.visionbib.com/bibliography/other1024sa1.html#TT372124"}
@inproceedings{bb378030,
AUTHOR = "Serras, M. and Torres, M. I. and del Pozo, A.",
TITLE = "Online Learning of Attributed Bi-Automata for Dialogue Management in
Spoken Dialogue Systems",
BOOKTITLE = IbPRIA17,
YEAR = "2017",
PAGES = "22--31",
BIBSOURCE = "http://www.visionbib.com/bibliography/other1024sa1.html#TT372125"}
@inproceedings{bb378031,
AUTHOR = "Nagpal, A. and Patil, H. A.",
TITLE = "Novel Gammatone Filterbank Based Spectro-Temporal Features for Robust
Phoneme Recognition",
BOOKTITLE = PReMI17,
YEAR = "2017",
PAGES = "342--350",
BIBSOURCE = "http://www.visionbib.com/bibliography/other1024sa1.html#TT372126"}
@inproceedings{bb378032,
AUTHOR = "Grachev, A. M. and Ignatov, D. I. and Savchenko, A. V.",
TITLE = "Neural Networks Compression for Language Modeling",
BOOKTITLE = PReMI17,
YEAR = "2017",
PAGES = "351--357",
BIBSOURCE = "http://www.visionbib.com/bibliography/other1024sa1.html#TT372127"}
@inproceedings{bb378033,
AUTHOR = "Zhang, L. and Chen, J. X. and Luo, Y. and Fu, J. F. and Ye, Z. F.",
TITLE = "Supervised single-channel speech dereverberation and denoising using
a two-stage processing",
BOOKTITLE = ICIVC17,
YEAR = "2017",
PAGES = "818--822",
BIBSOURCE = "http://www.visionbib.com/bibliography/other1024sa1.html#TT372128"}
@inproceedings{bb378034,
AUTHOR = "Bedoui, A. and Ben Jebara, S.",
TITLE = "On the use of opening phase slopes of the glottal signal to
characterize unilateral vocal folds paralysis",
BOOKTITLE = ISIVC16,
YEAR = "2016",
PAGES = "41--46",
BIBSOURCE = "http://www.visionbib.com/bibliography/other1024sa1.html#TT372129"}
@inproceedings{bb378035,
AUTHOR = "Ben Ali, F. and Djaziri Larbi, S.",
TITLE = "A very low bit rate codec for wide band speech based on a long-term
perceptual harmonic plus noise model",
BOOKTITLE = ISIVC16,
YEAR = "2016",
PAGES = "71--76",
BIBSOURCE = "http://www.visionbib.com/bibliography/other1024sa1.html#TT372130"}
@inproceedings{bb378036,
AUTHOR = "Ferreira, A.",
TITLE = "Implantation of voicing on whispered speech using frequency-domain
parametric modelling of source and filter information",
BOOKTITLE = ISIVC16,
YEAR = "2016",
PAGES = "159--166",
BIBSOURCE = "http://www.visionbib.com/bibliography/other1024sa1.html#TT372131"}
@inproceedings{bb378037,
AUTHOR = "Pozzebon, A. and Biliotti, F. and Calamai, S.",
TITLE = "Places Speaking with Their Own Voices. A Case Study from the {Gra.fo}
Archives",
BOOKTITLE = EuroMed16,
YEAR = "2016",
PAGES = "II: 232--239",
BIBSOURCE = "http://www.visionbib.com/bibliography/other1024sa1.html#TT372132"}
@inproceedings{bb378038,
AUTHOR = "Vlaj, D. and Kos, M. and Kacic, Z.",
TITLE = "Quick and efficient definition of hangbefore and hangover criteria
for voice activity detection",
BOOKTITLE = WSSIP16,
YEAR = "2016",
PAGES = "1--4",
BIBSOURCE = "http://www.visionbib.com/bibliography/other1024sa1.html#TT372133"}
@inproceedings{bb378039,
AUTHOR = "Ballesteros L, D. M. and Renza, D. and Camacho, S.",
TITLE = "High Scrambling Degree in Audio Through Imitation of an Unintelligible
Signal",
BOOKTITLE = MCPR16,
YEAR = "2016",
PAGES = "251--259",
BIBSOURCE = "http://www.visionbib.com/bibliography/other1024sa1.html#TT372134"}
@inproceedings{bb378040,
AUTHOR = "Onchis, D. M. and Real, P.",
TITLE = "On Homotopy Continuation for Speech Restoration",
BOOKTITLE = CTIC16,
YEAR = "2016",
PAGES = "152--156",
BIBSOURCE = "http://www.visionbib.com/bibliography/other1024sa1.html#TT372135"}
@inproceedings{bb378041,
AUTHOR = "Dubey, M. L. and Shultz, P. F. and Kenyon, G. T.",
TITLE = "Learning phase-rich features from streaming auditory images",
BOOKTITLE = Southwest16,
YEAR = "2016",
PAGES = "73--76",
BIBSOURCE = "http://www.visionbib.com/bibliography/other1024sa1.html#TT372136"}
@inproceedings{bb378042,
AUTHOR = "Montalvo, A. and Costa, Y. M. G. and Calvo, J. R.",
TITLE = "Language Identification Using Spectrogram Texture",
BOOKTITLE = CIARP15,
YEAR = "2015",
PAGES = "543--550",
BIBSOURCE = "http://www.visionbib.com/bibliography/other1024sa1.html#TT372137"}
@inproceedings{bb378043,
AUTHOR = "Aizezi, Y. and Jamal, A. and Mamat, D. and Abdurexit, R. and Ubul, K.",
TITLE = "Analytical Method and Research of {Uyghur} Language Chunks Based on
Digital Forensics",
BOOKTITLE = ISCA15,
YEAR = "2015",
PAGES = "258--266",
BIBSOURCE = "http://www.visionbib.com/bibliography/other1024sa1.html#TT372138"}
@inproceedings{bb378044,
AUTHOR = "Hammami, N. and Bedda, M. and Farah, N. and Mansouri, S.",
TITLE = "R-Letter disorder diagnosis ({R-LDD}): {Arabic} speech database
development for automatic diagnosis of childhood speech disorders
(Case study)",
BOOKTITLE = ISCV15,
YEAR = "2015",
PAGES = "1--7",
BIBSOURCE = "http://www.visionbib.com/bibliography/other1024sa1.html#TT372139"}
@inproceedings{bb378045,
AUTHOR = "Nakajima, J. and Kimura, A. and Sugimoto, A. and Kashino, K.",
TITLE = "Visual Attention Driven by Auditory Cues",
BOOKTITLE = MMMod15,
YEAR = "2015",
PAGES = "II: 74--86",
BIBSOURCE = "http://www.visionbib.com/bibliography/other1024sa1.html#TT372140"}
@inproceedings{bb378046,
AUTHOR = "Ishikura, K. and Uemura, A. and Katto, J.",
TITLE = "Live Version Identification with Audio Scene Detection",
BOOKTITLE = MMMod15,
YEAR = "2015",
PAGES = "I: 408--417",
BIBSOURCE = "http://www.visionbib.com/bibliography/other1024sa1.html#TT372141"}
@inproceedings{bb378047,
AUTHOR = "Xie, S. B. and Yang, Y. H. and Hu, R. M. and Wang, Y. Y. and Yu, H. J. and Dong, S. L. and Gao, L. and Yang, C.",
TITLE = "Signal-Aware Parametric Quality Model for Audio and Speech over {IP}
Networks",
BOOKTITLE = MMMod15,
YEAR = "2015",
PAGES = "I: 487--497",
BIBSOURCE = "http://www.visionbib.com/bibliography/other1024sa1.html#TT372142"}
@inproceedings{bb378048,
AUTHOR = "Xue, L. and Su, F.",
TITLE = "Auditory Scene Classification with Deep Belief Network",
BOOKTITLE = MMMod15,
YEAR = "2015",
PAGES = "I: 348--359",
BIBSOURCE = "http://www.visionbib.com/bibliography/other1024sa1.html#TT372143"}
@inproceedings{bb378049,
AUTHOR = "Tu, M. and Xie, X. and Na, X. Y.",
TITLE = "Computational Auditory Scene Analysis Based Voice Activity Detection",
BOOKTITLE = ICPR14,
YEAR = "2014",
PAGES = "797--802",
BIBSOURCE = "http://www.visionbib.com/bibliography/other1024sa1.html#TT372144"}
@inproceedings{bb378050,
AUTHOR = "Lu, T. and Weng, Y. B. and Wang, G. Y.",
TITLE = "Audiotory Movie Summarization by Detecting Scene Changes and Sound
Events",
BOOKTITLE = ICPR14,
YEAR = "2014",
PAGES = "756--760",
BIBSOURCE = "http://www.visionbib.com/bibliography/other1024sa1.html#TT372145"}
@inproceedings{bb378051,
AUTHOR = "Nguyen Son, H. Q. and Hoang, A. T. and Tran, M. T. and Yoshiura, H. and Sonehara, N. and Echizen, I.",
TITLE = "Anonymizing Temporal Phrases in Natural Language Text to be Posted on
Social Networking Services",
BOOKTITLE = IWDW13,
YEAR = "2013",
PAGES = "437--451",
BIBSOURCE = "http://www.visionbib.com/bibliography/other1024sa1.html#TT372146"}
@inproceedings{bb378052,
AUTHOR = "Maka, T. and Dziurzanski, P.",
TITLE = "Feature contours fusion for determining segment boundaries in audio
data",
BOOKTITLE = WSSIP14,
YEAR = "2014",
PAGES = "111--114",
BIBSOURCE = "http://www.visionbib.com/bibliography/other1024sa1.html#TT372147"}
@inproceedings{bb378053,
AUTHOR = "Souza, D. and Saturnino, L. and Maciel, A. M. A.",
TITLE = "A portability evaluation of {Brazilian} {Portuguese} voices produced with
{MARY} {TTS}",
BOOKTITLE = WSSIP14,
YEAR = "2014",
PAGES = "95--98",
BIBSOURCE = "http://www.visionbib.com/bibliography/other1024sa1.html#TT372148"}
@inproceedings{bb378054,
AUTHOR = "Frid, A. and Lavner, Y. Z.",
TITLE = "Spectral and textural features for automatic classification of
fricatives using {SVM}",
BOOKTITLE = WSSIP14,
YEAR = "2014",
PAGES = "99--102",
BIBSOURCE = "http://www.visionbib.com/bibliography/other1024sa1.html#TT372149"}
@inproceedings{bb378055,
AUTHOR = "Savchenko, A. V.",
TITLE = "Semi-automated Speaker Adaptation:
How to Control the Quality of Adaptation?",
BOOKTITLE = ICISP14,
YEAR = "2014",
PAGES = "638--646",
BIBSOURCE = "http://www.visionbib.com/bibliography/other1024sa1.html#TT372150"}
@inproceedings{bb378056,
AUTHOR = "Merazka, F.",
TITLE = "Wideband Speech Encryption Based {Arnold} Cat Map for {AMR-WB} {G.722.2}
Codec",
BOOKTITLE = ICISP14,
YEAR = "2014",
PAGES = "658--664",
BIBSOURCE = "http://www.visionbib.com/bibliography/other1024sa1.html#TT372151"}
@inproceedings{bb378057,
AUTHOR = "Souli, S. and Lachiri, Z. and Kuznietsov, A.",
TITLE = "Using Three Reassigned Spectrogram Patches and {Log-Gabor} Filter for
Audio Surveillance Application",
BOOKTITLE = CIARP13,
YEAR = "2013",
PAGES = "I:527--534",
BIBSOURCE = "http://www.visionbib.com/bibliography/other1024sa1.html#TT372152"}
@inproceedings{bb378058,
AUTHOR = "Joseph, S. M. and Babu, A. P.",
TITLE = "Continuous speech coding using coiflets wavelet",
BOOKTITLE = ICSIPR13,
YEAR = "2013",
PAGES = "253--257",
BIBSOURCE = "http://www.visionbib.com/bibliography/other1024sa1.html#TT372153"}
@inproceedings{bb378059,
AUTHOR = "Nivedita, D. and Kavita, T. and Zadgaonkar, A. S.",
TITLE = "First degree heart block determination from speech analysis",
BOOKTITLE = ICSIPR13,
YEAR = "2013",
PAGES = "103--106",
BIBSOURCE = "http://www.visionbib.com/bibliography/other1024sa1.html#TT372154"}
@article{bb378060,
AUTHOR = "Sadjadi, S. O. and Hansen, J. H. L.",
TITLE = "Unsupervised Speech Activity Detection Using Voicing Measures and
Perceptual Spectral Flux",
JOURNAL = SPLetters,
VOLUME = "20",
YEAR = "2013",
NUMBER = "3",
MONTH = mar,
PAGES = "197--200",
BIBSOURCE = "http://www.visionbib.com/bibliography/other1024sa1.html#TT372155"}
@inproceedings{bb378061,
AUTHOR = "Zhang, L. and Li, H. F. and Ma, L.",
TITLE = "An adaptive unsupervised clustering of pronunciation errors for
automatic pronunciation error detection",
BOOKTITLE = ICPR12,
YEAR = "2012",
PAGES = "1521--1525",
BIBSOURCE = "http://www.visionbib.com/bibliography/other1024sa1.html#TT372156"}
@inproceedings{bb378062,
AUTHOR = "Rosales Perez, A. and Reyes Garcia, C. A. and Gonzalez, J. A. and Arch Tirado, E.",
TITLE = "Infant Cry Classification Using Genetic Selection of a Fuzzy Model",
BOOKTITLE = CIARP12,
YEAR = "2012",
PAGES = "212--219",
BIBSOURCE = "http://www.visionbib.com/bibliography/other1024sa1.html#TT372157"}
@inproceedings{bb378063,
AUTHOR = "Gonzalez, D. C. and Ling, L. L. and Violaro, F.",
TITLE = "Analysis of the Multifractal Nature of Speech Signals",
BOOKTITLE = CIARP12,
YEAR = "2012",
PAGES = "740--748",
BIBSOURCE = "http://www.visionbib.com/bibliography/other1024sa1.html#TT372158"}
@inproceedings{bb378064,
AUTHOR = "Tanveer, S. and Muhammad, A. and Martinez Enriquez, A. M. and Escalada Imaz, G.",
TITLE = "Phonetic Unification of Multiple Accents for {Spanish} and {Arabic}
Languages",
BOOKTITLE = MCPR12,
YEAR = "2012",
PAGES = "323--333",
BIBSOURCE = "http://www.visionbib.com/bibliography/other1024sa1.html#TT372159"}
@inproceedings{bb378065,
AUTHOR = "Falek, L. and Teffahi, H. and Djeradi, A.",
TITLE = "Methodology for Acoustic Characterization of a Labial Constraint in
Speech Production",
BOOKTITLE = ICISP12,
YEAR = "2012",
PAGES = "131--141",
BIBSOURCE = "http://www.visionbib.com/bibliography/other1024sa1.html#TT372160"}
@inproceedings{bb378066,
AUTHOR = "Krum, D. M. and Suma, E. A. and Bolas, M.",
TITLE = "Spatial misregistration of virtual human audio:
Implications of the precedence effect",
BOOKTITLE = "3DUI12",
YEAR = "2012",
PAGES = "147--148",
BIBSOURCE = "http://www.visionbib.com/bibliography/other1024sa1.html#TT372161"}
@inproceedings{bb378067,
AUTHOR = "Yang, Y. J. and Zhang, H. H. and Guo, X.",
TITLE = "A pitch tracking method mixing {ACF} and {AMDF} algorithms based on
correlations",
BOOKTITLE = IASP11,
YEAR = "2011",
PAGES = "553--556",
BIBSOURCE = "http://www.visionbib.com/bibliography/other1024sa1.html#TT372162"}
@inproceedings{bb378068,
AUTHOR = "Guo, S. and Gao, L. and Yu, H. Z.",
TITLE = "Research on {Lhasa} {Tibetan} prosodic model of journalese based on
respiratory signal",
BOOKTITLE = IASP11,
YEAR = "2011",
PAGES = "26--30",
BIBSOURCE = "http://www.visionbib.com/bibliography/other1024sa1.html#TT372163"}
@inproceedings{bb378069,
AUTHOR = "Resmi, K. and Kumar, S. and Sardana, H. K. and Chhabra, R.",
TITLE = "Graphical Speech Training system for hearing impaired",
BOOKTITLE = ICIIP11,
YEAR = "2011",
PAGES = "1--6",
BIBSOURCE = "http://www.visionbib.com/bibliography/other1024sa1.html#TT372164"}
@inproceedings{bb378070,
AUTHOR = "Gomez, J. A. and Calvo, M.",
TITLE = "Improvements on Automatic Speech Segmentation at the Phonetic Level",
BOOKTITLE = CIARP11,
YEAR = "2011",
PAGES = "557--564",
BIBSOURCE = "http://www.visionbib.com/bibliography/other1024sa1.html#TT372165"}
@inproceedings{bb378071,
AUTHOR = "Le, P. N. and Epps, J. and Choi, E. H. C. and Ambikairajah, E.",
TITLE = "A Study of Voice Source and Vocal Tract Filter Based Features in
Cognitive Load Classification",
BOOKTITLE = ICPR10,
YEAR = "2010",
PAGES = "4516--4519",
BIBSOURCE = "http://www.visionbib.com/bibliography/other1024sa1.html#TT372166"}
@inproceedings{bb378072,
AUTHOR = "Stark, M. and Wohlmayr, M. and Pernkopf, F.",
TITLE = "Single Channel Speech Separation Using Source-Filter Representation",
BOOKTITLE = ICPR10,
YEAR = "2010",
PAGES = "826--829",
BIBSOURCE = "http://www.visionbib.com/bibliography/other1024sa1.html#TT372167"}
@inproceedings{bb378073,
AUTHOR = "Stadelmann, T. and Wang, Y. H. and Smith, M. and Ewerth, R. and Freisleben, B.",
TITLE = "Rethinking Algorithm Design and Development in Speech Processing",
BOOKTITLE = ICPR10,
YEAR = "2010",
PAGES = "4476--4479",
BIBSOURCE = "http://www.visionbib.com/bibliography/other1024sa1.html#TT372168"}
@inproceedings{bb378074,
AUTHOR = "Gonzalez Caravaca, G. and Toledano, D. T. and Puertas, M.",
TITLE = "Phone-Conditioned Suboptimal {Wiener} Filtering",
BOOKTITLE = ICPR10,
YEAR = "2010",
PAGES = "4480--4483",
BIBSOURCE = "http://www.visionbib.com/bibliography/other1024sa1.html#TT372169"}
@inproceedings{bb378075,
AUTHOR = "Sepehr, H. and Nooralahiyan, A. Y. and Brennan, P. V.",
TITLE = "Improving Performance of a Noise Reduction Algorithm by Switching the
Analysis Filter Bank",
BOOKTITLE = ICISP10,
YEAR = "2010",
PAGES = "262--271",
BIBSOURCE = "http://www.visionbib.com/bibliography/other1024sa1.html#TT372170"}
@inproceedings{bb378076,
AUTHOR = "Kos, M. and Grasic, M. and Vlaj, D. and Kacic, Z.",
TITLE = "On-Line Speech/Music Segmentation for Broadcast News Domain",
BOOKTITLE = WSSIP09,
YEAR = "2009",
PAGES = "1--4",
BIBSOURCE = "http://www.visionbib.com/bibliography/other1024sa1.html#TT372171"}
@inproceedings{bb378077,
AUTHOR = "Grasic, M. and Kos, M. and Vlaj, D. and Kacic, Z.",
TITLE = "The Influence of Speech/Non-Speech Segmentation on On-Line and Off-Line
Speaker Segmentation Accuracy",
BOOKTITLE = WSSIP09,
YEAR = "2009",
PAGES = "1--4",
BIBSOURCE = "http://www.visionbib.com/bibliography/other1024sa1.html#TT372172"}
@inproceedings{bb378078,
AUTHOR = "Zuta, V.",
TITLE = "Voice Pleasantness of Female Voices and the Assessment of Physical
Characteristics",
BOOKTITLE = COST08,
YEAR = "2008",
PAGES = "116--125",
BIBSOURCE = "http://www.visionbib.com/bibliography/other1024sa1.html#TT372173"}
@inproceedings{bb378079,
AUTHOR = "Stadelmann, T. and Heinzl, S. and Unterberger, M. and Freisleben, B.",
TITLE = "{WebVoice}: A Toolkit for Perceptual Insights into Speech Processing",
BOOKTITLE = CISP09,
YEAR = "2009",
PAGES = "1--5",
BIBSOURCE = "http://www.visionbib.com/bibliography/other1024sa1.html#TT372174"}
@inproceedings{bb378080,
AUTHOR = "Tang, Y. B. and Huang, R. and Wu, Z. Y.",
TITLE = "A 2.4kbps Multiband Characteristic Waveform Interpolation Speech Coding
Algorithm",
BOOKTITLE = CISP09,
YEAR = "2009",
PAGES = "1--4",
BIBSOURCE = "http://www.visionbib.com/bibliography/other1024sa1.html#TT372175"}
@inproceedings{bb378081,
AUTHOR = "Zou, X. and Zhang, X. W.",
TITLE = "A 450bps Speech Coding Algorithm Based on Multi-Mode Matrix
Quantization",
BOOKTITLE = CISP09,
YEAR = "2009",
PAGES = "1--3",
BIBSOURCE = "http://www.visionbib.com/bibliography/other1024sa1.html#TT372176"}
@inproceedings{bb378082,
AUTHOR = "Li, X. K. and Deng, Y.",
TITLE = "Combining speech energy and edge information for fast and efficient
voice activity detection in noisy environments",
BOOKTITLE = ICPR08,
YEAR = "2008",
PAGES = "1--4",
BIBSOURCE = "http://www.visionbib.com/bibliography/other1024sa1.html#TT372177"}
@inproceedings{bb378083,
AUTHOR = "Kukharchik, P. and Kheidorov, I. and Bovbel, E. and Ladeev, D.",
TITLE = "Speech Signal Processing Based on Wavelets and {SVM} for Vocal Tract
Pathology Detection",
BOOKTITLE = ICISP08,
YEAR = "2008",
PAGES = "192--199",
BIBSOURCE = "http://www.visionbib.com/bibliography/other1024sa1.html#TT372178"}
@inproceedings{bb378084,
AUTHOR = "Nagesha and Kumar, G. H.",
TITLE = "Signal Resampling Technique Combining Level Crossing and Auditory
Features",
BOOKTITLE = PReMI07,
YEAR = "2007",
PAGES = "447--454",
BIBSOURCE = "http://www.visionbib.com/bibliography/other1024sa1.html#TT372179"}
@inproceedings{bb378085,
AUTHOR = "Varallyay, G.",
TITLE = "{SSM}: A Novel Method to Recognize the Fundamental Frequency in Voice
Signals",
BOOKTITLE = CIARP07,
YEAR = "2007",
PAGES = "88--95",
BIBSOURCE = "http://www.visionbib.com/bibliography/other1024sa1.html#TT372180"}
@inproceedings{bb378086,
AUTHOR = "Ferrer, C. A. and Gonzalez, E. and Hernandez Diaz, M. E.",
TITLE = "Evaluation of Time and Frequency Domain-Based Methods for the
Estimation of Harmonics-to-Noise-Ratios in Voice Signals",
BOOKTITLE = CIARP06,
YEAR = "2006",
PAGES = "406--415",
BIBSOURCE = "http://www.visionbib.com/bibliography/other1024sa1.html#TT372181"}
@inproceedings{bb378087,
AUTHOR = "Xue, W. and Du, S. and Fang, C. Z. and Ye, Y. X.",
TITLE = "Voice Activity Detection Using Wavelet-Based Multiresolution Spectrum
and Support Vector Machines and Audio Mixing Algorithm",
BOOKTITLE = CVHCI06,
YEAR = "2006",
PAGES = "78--88",
BIBSOURCE = "http://www.visionbib.com/bibliography/other1024sa1.html#TT372182"}
@inproceedings{bb378088,
AUTHOR = "Garcia Perera, L. P. and Nolazco Flores, J. A. and Mex Perera, C.",
TITLE = "Cryptographic-Speech-Key Generation Architecture Improvements",
BOOKTITLE = IbPRIA05,
YEAR = "2005",
PAGES = "II:579",
BIBSOURCE = "http://www.visionbib.com/bibliography/other1024sa1.html#TT372183"}
@inproceedings{bb378089,
AUTHOR = "Welk, M. and Bergmeister, A. and Weickert, J.",
TITLE = "Denoising of Audio Data by Nonlinear Diffusion",
BOOKTITLE = ScaleSpace05,
YEAR = "2005",
PAGES = "598--609",
BIBSOURCE = "http://www.visionbib.com/bibliography/other1024sa1.html#TT372184"}
@inproceedings{bb378090,
AUTHOR = "Cristani, M. and Bicego, M. and Murino, V.",
TITLE = "On-line adaptive background modelling for audio surveillance",
BOOKTITLE = ICPR04,
YEAR = "2004",
PAGES = "II: 399--402",
BIBSOURCE = "http://www.visionbib.com/bibliography/other1024sa1.html#TT372185"}
@inproceedings{bb378091,
AUTHOR = "Lefevre, S. and Maillard, B. and Vincent, N.",
TITLE = "A two level classifier process for audio segmentation",
BOOKTITLE = ICPR02,
YEAR = "2002",
PAGES = "III: 891--894",
BIBSOURCE = "http://www.visionbib.com/bibliography/other1024sa1.html#TT372186"}
@inproceedings{bb378092,
AUTHOR = "de Stefano, C. and Della Cioppa, A. and Marcelli, A.",
TITLE = "An investigation on {MPEG} audio segmentation by evolutionary algorithms",
BOOKTITLE = ICDAR01,
YEAR = "2001",
PAGES = "952--956",
BIBSOURCE = "http://www.visionbib.com/bibliography/other1024sa1.html#TT372187"}
@inproceedings{bb378093,
AUTHOR = "Edmonds, E. A. and Pan, L. Y. and O'Brien, S. M.",
TITLE = "Automatic feature extraction from spectrograms for acoustic-phonetic
analysis",
BOOKTITLE = ICPR92,
YEAR = "1992",
PAGES = "II:701--704",
BIBSOURCE = "http://www.visionbib.com/bibliography/other1024sa1.html#TT372188"}
@article{bb378094,
AUTHOR = "Mumolo, E.",
TITLE = "Spectral domain texture analysis for speech enhancement",
JOURNAL = PR,
VOLUME = "35",
YEAR = "2002",
NUMBER = "10",
MONTH = oct,
PAGES = "2181--2191",
BIBSOURCE = "http://www.visionbib.com/bibliography/other1024spen2.html#TT372189"}
@article{bb378095,
AUTHOR = "Chang, J. H. and Gazor, S. and Kim, N. S. and Mitra, S. K.",
TITLE = "Multiple statistical models for soft decision in noisy speech
enhancement",
JOURNAL = PR,
VOLUME = "40",
YEAR = "2007",
NUMBER = "3",
MONTH = mar,
PAGES = "1123--1134",
BIBSOURCE = "http://www.visionbib.com/bibliography/other1024spen2.html#TT372190"}
@article{bb378096,
AUTHOR = "Esch, T. and Rungeler, M. and Heese, F. and Vary, P.",
TITLE = "Estimation of Rapidly Time-Varying Harmonic Noise for Speech
Enhancement",
JOURNAL = SPLetters,
VOLUME = "19",
YEAR = "2012",
NUMBER = "10",
MONTH = oct,
PAGES = "659--662",
BIBSOURCE = "http://www.visionbib.com/bibliography/other1024spen2.html#TT372191"}
@article{bb378097,
AUTHOR = "Mohammadiha, N. and Martin, R. and Leijon, A.",
TITLE = "Spectral Domain Speech Enhancement Using {HMM} State-Dependent
Super-{Gaussian} Priors",
JOURNAL = SPLetters,
VOLUME = "20",
YEAR = "2013",
NUMBER = "3",
MONTH = mar,
PAGES = "253--256",
BIBSOURCE = "http://www.visionbib.com/bibliography/other1024spen2.html#TT372192"}
@article{bb378098,
AUTHOR = "Taal, C. H. and Jensen, J. and Leijon, A.",
TITLE = "On Optimal Linear Filtering of Speech for Near-End Listening
Enhancement",
JOURNAL = SPLetters,
VOLUME = "20",
YEAR = "2013",
NUMBER = "3",
MONTH = mar,
PAGES = "225--228",
BIBSOURCE = "http://www.visionbib.com/bibliography/other1024spen2.html#TT372193"}
@article{bb378099,
AUTHOR = "Szurley, J. and Bertrand, A. and Moonen, M.",
TITLE = "On the Use of Time-Domain Widely Linear Filtering
for Binaural Speech Enhancement",
JOURNAL = SPLetters,
VOLUME = "20",
YEAR = "2013",
NUMBER = "7",
PAGES = "649--652",
BIBSOURCE = "http://www.visionbib.com/bibliography/other1024spen2.html#TT372194"}
Last update: Apr 6, 2026 at 11:28:57