Keith Price Bibliography Bibtex Entry (ANCHOR 378800 URL http://dx.doi.org/10.1109/TSMCA.2012.2210413 PAGES 76-91 YEAR 2013 MONTH January NUMBER 1 BIBSOURCE http://www.visionbib.com/bibliography/other1023.html#TT372893 VOLUME 43 JOURNAL HMS AUTHOR Keefer, R. and Liu, Y. and Bourbakis, N. TITLE The Development and Evaluation of an Eyes-Free Interaction Model for Mobile Reading Devices)


@article{bb378800,
  author    = {Keefer, R. and Liu, Y. and Bourbakis, N.},
  title     = {The Development and Evaluation of an Eyes-Free Interaction Model for Mobile Reading Devices},
  journal   = HMS,
  volume    = {43},
  number    = {1},
  pages     = {76-91},
  month     = {January},
  year      = {2013},
  doi       = {10.1109/TSMCA.2012.2210413},
  bibsource = {http://www.visionbib.com/bibliography/other1023.html#TT372893},
}

@article{bb378801,
  author    = {O'Shaughnessy, D. and Deng, L. and Li, H.},
  title     = {Speech Information Processing: Theory and Applications},
  journal   = PIEEE,
  volume    = {100},
  number    = {5},
  pages     = {1034-1037},
  month     = {May},
  year      = {2013},
  bibsource = {http://www.visionbib.com/bibliography/other1023.html#TT372894},
}

@article{bb378802,
  author    = {O'Shaughnessy, D.},
  title     = {Acoustic Analysis for Automatic Speech Recognition},
  journal   = PIEEE,
  volume    = {100},
  number    = {5},
  pages     = {1038-1053},
  month     = {May},
  year      = {2013},
  bibsource = {http://www.visionbib.com/bibliography/other1023.html#TT372895},
}

@article{bb378803,
  author    = {Fosler Lussier, E. and He, Y. and Jyothi, P. and Prabhavalkar, R.},
  title     = {Conditional Random Fields in Speech, Audio, and Language Processing},
  journal   = PIEEE,
  volume    = {100},
  number    = {5},
  pages     = {1054-1075},
  month     = {May},
  year      = {2013},
  bibsource = {http://www.visionbib.com/bibliography/other1023.html#TT372896},
}

@article{bb378804,
  author    = {Hermansky, H.},
  title     = {Multistream Recognition of Speech: Dealing With Unknown Unknowns},
  journal   = PIEEE,
  volume    = {100},
  number    = {5},
  pages     = {1076-1088},
  month     = {May},
  year      = {2013},
  bibsource = {http://www.visionbib.com/bibliography/other1023.html#TT372897},
}

@article{bb378805,
  author    = {Lee, C.H. and Siniscalchi, S.M.},
  title     = {An Information-Extraction Approach to Speech Processing: Analysis, Detection, Verification, and Recognition},
  journal   = PIEEE,
  volume    = {100},
  number    = {5},
  pages     = {1089-1115},
  month     = {May},
  year      = {2013},
  bibsource = {http://www.visionbib.com/bibliography/other1023.html#TT372898},
}

@article{bb378806,
  author    = {He, X. and Deng, L.},
  title     = {Speech-Centric Information Processing: An Optimization-Oriented Approach},
  journal   = PIEEE,
  volume    = {100},
  number    = {5},
  pages     = {1116-1135},
  month     = {May},
  year      = {2013},
  bibsource = {http://www.visionbib.com/bibliography/other1023.html#TT372899},
}

@article{bb378807,
  author    = {Young, S. and Gasic, M. and Thomson, B. and Williams, J.D.},
  title     = {{POMDP}-Based Statistical Spoken Dialog Systems: A Review},
  journal   = PIEEE,
  volume    = {100},
  number    = {5},
  pages     = {1160-1179},
  month     = {May},
  year      = {2013},
  bibsource = {http://www.visionbib.com/bibliography/other1023.html#TT372900},
}

@article{bb378808,
  author    = {Li, W.F. and Zhou, Y.C. and Poh, N. and Zhou, F. and Liao, Q.M.},
  title     = {Feature Denoising Using Joint Sparse Representation for In-Car Speech Recognition},
  journal   = SPLetters,
  volume    = {20},
  number    = {7},
  pages     = {681-684},
  year      = {2013},
  bibsource = {http://www.visionbib.com/bibliography/other1023.html#TT372901},
}

@article{bb378809,
  author    = {Hermansky, H. and Cohen, J.R. and Stern, R.M.},
  title     = {Perceptual Properties of Current Speech Recognition Technology},
  journal   = PIEEE,
  volume    = {101},
  number    = {9},
  pages     = {1968-1985},
  year      = {2013},
  bibsource = {http://www.visionbib.com/bibliography/other1023.html#TT372902},
}

@article{bb378810,
  author    = {Kolossa, D. and Zeiler, S. and Saeidi, R. and Astudillo, R.F.},
  title     = {Noise-Adaptive {LDA}: A New Approach for Speech Recognition Under Observation Uncertainty},
  journal   = SPLetters,
  volume    = {20},
  number    = {11},
  pages     = {1018-1021},
  year      = {2013},
  bibsource = {http://www.visionbib.com/bibliography/other1023.html#TT372903},
}

@article{bb378811,
  author    = {Saeidi, R. and Astudillo, R.F. and Kolossa, D.},
  title     = {Uncertain {LDA}: Including Observation Uncertainties in Discriminative Transforms},
  journal   = PAMI,
  volume    = {38},
  number    = {7},
  pages     = {1479-1488},
  month     = {July},
  year      = {2016},
  bibsource = {http://www.visionbib.com/bibliography/other1023.html#TT372904},
}

@article{bb378812,
  author    = {Kim, K.T. and Lin, K.H. and Walther, D.B. and Hasegawa Johnson, M.A. and Huang, T.S.},
  title     = {Automatic detection of auditory salience with optimized linear filters derived from human annotation},
  journal   = PRL,
  volume    = {38},
  number    = {1},
  pages     = {78-85},
  year      = {2014},
  bibsource = {http://www.visionbib.com/bibliography/other1023.html#TT372905},
}

@article{bb378813,
  author    = {Huang, X.D. and Baker, J. and Reddy, R.},
  title     = {A Historical Perspective of Speech Recognition},
  journal   = CACM,
  volume    = {57},
  number    = {1},
  pages     = {94-103},
  month     = {January},
  year      = {2014},
  bibsource = {http://www.visionbib.com/bibliography/other1023.html#TT372906},
}

@article{bb378814,
  author    = {Shi, Y.Z. and Zhang, W.Q. and Cai, M. and Liu, J.},
  title     = {Efficient One-Pass Decoding with {NNLM} for Speech Recognition},
  journal   = SPLetters,
  volume    = {21},
  number    = {4},
  pages     = {377-381},
  month     = {April},
  year      = {2014},
  bibsource = {http://www.visionbib.com/bibliography/other1023.html#TT372907},
}

@article{bb378815,
  author    = {Zhang, W.B. and Fung, P.},
  title     = {Efficient Sparse Banded Acoustic Models for Speech Recognition},
  journal   = SPLetters,
  volume    = {21},
  number    = {3},
  pages     = {280-283},
  month     = {March},
  year      = {2014},
  bibsource = {http://www.visionbib.com/bibliography/other1023.html#TT372908},
}

@article{bb378816,
  author    = {Triefenbach, F. and Demuynck, K. and Martens, J.P.},
  title     = {Large Vocabulary Continuous Speech Recognition With Reservoir-Based Acoustic Models},
  journal   = SPLetters,
  volume    = {21},
  number    = {3},
  pages     = {311-315},
  month     = {March},
  year      = {2014},
  bibsource = {http://www.visionbib.com/bibliography/other1023.html#TT372909},
}

@article{bb378817,
  author    = {Diez, M. and Varona, A. and Penagarikano, M. and Rodriguez Fuentes, L.J. and Bordel, G.},
  title     = {On the Complementarity of Phone Posterior Probabilities for Improved Speaker Recognition},
  journal   = SPLetters,
  volume    = {21},
  number    = {6},
  pages     = {649-652},
  month     = {June},
  year      = {2014},
  bibsource = {http://www.visionbib.com/bibliography/other1023.html#TT372910},
}

@inproceedings{bb378818,
  author    = {Diez, M. and Penagarikano, M. and Varona, A. and Rodriguez Fuentes, L.J. and Bordel, G.},
  title     = {On the Use of Dot Scoring for Speaker Diarization},
  booktitle = IbPRIA11,
  pages     = {612-619},
  year      = {2011},
  bibsource = {http://www.visionbib.com/bibliography/other1023.html#TT372911},
}

@article{bb378819,
  author    = {Rasanen, O. and Laine, U.K.},
  title     = {A method for noise-robust context-aware pattern discovery and recognition from categorical sequences},
  journal   = PR,
  volume    = {45},
  number    = {1},
  pages     = {606-616},
  year      = {2012},
  bibsource = {http://www.visionbib.com/bibliography/other1023.html#TT372912},
}

@article{bb378820,
  author    = {Liu, N.H.},
  title     = {Effective Results Ranking for Mobile Query by Singing/Humming Using a Hybrid Recommendation Mechanism},
  journal   = MultMed,
  volume    = {16},
  number    = {5},
  pages     = {1407-1420},
  month     = {August},
  year      = {2014},
  bibsource = {http://www.visionbib.com/bibliography/other1023.html#TT372913},
}

@article{bb378821,
  author    = {Schneiderman, R.},
  title     = {Accuracy, Apps Advance Speech Recognition},
  journal   = SPMag,
  volume    = {32},
  number    = {1},
  pages     = {12-125},
  month     = {January},
  year      = {2015},
  bibsource = {http://www.visionbib.com/bibliography/other1023.html#TT372914},
}

@article{bb378822,
  author    = {Ban, S.M. and Kim, H.S.},
  title     = {Weight-Space {Viterbi} Decoding Based Spectral Subtraction for Reverberant Speech Recognition},
  journal   = SPLetters,
  volume    = {22},
  number    = {9},
  pages     = {1424-1428},
  month     = {September},
  year      = {2015},
  bibsource = {http://www.visionbib.com/bibliography/other1023.html#TT372915},
}

@article{bb378823,
  author    = {Sakano, T. and Kobayashi, Y. and Kondo, K.},
  title     = {A Speech Intelligibility Estimation Method Using a Non-reference Feature Set},
  journal   = IEICE,
  volume    = {E98-D},
  number    = {1},
  pages     = {21-28},
  month     = {January},
  year      = {2015},
  bibsource = {http://www.visionbib.com/bibliography/other1023.html#TT372916},
}

@article{bb378824,
  author    = {Khaldi, K. and Boudraa, A.O. and Torresani, B. and Chonavel, T.},
  title     = {{HHT}-based audio coding},
  journal   = SIViP,
  volume    = {9},
  number    = {1},
  pages     = {107-115},
  month     = {January},
  year      = {2015},
  bibsource = {http://www.visionbib.com/bibliography/other1023.html#TT372917},
}

@article{bb378825,
  author    = {Savchenko, A.V. and Savchenko, L.V.},
  title     = {Towards the creation of reliable voice control system based on a fuzzy approach},
  journal   = PRL,
  volume    = {65},
  number    = {1},
  pages     = {145-151},
  year      = {2015},
  bibsource = {http://www.visionbib.com/bibliography/other1023.html#TT372918},
}

@article{bb378826,
  author    = {Suh, Y.J. and Kim, H.},
  title     = {Probabilistic Class Histogram Equalization Based on Posterior Mean Estimation for Robust Speech Recognition},
  journal   = SPLetters,
  volume    = {22},
  number    = {12},
  pages     = {2421-2424},
  month     = {December},
  year      = {2015},
  bibsource = {http://www.visionbib.com/bibliography/other1023.html#TT372919},
}

@article{bb378827,
  author    = {Wang, X.Y. and Yamamoto, S.},
  title     = {Speech Recognition of {English} by {Japanese} Using Lexicon Represented by Multiple Reduced Phoneme Sets},
  journal   = IEICE,
  volume    = {E98-D},
  number    = {12},
  pages     = {2271-2279},
  month     = {December},
  year      = {2015},
  bibsource = {http://www.visionbib.com/bibliography/other1023.html#TT372920},
}

@article{bb378828,
  author    = {Tohidypour, H.R. and Banitalebi Dehkordi, A.},
  title     = {Speech frame recognition based on less shift sensitive wavelet filter banks},
  journal   = SIViP,
  volume    = {10},
  number    = {4},
  pages     = {633-637},
  month     = {April},
  year      = {2016},
  bibsource = {http://www.visionbib.com/bibliography/other1023.html#TT372921},
}

@article{bb378829,
  author    = {Ansari, J.A. and Sathyamurthy, A. and Balasubramanyam, R.},
  title     = {An Open Voice Command Interface Kit},
  journal   = HMS,
  volume    = {46},
  number    = {3},
  pages     = {467-473},
  month     = {June},
  year      = {2016},
  bibsource = {http://www.visionbib.com/bibliography/other1023.html#TT372922},
}

@article{bb378830,
  author    = {Cho, B.J. and Kwon, H. and Cho, J.W. and Kim, C. and Stern, R.M. and Park, H.M.},
  title     = {A Subband-Based Stationary-Component Suppression Method Using Harmonics and Power Ratio for Reverberant Speech Recognition},
  journal   = SPLetters,
  volume    = {23},
  number    = {6},
  pages     = {780-784},
  month     = {June},
  year      = {2016},
  bibsource = {http://www.visionbib.com/bibliography/other1023.html#TT372923},
}

@article{bb378831,
  author    = {Ren, H. and Yan, Y.},
  title     = {Structural Optimization and Online Evolutionary Learning for Spoken Dialog Management},
  journal   = SPLetters,
  volume    = {23},
  number    = {7},
  pages     = {1013-1017},
  month     = {July},
  year      = {2016},
  bibsource = {http://www.visionbib.com/bibliography/other1023.html#TT372924},
}

@article{bb378832,
  author    = {Khoubrouy, S.A. and Hansen, J.H.L.},
  title     = {Microphone Array Processing Strategies for Distant-Based Automatic Speech Recognition},
  journal   = SPLetters,
  volume    = {23},
  number    = {10},
  pages     = {1344-1348},
  month     = {October},
  year      = {2016},
  bibsource = {http://www.visionbib.com/bibliography/other1023.html#TT372925},
}

@article{bb378833,
  author    = {Lamberti, F. and Manuri, F. and Paravati, G. and Piumatti, G. and Sanna, A.},
  title     = {Using Semantics to Automatically Generate Speech Interfaces for Wearable Virtual and Augmented Reality Applications},
  journal   = HMS,
  volume    = {47},
  number    = {1},
  pages     = {152-164},
  month     = {February},
  year      = {2017},
  bibsource = {http://www.visionbib.com/bibliography/other1023.html#TT372926},
}

@article{bb378834,
  author    = {Ganapathy, S.},
  title     = {Multivariate Autoregressive Spectrogram Modeling for Noisy Speech Recognition},
  journal   = SPLetters,
  volume    = {24},
  number    = {9},
  pages     = {1373-1377},
  month     = {September},
  year      = {2017},
  bibsource = {http://www.visionbib.com/bibliography/other1023.html#TT372927},
}

@article{bb378835,
  author    = {Monroe, D.},
  title     = {Digital Hearing},
  journal   = CACM,
  volume    = {60},
  number    = {10},
  pages     = {18-20},
  month     = {October},
  year      = {2017},
  bibsource = {http://www.visionbib.com/bibliography/other1023.html#TT372928},
}

@article{bb378836,
  author    = {Kim, J. and Hahn, M.},
  title     = {Voice Activity Detection Using an Adaptive Context Attention Model},
  journal   = SPLetters,
  volume    = {25},
  number    = {8},
  pages     = {1181-1185},
  month     = {August},
  year      = {2018},
  bibsource = {http://www.visionbib.com/bibliography/other1023.html#TT372929},
}

@article{bb378837,
  author    = {Edwards, J.},
  title     = {Something to Talk About: Signal Processing in Speech and Audiology Research: Promising Investigations Explore New Opportunities in Human Communication},
  journal   = SPMag,
  volume    = {35},
  number    = {6},
  pages     = {8-12},
  month     = {November},
  year      = {2018},
  bibsource = {http://www.visionbib.com/bibliography/other1023.html#TT372930},
}

@article{bb378838,
  author    = {Shin, Y. and Yoo, K.M. and Lee, S.},
  title     = {Utterance Generation With Variational Auto-Encoder for Slot Filling in Spoken Language Understanding},
  journal   = SPLetters,
  volume    = {26},
  number    = {3},
  pages     = {505-509},
  month     = {March},
  year      = {2019},
  bibsource = {http://www.visionbib.com/bibliography/other1023.html#TT372931},
}

@article{bb378839,
  author    = {Yang, B.H. and Yao, Z.P. and Lu, H. and Zhou, Y.Q. and Xu, J.K.},
  title     = {In-classroom learning analytics based on student behavior, topic and teaching characteristic mining},
  journal   = PRL,
  volume    = {129},
  pages     = {224-231},
  year      = {2020},
  bibsource = {http://www.visionbib.com/bibliography/other1023.html#TT372932},
}

@article{bb378840,
  author    = {Chandrakala, S. and Jayalakshmi, S.L.},
  title     = {Generative Model Driven Representation Learning in a Hybrid Framework for Environmental Audio Scene and Sound Event Recognition},
  journal   = MultMed,
  volume    = {22},
  number    = {1},
  pages     = {3-14},
  month     = {January},
  year      = {2020},
  bibsource = {http://www.visionbib.com/bibliography/other1023.html#TT372933},
}

@article{bb378841,
  author    = {Yadav, I.C. and Pradhan, G.},
  title     = {Significance of Pitch-Based Spectral Normalization for Children's Speech Recognition},
  journal   = SPLetters,
  volume    = {26},
  number    = {12},
  pages     = {1822-1826},
  month     = {December},
  year      = {2019},
  bibsource = {http://www.visionbib.com/bibliography/other1023.html#TT372934},
}

@article{bb378842,
  author    = {Shahnawazuddin, S. and Adiga, N. and Kathania, H.K. and Sai, B.T.},
  title     = {Creating speaker independent {ASR} system through prosody modification based data augmentation},
  journal   = PRL,
  volume    = {131},
  pages     = {213-218},
  year      = {2020},
  bibsource = {http://www.visionbib.com/bibliography/other1023.html#TT372935},
}

@article{bb378843,
  author    = {Park, T.J. and Han, K.J. and Kumar, M. and Narayanan, S.},
  title     = {Auto-Tuning Spectral Clustering for Speaker Diarization Using Normalized Maximum Eigengap},
  journal   = SPLetters,
  volume    = {27},
  pages     = {381-385},
  year      = {2020},
  bibsource = {http://www.visionbib.com/bibliography/other1023.html#TT372936},
}

@article{bb378844,
  author    = {Deb, S. and Dandapat, S. and Krajewski, J.},
  title     = {Analysis and Classification of Cold Speech Using Variational Mode Decomposition},
  journal   = AffCom,
  volume    = {11},
  number    = {2},
  pages     = {296-307},
  month     = {April},
  year      = {2020},
  bibsource = {http://www.visionbib.com/bibliography/other1023.html#TT372937},
}

@article{bb378845,
  author    = {Sanchez Junquera, J. and Villasenor Pineda, L. and {Montes y Gomez}, M. and Rosso, P. and Stamatatos, E.},
  title     = {Masking domain-specific information for cross-domain deception detection},
  journal   = PRL,
  volume    = {135},
  pages     = {122-130},
  year      = {2020},
  bibsource = {http://www.visionbib.com/bibliography/other1023.html#TT372938},
}

@inproceedings{bb378846,
  author    = {Rill Garcia, R. and Villasenor Pineda, L. and Reyes Meza, V. and Escalante, H.J.},
  title     = {From Text to Speech: A Multimodal Cross-Domain Approach for Deception Detection},
  booktitle = MIPPSNA18,
  pages     = {164-177},
  year      = {2018},
  bibsource = {http://www.visionbib.com/bibliography/other1023.html#TT372939},
}

@article{bb378847,
  author    = {Lim, H. and Kim, Y. and Kim, H.},
  title     = {Cross-Informed Domain Adversarial Training for Noise-Robust Wake-Up Word Detection},
  journal   = SPLetters,
  volume    = {27},
  pages     = {1769-1773},
  year      = {2020},
  bibsource = {http://www.visionbib.com/bibliography/other1023.html#TT372940},
}

@article{bb378848,
  author    = {Zhao, L. and Zhang, A. and Liu, Y. and Fei, H.},
  title     = {Encoding multi-granularity structural information for joint {Chinese} word segmentation and {POS} tagging},
  journal   = PRL,
  volume    = {138},
  pages     = {163-169},
  year      = {2020},
  bibsource = {http://www.visionbib.com/bibliography/other1023.html#TT372941},
}

@article{bb378849,
  author    = {Bang, J. and Han, S. and Lee, J.H.},
  title     = {Listening-oriented response generation by exploiting user responses},
  journal   = PRL,
  volume    = {140},
  pages     = {230-237},
  year      = {2020},
  bibsource = {http://www.visionbib.com/bibliography/other1023.html#TT372942},
}

@article{bb378850,
  author    = {Zhou, J.T.Y. and Zhang, H. and Jin, D. and Peng, X.},
  title     = {Dual Adversarial Transfer for Sequence Labeling},
  journal   = PAMI,
  volume    = {43},
  number    = {2},
  pages     = {434-446},
  month     = {February},
  year      = {2021},
  bibsource = {http://www.visionbib.com/bibliography/other1023.html#TT372943},
}

@article{bb378851,
  author    = {Chen, N. and Watanabe, S. and Villalba, J. and Zelasko, P. and Dehak, N.},
  title     = {Non-Autoregressive Transformer for Speech Recognition},
  journal   = SPLetters,
  volume    = {28},
  pages     = {121-125},
  year      = {2021},
  bibsource = {http://www.visionbib.com/bibliography/other1023.html#TT372944},
}

@article{bb378852,
  author    = {Haeb Umbach, R. and Heymann, J. and Drude, L. and Watanabe, S. and Delcroix, M. and Nakatani, T.},
  title     = {Far-Field Automatic Speech Recognition},
  journal   = PIEEE,
  volume    = {109},
  number    = {2},
  pages     = {124-148},
  month     = {February},
  year      = {2021},
  bibsource = {http://www.visionbib.com/bibliography/other1023.html#TT372945},
}

@article{bb378853,
  author    = {Fritsch, J. and Magimai Doss, M.},
  title     = {Utterance Verification-Based Dysarthric Speech Intelligibility Assessment Using Phonetic Posterior Features},
  journal   = SPLetters,
  volume    = {28},
  pages     = {224-228},
  year      = {2021},
  bibsource = {http://www.visionbib.com/bibliography/other1023.html#TT372946},
}

@article{bb378854,
  author    = {Lu, L. and Kanda, N. and Li, J.Y. and Gong, Y.F.},
  title     = {Streaming End-to-End Multi-Talker Speech Recognition},
  journal   = SPLetters,
  volume    = {28},
  pages     = {803-807},
  year      = {2021},
  bibsource = {http://www.visionbib.com/bibliography/other1023.html#TT372947},
}

@article{bb378855,
  author    = {Yi, C. and Zhou, S.Y. and Xu, B.},
  title     = {Efficiently Fusing Pretrained Acoustic and Linguistic Encoders for Low-Resource Speech Recognition},
  journal   = SPLetters,
  volume    = {28},
  pages     = {788-792},
  year      = {2021},
  bibsource = {http://www.visionbib.com/bibliography/other1023.html#TT372948},
}

@article{bb378856,
  author    = {Xu, P. and Huang, Y. and Yuan, T. and Xiang, T. and Hospedales, T.M. and Song, Y.Z. and Wang, L.},
  title     = {On Learning Semantic Representations for Large-Scale Abstract Sketches},
  journal   = CirSysVideo,
  volume    = {31},
  number    = {9},
  pages     = {3366-3379},
  month     = {September},
  year      = {2021},
  bibsource = {http://www.visionbib.com/bibliography/other1023.html#TT372949},
}

@article{bb378857,
  author    = {Kim, J. and Lee, Y.},
  title     = {Improving End-to-End Contextual Speech Recognition via a Word-Matching Algorithm With Backward Search},
  journal   = SPLetters,
  volume    = {28},
  pages     = {2087-2091},
  year      = {2021},
  bibsource = {http://www.visionbib.com/bibliography/other1023.html#TT372950},
}

@article{bb378858,
  author    = {Zhu, S. and Zhang, Y. and He, K. and Zhao, L.},
  title     = {Acoustic Word Embedding Based on Multi-Head Attention Quadruplet Network},
  journal   = SPLetters,
  volume    = {29},
  pages     = {184-188},
  year      = {2022},
  bibsource = {http://www.visionbib.com/bibliography/other1023.html#TT372951},
}

@article{bb378859,
  author    = {Tiwari, R. and Sharma, V. and Sahoo, R.C.},
  title     = {Isolated spoken word recognition using packed-{MFCC} on padded-voice signal for unscripted languages},
  journal   = IJCVR,
  volume    = {12},
  number    = {2},
  pages     = {120-140},
  year      = {2022},
  bibsource = {http://www.visionbib.com/bibliography/other1023.html#TT372952},
}

@article{bb378860,
  author    = {Tian, Z.K. and Yi, J.Y. and Tao, J.H. and Zhang, S. and Wen, Z.Q.},
  title     = {Hybrid Autoregressive and Non-Autoregressive Transformer Models for Speech Recognition},
  journal   = SPLetters,
  volume    = {29},
  pages     = {762-766},
  year      = {2022},
  bibsource = {http://www.visionbib.com/bibliography/other1023.html#TT372953},
}

@article{bb378861,
  author    = {Xiao, F.Y. and Guan, J. and Lan, H.Y. and Zhu, Q. and Wang, W.W.},
  title     = {Local Information Assisted Attention-Free Decoder for Audio Captioning},
  journal   = SPLetters,
  volume    = {29},
  pages     = {1604-1608},
  year      = {2022},
  bibsource = {http://www.visionbib.com/bibliography/other1023.html#TT372954},
}

@article{bb378862,
  author    = {Perochon, S.},
  title     = {A Presentation and Short Discussion of {rVAD-fast}, a Fast Voice Activity Detector},
  journal   = IPOL,
  volume    = {12},
  pages     = {404-419},
  year      = {2022},
  bibsource = {http://www.visionbib.com/bibliography/other1023.html#TT372955},
}

@article{bb378863,
  author    = {Huang, H.J. and Huang, P.J. and Zhu, Z.B. and Li, J. and Lin, P.},
  title     = {{CLID}: A Chunk-Level Intent Detection Framework for Multiple Intent Spoken Language Understanding},
  journal   = SPLetters,
  volume    = {29},
  pages     = {2123-2127},
  year      = {2022},
  bibsource = {http://www.visionbib.com/bibliography/other1023.html#TT372956},
}

@article{bb378864,
  author    = {Du, X. and Pun, C.M.},
  title     = {Robust Audio Patch Attacks Using Physical Sample Simulation and Adversarial Patch Noise Generation},
  journal   = MultMed,
  volume    = {24},
  pages     = {4381-4393},
  year      = {2022},
  bibsource = {http://www.visionbib.com/bibliography/other1023.html#TT372957},
}

@article{bb378865,
  author    = {Kim, H. and Park, J. and Lee, J.W.},
  title     = {Generating Transferable Adversarial Examples for Speech Classification},
  journal   = PR,
  volume    = {137},
  pages     = {109286},
  year      = {2023},
  bibsource = {http://www.visionbib.com/bibliography/other1023.html#TT372958},
}

@article{bb378866,
  author    = {Wei, G.Y. and Duan, Z.K. and Li, S. and Yu, X.M. and Yang, G.G.},
  title     = {{LFEformer}: Local Feature Enhancement Using Sliding Window With Deformability for Automatic Speech Recognition},
  journal   = SPLetters,
  volume    = {30},
  pages     = {180-184},
  year      = {2023},
  bibsource = {http://www.visionbib.com/bibliography/other1023.html#TT372959},
}

@article{bb378867,
  author    = {Xiao, F.Y. and Guan, J. and Zhu, Q. and Wang, W.W.},
  title     = {Graph Attention for Automated Audio Captioning},
  journal   = SPLetters,
  volume    = {30},
  pages     = {413-417},
  year      = {2023},
  bibsource = {http://www.visionbib.com/bibliography/other1023.html#TT372960},
}

@article{bb378868,
  author    = {Chang, C.M. and Lee, C.C.},
  title     = {Learning Enhanced Acoustic Latent Representation for Small Scale Affective Corpus with Adversarial Cross Corpora Integration},
  journal   = AffCom,
  volume    = {14},
  number    = {2},
  pages     = {1308-1321},
  month     = {April},
  year      = {2023},
  bibsource = {http://www.visionbib.com/bibliography/other1023.html#TT372961},
}

@article{bb378869,
  author    = {Qu, H.L. and Su, X.D. and Wang, Y. and Hao, X. and Gao, G.L.},
  title     = {Noise-Separated Adaptive Feature Distillation for Robust Speech Recognition},
  journal   = SPLetters,
  volume    = {30},
  pages     = {763-767},
  year      = {2023},
  bibsource = {http://www.visionbib.com/bibliography/other1023.html#TT372962},
}

@article{bb378870,
  author    = {Nga, C.H. and Vu, D.Q. and Luong, H.H. and Huang, C.L. and Wang, J.C.},
  title     = {Cyclic Transfer Learning for {Mandarin}-{English} Code-Switching Speech Recognition},
  journal   = SPLetters,
  volume    = {30},
  pages     = {1387-1391},
  year      = {2023},
  bibsource = {http://www.visionbib.com/bibliography/other1023.html#TT372963},
}

@article{bb378871,
  author    = {Dong, F. and Qian, Y.Y. and Wang, T.L. and Liu, P. and Cao, J.W.},
  title     = {A Transformer-Based End-to-End Automatic Speech Recognition Algorithm},
  journal   = SPLetters,
  volume    = {30},
  pages     = {1592-1596},
  year      = {2023},
  bibsource = {http://www.visionbib.com/bibliography/other1023.html#TT372964},
}

@article{bb378872,
  author    = {Fan, P. and Shan, C.H. and Sun, S.N. and Yang, Q. and Zhang, J.W.},
  title     = {Key Frame Mechanism for Efficient Conformer Based End-to-End Speech Recognition},
  journal   = SPLetters,
  volume    = {30},
  pages     = {1612-1616},
  year      = {2023},
  bibsource = {http://www.visionbib.com/bibliography/other1023.html#TT372965},
}

@comment{bb378873: the generator's placeholder page range (xx-yy) is omitted below so it is not printed; add the real article number once it is known.}
@article{bb378873,
  author    = {Mahmoudi, H. and Camboim, S. and Brovelli, M.A.},
  title     = {Development of a Voice Virtual Assistant for the Geospatial Data Visualization Application on the Web},
  journal   = IJGI,
  volume    = {12},
  number    = {11},
  year      = {2023},
  bibsource = {http://www.visionbib.com/bibliography/other1023.html#TT372966},
}

@article{bb378874,
  author    = {Vitolo, P. and Liguori, R. and di Benedetto, L. and Rubino, A. and Licciardo, G.D.},
  title     = {Automatic Audio Feature Extraction for Keyword Spotting},
  journal   = SPLetters,
  volume    = {31},
  pages     = {161-165},
  year      = {2024},
  bibsource = {http://www.visionbib.com/bibliography/other1023.html#TT372967},
}

@article{bb378875,
  author    = {Li, J.H. and Duan, Z.K. and Li, S. and Yu, X.M. and Yang, G.G.},
  title     = {{ESAformer}: Enhanced Self-Attention for Automatic Speech Recognition},
  journal   = SPLetters,
  volume    = {31},
  pages     = {471-475},
  year      = {2024},
  bibsource = {http://www.visionbib.com/bibliography/other1023.html#TT372968},
}

@article{bb378876,
  author    = {Nie, W.Z. and Bao, Y. and Zhao, Y. and Liu, A.},
  title     = {Long Dialogue Emotion Detection Based on Commonsense Knowledge Graph Guidance},
  journal   = MultMed,
  volume    = {26},
  pages     = {514-528},
  year      = {2024},
  bibsource = {http://www.visionbib.com/bibliography/other1023.html#TT372969},
}

@article{bb378877,
  author    = {Sun, T.L. and Chen, H.N. and Hu, G.S. and He, L.H. and Zhao, C.R.},
  title     = {Explainability of Speech Recognition Transformers via Gradient-Based Attention Visualization},
  journal   = MultMed,
  volume    = {26},
  pages     = {1395-1406},
  year      = {2024},
  bibsource = {http://www.visionbib.com/bibliography/other1023.html#TT372970},
}

@article{bb378878,
  author    = {Jacobs, C. and Kamper, H.},
  title     = {Leveraging Multilingual Transfer for Unsupervised Semantic Acoustic Word Embeddings},
  journal   = SPLetters,
  volume    = {31},
  pages     = {311-315},
  year      = {2024},
  bibsource = {http://www.visionbib.com/bibliography/other1023.html#TT372971},
}

@article{bb378879,
        AUTHOR = "Wang, F. Y. and Xu, B. and Xu, B.",
        TITLE = "{SSCFormer}: Push the Limit of Chunk-Wise {Conformer} for Streaming {ASR}
Using Sequentially Sampled Chunks and Chunked Causal Convolution",
        JOURNAL = SPLetters,
        VOLUME = "31",
        YEAR = "2024",
        PAGES = "421--425",
        BIBSOURCE = "http://www.visionbib.com/bibliography/other1023.html#TT372972"}

@article{bb378880,
        AUTHOR = "Fan, R. and Shankar, N. B. and Alwan, A.",
        TITLE = "{UniEnc-CASSNAT}: An Encoder-Only Non-Autoregressive {ASR} for Speech {SSL}
Models",
        JOURNAL = SPLetters,
        VOLUME = "31",
        YEAR = "2024",
        PAGES = "711--715",
        BIBSOURCE = "http://www.visionbib.com/bibliography/other1023.html#TT372973"}

@article{bb378881,
        AUTHOR = "Xing, B. and Tsang, I. W.",
        TITLE = "Co-Guiding for Multi-Intent Spoken Language Understanding",
        JOURNAL = PAMI,
        VOLUME = "46",
        YEAR = "2024",
        NUMBER = "5",
        MONTH = may,
        PAGES = "2965--2980",
        BIBSOURCE = "http://www.visionbib.com/bibliography/other1023.html#TT372974"}

@article{bb378882,
        AUTHOR = "Hwang, K. and Jung, I. H. and Lee, J. M.",
        TITLE = "An implementation of searchable video player",
        JOURNAL = IJCVR,
        VOLUME = "14",
        YEAR = "2024",
        NUMBER = "3",
        PAGES = "325--337",
        BIBSOURCE = "http://www.visionbib.com/bibliography/other1023.html#TT372975"}

@article{bb378883,
        AUTHOR = "Ma, Y. K. and Zhang, C. and Chen, Q. and Wang, W. and Ma, B.",
        TITLE = "Tuning Large Language Model for Speech Recognition With Mixed-Scale
Re-Tokenization",
        JOURNAL = SPLetters,
        VOLUME = "31",
        YEAR = "2024",
        PAGES = "1740--1744",
        BIBSOURCE = "http://www.visionbib.com/bibliography/other1023.html#TT372976"}

@article{bb378884,
        AUTHOR = "Mu, B. S. and Wan, X. and Zheng, N. and Zhou, H. and Xie, L.",
        TITLE = "{MMGER}: Multi-Modal and Multi-Granularity Generative Error Correction
With {LLM} for Joint Accent and Speech Recognition",
        JOURNAL = SPLetters,
        VOLUME = "31",
        YEAR = "2024",
        PAGES = "1940--1944",
        BIBSOURCE = "http://www.visionbib.com/bibliography/other1023.html#TT372977"}

@article{bb378885,
        AUTHOR = "Shi, Y. and Li, L. and Wang, D. and Han, J. Q.",
        TITLE = "Keyword Guided Target Speech Recognition",
        JOURNAL = SPLetters,
        VOLUME = "31",
        YEAR = "2024",
        PAGES = "1945--1949",
        BIBSOURCE = "http://www.visionbib.com/bibliography/other1023.html#TT372978"}

@article{bb378886,
        AUTHOR = "Gao, X. X. and Li, Z. X. and Chen, Y. M. and Liu, C. and Li, H. Z.",
        TITLE = "Transferable Adversarial Attacks Against {ASR}",
        JOURNAL = SPLetters,
        VOLUME = "31",
        YEAR = "2024",
        PAGES = "2200--2204",
        BIBSOURCE = "http://www.visionbib.com/bibliography/other1023.html#TT372979"}

@article{bb378887,
        AUTHOR = "Lu, H. and Cheng, G. F. and Yan, Y. H.",
        TITLE = "Conversational Short-Phrase Speaker Diarization via Self-Adjusting
Speech Segmentation and Embedding Extraction",
        JOURNAL = SPLetters,
        VOLUME = "31",
        YEAR = "2024",
        PAGES = "2340--2344",
        BIBSOURCE = "http://www.visionbib.com/bibliography/other1023.html#TT372980"}

@article{bb378888,
        AUTHOR = "Lee, C. W. and Lee, J. H. and Chang, J. H.",
        TITLE = "Language Model Personalization for Speech Recognition: A Clustered
Federated Learning Approach With Adaptive Weight Average",
        JOURNAL = SPLetters,
        VOLUME = "31",
        YEAR = "2024",
        PAGES = "2710--2714",
        BIBSOURCE = "http://www.visionbib.com/bibliography/other1023.html#TT372981"}

@article{bb378889,
        AUTHOR = "Xing, B. and Tsang, I. W.",
        TITLE = "{HC2L}: Hybrid and Cooperative Contrastive Learning for Cross-Lingual
Spoken Language Understanding",
        JOURNAL = PAMI,
        VOLUME = "46",
        YEAR = "2024",
        NUMBER = "12",
        MONTH = dec,
        PAGES = "8094--8105",
        BIBSOURCE = "http://www.visionbib.com/bibliography/other1023.html#TT372982"}

@article{bb378890,
        AUTHOR = "Chang, X. and Guo, P. C. and Fujita, Y. and Maekaku, T. and Watanabe, S.",
        TITLE = "{MC-Whisper}: Extending Speech Foundation Models to Multichannel
Distant Speech Recognition",
        JOURNAL = SPLetters,
        VOLUME = "31",
        YEAR = "2024",
        PAGES = "2850--2854",
        BIBSOURCE = "http://www.visionbib.com/bibliography/other1023.html#TT372983"}

@article{bb378891,
        AUTHOR = "Chen, Y. Q. and Niu, T. and Zhang, H. and Zhang, W. and Qu, D.",
        TITLE = "{Meta-Prompt}: Boosting {Whisper}'s Performance in Low-Resource Speech
Recognition",
        JOURNAL = SPLetters,
        VOLUME = "31",
        YEAR = "2024",
        PAGES = "3039--3043",
        BIBSOURCE = "http://www.visionbib.com/bibliography/other1023.html#TT372984"}

@article{bb378892,
        AUTHOR = "Zheng, L. and Zhu, H. and Tian, S. and Zhao, Q. W. and Li, T.",
        TITLE = "Unsupervised Domain Adaptation on End-to-End Multi-Talker Overlapped
Speech Recognition",
        JOURNAL = SPLetters,
        VOLUME = "31",
        YEAR = "2024",
        PAGES = "3119--3123",
        BIBSOURCE = "http://www.visionbib.com/bibliography/other1023.html#TT372985"}

@article{bb378893,
        AUTHOR = "Lee, H. and Yoon, J. W. and Kim, S. S. and Kim, N. S.",
        TITLE = "Towards Maximum Likelihood Training for Transducer-Based Streaming
Speech Recognition",
        JOURNAL = SPLetters,
        VOLUME = "32",
        YEAR = "2025",
        PAGES = "26--30",
        BIBSOURCE = "http://www.visionbib.com/bibliography/other1023.html#TT372986"}

@article{bb378894,
        AUTHOR = "Zhuang, X. and Qian, Y. K. and Wang, M. J.",
        TITLE = "Hypformer: A Fast Hypothesis-Driven Rescoring Speech Recognition
Framework",
        JOURNAL = SPLetters,
        VOLUME = "32",
        YEAR = "2025",
        PAGES = "471--475",
        BIBSOURCE = "http://www.visionbib.com/bibliography/other1023.html#TT372987"}

@article{bb378895,
        AUTHOR = "Akman, A. and Sun, Q. and Schuller, B. W.",
        TITLE = "Improving Audio Explanations Using Audio Language Models",
        JOURNAL = SPLetters,
        VOLUME = "32",
        YEAR = "2025",
        PAGES = "741--745",
        BIBSOURCE = "http://www.visionbib.com/bibliography/other1023.html#TT372988"}

@article{bb378896,
        AUTHOR = "Liu, Y. P. and Yang, X. and Zhang, J. Y. and Xi, Y. L. and Qu, D.",
        TITLE = "{TAML-Adapter}: Enhancing Adapter Tuning Through Task-Agnostic
Meta-Learning for Low-Resource Automatic Speech Recognition",
        JOURNAL = SPLetters,
        VOLUME = "32",
        YEAR = "2025",
        PAGES = "636--640",
        BIBSOURCE = "http://www.visionbib.com/bibliography/other1023.html#TT372989"}

@article{bb378897,
        AUTHOR = "Kumar, K. V. and Rao, R. R.",
        TITLE = "An approach for speaker diarisation using whale-anti coronavirus
optimisation integrated deep fuzzy clustering",
        JOURNAL = IJCVR,
        VOLUME = "15",
        YEAR = "2025",
        NUMBER = "2",
        PAGES = "177--197",
        BIBSOURCE = "http://www.visionbib.com/bibliography/other1023.html#TT372990"}

@article{bb378898,
        AUTHOR = "Kim, T. Y. and Yang, J. F. and Park, E.",
        TITLE = "{MSDLF-K}: A Multimodal Feature Learning Approach for Sentiment
Analysis in {Korean} Incorporating Text and Speech",
        JOURNAL = MultMed,
        VOLUME = "27",
        YEAR = "2025",
        PAGES = "1266--1276",
        BIBSOURCE = "http://www.visionbib.com/bibliography/other1023.html#TT372991"}

@article{bb378899,
        AUTHOR = "Zhang, W. J. and Xia, Z. H. and Ma, B. and Yan, D.",
        TITLE = "Paradoxical Role of Adversarial Attacks: Enabling Crosslinguistic
Attacks and Information Hiding in Multilingual Speech Recognition",
        JOURNAL = SPLetters,
        VOLUME = "32",
        YEAR = "2025",
        PAGES = "1046--1050",
        BIBSOURCE = "http://www.visionbib.com/bibliography/other1023.html#TT372992"}
Last update: May 24, 2026 at 14:46:09