@article{bb379300,
  author    = {Chee, K.Y. and Jin, Z. and Cai, D. and Li, M. and Yap, W.S. and Lai, Y.L. and Goi, B.M.},
  title     = {Cancellable speech template via random binary orthogonal matrices projection hashing},
  journal   = PR,
  volume    = {76},
  year      = {2018},
  number    = {1},
  pages     = {273-287},
  bibsource = {http://www.visionbib.com/bibliography/other1024sa1.html#TT373393}
}
@article{bb379301,
  author    = {Bernardini, A. and Antonacci, F. and Sarti, A.},
  title     = {Wave Digital Implementation of Robust First-Order Differential Microphone Arrays},
  journal   = SPLetters,
  volume    = {25},
  year      = {2018},
  number    = {2},
  month     = {February},
  pages     = {253-257},
  bibsource = {http://www.visionbib.com/bibliography/other1024sa1.html#TT373394}
}
@article{bb379302,
  author    = {Liu, Q. and Wang, W. and de Campos, T.E. and Jackson, P.J.B. and Hilton, A.},
  title     = {Multiple Speaker Tracking in Spatial Audio via PHD Filtering and Depth-Audio Fusion},
  journal   = MultMed,
  volume    = {20},
  year      = {2018},
  number    = {7},
  month     = {July},
  pages     = {1767-1780},
  bibsource = {http://www.visionbib.com/bibliography/other1024sa1.html#TT373395}
}
@article{bb379303,
  author    = {Lu, R. and Duan, Z. and Zhang, C.},
  title     = {Listen and Look: Audio-Visual Matching Assisted Speech Source Separation},
  journal   = SPLetters,
  volume    = {25},
  year      = {2018},
  number    = {9},
  month     = {September},
  pages     = {1315-1319},
  bibsource = {http://www.visionbib.com/bibliography/other1024sa1.html#TT373396}
}
@article{bb379304,
  author    = {Wu, K.B. and Zhang, D. and Lu, G.M. and Guo, Z.H.},
  title     = {Joint learning for voice based disease detection},
  journal   = PR,
  volume    = {87},
  year      = {2019},
  pages     = {130-139},
  bibsource = {http://www.visionbib.com/bibliography/other1024sa1.html#TT373397}
}
@article{bb379305,
  author    = {Kumar, R.K. and Birla, L. and Rao, K.S.},
  title     = {A robust unsupervised pattern discovery and clustering of speech signals},
  journal   = PRL,
  volume    = {116},
  year      = {2018},
  pages     = {254-261},
  bibsource = {http://www.visionbib.com/bibliography/other1024sa1.html#TT373398}
}
@inproceedings{bb379306,
  author    = {Gong, C. and Yi, X.W. and Zhao, X.F.},
  title     = {Pitch Delay Based Adaptive Steganography for AMR Speech Stream},
  booktitle = IWDW18,
  year      = {2018},
  pages     = {275-289},
  bibsource = {http://www.visionbib.com/bibliography/other1024sa1.html#TT373399}
}
@article{bb379307,
  author    = {Skovranek, T. and Despotovic, V. and Peric, Z.},
  title     = {Optimal Fractional Linear Prediction With Restricted Memory},
  journal   = SPLetters,
  volume    = {26},
  year      = {2019},
  number    = {5},
  month     = {May},
  pages     = {760-764},
  bibsource = {http://www.visionbib.com/bibliography/other1024sa1.html#TT373400}
}
@article{bb379308,
  author    = {Zhang, J. and Koutrouvelis, A.I. and Heusdens, R. and Hendriks, R.C.},
  title     = {Distributed Rate-Constrained LCMV Beamforming},
  journal   = SPLetters,
  volume    = {26},
  year      = {2019},
  number    = {5},
  month     = {May},
  pages     = {675-679},
  bibsource = {http://www.visionbib.com/bibliography/other1024sa1.html#TT373401}
}
@article{bb379309,
  author    = {Keerthana, Y.M. and Reddy, M.K. and Rao, K.S.},
  title     = {CWT-Based Approach for Epoch Extraction From Telephone Quality Speech},
  journal   = SPLetters,
  volume    = {26},
  year      = {2019},
  number    = {8},
  month     = {August},
  pages     = {1107-1111},
  bibsource = {http://www.visionbib.com/bibliography/other1024sa1.html#TT373402}
}
@article{bb379310,
  author    = {Gurugubelli, K. and Vuppala, A.K.},
  title     = {Stable Implementation of Zero Frequency Filtering of Speech Signals for Efficient Epoch Extraction},
  journal   = SPLetters,
  volume    = {26},
  year      = {2019},
  number    = {9},
  month     = {September},
  pages     = {1310-1314},
  bibsource = {http://www.visionbib.com/bibliography/other1024sa1.html#TT373403}
}
@article{bb379311,
  author    = {Deb, S. and Dandapat, S.},
  title     = {Emotion Classification Using Segmentation of Vowel-Like and Non-Vowel-Like Regions},
  journal   = AffCom,
  volume    = {10},
  year      = {2019},
  number    = {3},
  month     = {July},
  pages     = {360-373},
  bibsource = {http://www.visionbib.com/bibliography/other1024sa1.html#TT373404}
}
@article{bb379312,
  author    = {Kotropoulos, C.L.},
  title     = {Source phone identification using sketches of features},
  journal   = IET-Bio,
  volume    = {3},
  year      = {2014},
  number    = {2},
  month     = {June},
  pages     = {75-83},
  bibsource = {http://www.visionbib.com/bibliography/other1024sa1.html#TT373405}
}
@article{bb379313,
  author    = {Rajan, V. and Brutti, A. and Cavallaro, A.},
  title     = {ConflictNET: End-to-End Learning for Speech-Based Conflict Intensity Estimation},
  journal   = SPLetters,
  volume    = {26},
  year      = {2019},
  number    = {11},
  month     = {November},
  pages     = {1668-1672},
  bibsource = {http://www.visionbib.com/bibliography/other1024sa1.html#TT373406}
}
@article{bb379314,
  author    = {Lotfian, R. and Busso, C.},
  title     = {Building Naturalistic Emotionally Balanced Speech Corpus by Retrieving Emotional Speech from Existing Podcast Recordings},
  journal   = AffCom,
  volume    = {10},
  year      = {2019},
  number    = {4},
  month     = {October},
  pages     = {471-483},
  bibsource = {http://www.visionbib.com/bibliography/other1024sa1.html#TT373407}
}
@article{bb379315,
  author    = {Lee, Y. and Min, J. and Han, D.K. and Ko, H.},
  title     = {Spectro-Temporal Attention-Based Voice Activity Detection},
  journal   = SPLetters,
  volume    = {27},
  year      = {2020},
  pages     = {131-135},
  bibsource = {http://www.visionbib.com/bibliography/other1024sa1.html#TT373408}
}
@article{bb379316,
  author    = {Lim, H. and Kim, Y. and Goo, J. and Kim, H.},
  title     = {Interlayer Selective Attention Network for Robust Personalized Wake-Up Word Detection},
  journal   = SPLetters,
  volume    = {27},
  year      = {2020},
  pages     = {126-130},
  bibsource = {http://www.visionbib.com/bibliography/other1024sa1.html#TT373409}
}
@article{bb379317,
  author    = {Yang, H. and Yang, Z. and Bao, Y. and Liu, S. and Huang, Y.},
  title     = {Fast Steganalysis Method for VoIP Streams},
  journal   = SPLetters,
  volume    = {27},
  year      = {2020},
  pages     = {286-290},
  bibsource = {http://www.visionbib.com/bibliography/other1024sa1.html#TT373410}
}
@inproceedings{bb379318,
  author    = {Zhang, L.W. and Shi, Z.Q. and Han, J.Q. and Shi, A. and Ma, D.},
  title     = {Furcanext: End-to-end Monaural Speech Separation with Dynamic Gated Dilated Temporal Convolutional Networks},
  booktitle = MMMod20,
  year      = {2020},
  pages     = {I:653-665},
  bibsource = {http://www.visionbib.com/bibliography/other1024sa1.html#TT373411}
}
@article{bb379319,
  author    = {Lin, X. and Zhu, J. and Chen, D.},
  title     = {Subband Aware CNN for Cell-Phone Recognition},
  journal   = SPLetters,
  volume    = {27},
  year      = {2020},
  pages     = {605-609},
  bibsource = {http://www.visionbib.com/bibliography/other1024sa1.html#TT373412}
}
@article{bb379320,
  author    = {Tagliasacchi, M. and Gfeller, B. and Quitry, F.d.C. and Roblek, D.},
  title     = {Pre-Training Audio Representations With Self-Supervision},
  journal   = SPLetters,
  volume    = {27},
  year      = {2020},
  pages     = {600-604},
  bibsource = {http://www.visionbib.com/bibliography/other1024sa1.html#TT373413}
}
@article{bb379321,
  author    = {Yatabe, K.},
  title     = {Consistent ICA: Determined BSS Meets Spectrogram Consistency},
  journal   = SPLetters,
  volume    = {27},
  year      = {2020},
  pages     = {870-874},
  bibsource = {http://www.visionbib.com/bibliography/other1024sa1.html#TT373414}
}
@article{bb379322,
  author    = {Muralishankar, R. and Ghosh, D. and Gurugopinath, S.},
  title     = {A Novel Modified Mel-DCT Filter Bank Structure With Application to Voice Activity Detection},
  journal   = SPLetters,
  volume    = {27},
  year      = {2020},
  pages     = {1240-1244},
  bibsource = {http://www.visionbib.com/bibliography/other1024sa1.html#TT373415}
}
@article{bb379323,
  author    = {Jiang, F. and Duan, Z.},
  title     = {Speaker Attractor Network: Generalizing Speech Separation to Unseen Numbers of Sources},
  journal   = SPLetters,
  volume    = {27},
  year      = {2020},
  pages     = {1859-1863},
  bibsource = {http://www.visionbib.com/bibliography/other1024sa1.html#TT373416}
}
@article{bb379324,
  author    = {Kim, J. and Lee, Y. and Kim, E.},
  title     = {Accelerating RNN Transducer Inference via Adaptive Expansion Search},
  journal   = SPLetters,
  volume    = {27},
  year      = {2020},
  pages     = {2019-2023},
  bibsource = {http://www.visionbib.com/bibliography/other1024sa1.html#TT373417}
}
@article{bb379325,
  author    = {Janbakhshi, P. and Kodrasi, I. and Bourlard, H.},
  title     = {Subspace-Based Learning for Automatic Dysarthric Speech Detection},
  journal   = SPLetters,
  volume    = {28},
  year      = {2021},
  pages     = {96-100},
  bibsource = {http://www.visionbib.com/bibliography/other1024sa1.html#TT373418}
}
@article{bb379326,
  author    = {Gimeno, P. and Mingote, V. and Ortega, A. and Miguel, A. and Lleida, E.},
  title     = {Generalizing AUC Optimization to Multiclass Classification for Audio Segmentation With Limited Training Data},
  journal   = SPLetters,
  volume    = {28},
  year      = {2021},
  pages     = {1135-1139},
  bibsource = {http://www.visionbib.com/bibliography/other1024sa1.html#TT373419}
}
@article{bb379327,
  author    = {Queiroz, A. and Coelho, R.},
  title     = {F0-Based Gammatone Filtering for Intelligibility Gain of Acoustic Noisy Signals},
  journal   = SPLetters,
  volume    = {28},
  year      = {2021},
  pages     = {1225-1229},
  bibsource = {http://www.visionbib.com/bibliography/other1024sa1.html#TT373420}
}
% bb379328: the exported record carried the placeholder page range "xx-yy",
% which a style would print verbatim. The pages field is omitted until the
% real locator is confirmed. NOTE(review): this journal appears to identify
% papers by article number rather than page range; verify with the publisher.
@article{bb379328,
  author    = {Vrbik, D. and Labus, V.},
  title     = {Crowdsourcing of Popular Toponyms: How to Collect and Preserve Toponyms in Spoken Use},
  journal   = IJGI,
  volume    = {10},
  year      = {2021},
  number    = {5},
  bibsource = {http://www.visionbib.com/bibliography/other1024sa1.html#TT373421}
}
@article{bb379329,
  author    = {Ikeshita, R. and Kinoshita, K. and Kamo, N. and Nakatani, T.},
  title     = {Online Speech Dereverberation Using Mixture of Multichannel Linear Prediction Models},
  journal   = SPLetters,
  volume    = {28},
  year      = {2021},
  pages     = {1580-1584},
  bibsource = {http://www.visionbib.com/bibliography/other1024sa1.html#TT373422}
}
@article{bb379330,
  author    = {Jiang, Y.C. and Leung, F.H.F.},
  title     = {Vector-Based Feature Representations for Speech Signals: From Supervector to Latent Vector},
  journal   = MultMed,
  volume    = {23},
  year      = {2021},
  pages     = {2641-2655},
  bibsource = {http://www.visionbib.com/bibliography/other1024sa1.html#TT373423}
}
@article{bb379331,
  author    = {Esmaeilpour, M. and Cardinal, P. and Koerich, A.L.},
  title     = {Cyclic Defense GAN Against Speech Adversarial Attacks},
  journal   = SPLetters,
  volume    = {28},
  year      = {2021},
  pages     = {1769-1773},
  bibsource = {http://www.visionbib.com/bibliography/other1024sa1.html#TT373424}
}
@article{bb379332,
  author    = {Kodrasi, I.},
  title     = {Temporal Envelope and Fine Structure Cues for Dysarthric Speech Detection Using CNNs},
  journal   = SPLetters,
  volume    = {28},
  year      = {2021},
  pages     = {1853-1857},
  bibsource = {http://www.visionbib.com/bibliography/other1024sa1.html#TT373425}
}
@article{bb379333,
  author    = {Ikeshita, R. and Kamo, N. and Nakatani, T.},
  title     = {Blind Signal Dereverberation Based on Mixture of Weighted Prediction Error Models},
  journal   = SPLetters,
  volume    = {28},
  year      = {2021},
  pages     = {399-403},
  bibsource = {http://www.visionbib.com/bibliography/other1024sa1.html#TT373426}
}
@article{bb379334,
  author    = {Liu, Z.T. and Rehman, A. and Wu, M. and Cao, W.H. and Hao, M.},
  title     = {Speech Personality Recognition Based on Annotation Classification Using Log-Likelihood Distance and Extraction of Essential Audio Features},
  journal   = MultMed,
  volume    = {23},
  year      = {2021},
  pages     = {3414-3426},
  bibsource = {http://www.visionbib.com/bibliography/other1024sa1.html#TT373427}
}
@article{bb379335,
  author    = {Kim, H.Y. and Yoon, J.W. and Cho, W.I. and Kim, N.S.},
  title     = {Neurally Optimized Decoder for Low Bitrate Speech Codec},
  journal   = SPLetters,
  volume    = {29},
  year      = {2022},
  pages     = {244-248},
  bibsource = {http://www.visionbib.com/bibliography/other1024sa1.html#TT373428}
}
@article{bb379336,
  author    = {Cohen, E. and Kreuk, F. and Keshet, J.},
  title     = {Speech Time-Scale Modification With GANs},
  journal   = SPLetters,
  volume    = {29},
  year      = {2022},
  pages     = {1067-1071},
  bibsource = {http://www.visionbib.com/bibliography/other1024sa1.html#TT373429}
}
@article{bb379337,
  author    = {Choi, J. and Chang, J.H.},
  title     = {Supervised Learning Approach for Explicit Spatial Filtering of Speech},
  journal   = SPLetters,
  volume    = {29},
  year      = {2022},
  pages     = {1412-1416},
  bibsource = {http://www.visionbib.com/bibliography/other1024sa1.html#TT373430}
}
@article{bb379338,
  author    = {Fu, M.J. and Wang, X.M. and Wang, J.},
  title     = {Polynomial-Decomposition-Based LPC for Formant Estimation},
  journal   = SPLetters,
  volume    = {29},
  year      = {2022},
  pages     = {1392-1396},
  bibsource = {http://www.visionbib.com/bibliography/other1024sa1.html#TT373431}
}
@article{bb379339,
  author    = {Kim, M.S. and Kim, H.S.},
  title     = {Attentive Pooling-Based Weighted Sum of Spectral Decay Rates for Blind Estimation of Reverberation Time},
  journal   = SPLetters,
  volume    = {29},
  year      = {2022},
  pages     = {1639-1643},
  bibsource = {http://www.visionbib.com/bibliography/other1024sa1.html#TT373432}
}
@article{bb379340,
  author    = {Reddy, M.K. and Keerthana, Y.M. and Alku, P.},
  title     = {End-to-End Pathological Speech Detection Using Wavelet Scattering Network},
  journal   = SPLetters,
  volume    = {29},
  year      = {2022},
  pages     = {1863-1867},
  bibsource = {http://www.visionbib.com/bibliography/other1024sa1.html#TT373433}
}
@article{bb379341,
  author    = {Karamatli, E. and Kirbiz, S.},
  title     = {MixCycle: Unsupervised Speech Separation via Cyclic Mixture Permutation Invariant Training},
  journal   = SPLetters,
  volume    = {29},
  year      = {2022},
  pages     = {2637-2641},
  bibsource = {http://www.visionbib.com/bibliography/other1024sa1.html#TT373434}
}
@article{bb379342,
  author    = {McKinney, A.F. and Cauchi, B.},
  title     = {Non-Intrusive Binaural Speech Intelligibility Prediction From Discrete Latent Representations},
  journal   = SPLetters,
  volume    = {29},
  year      = {2022},
  pages     = {987-991},
  bibsource = {http://www.visionbib.com/bibliography/other1024sa1.html#TT373435}
}
@article{bb379343,
  author    = {de Lacerda Pataca, C. and Costa, P.D.P.},
  title     = {Hidden Bawls, Whispers, and Yelps: Can Text Convey the Sound of Speech, Beyond Words?},
  journal   = AffCom,
  volume    = {14},
  year      = {2023},
  number    = {1},
  month     = {January},
  pages     = {6-16},
  bibsource = {http://www.visionbib.com/bibliography/other1024sa1.html#TT373436}
}
@article{bb379344,
  author    = {Chen, G. and Li, X.G. and Xiao, S.Y. and Zhang, C.H. and Lu, X.H.},
  title     = {RACL: A robust adaptive contrastive learning method for conversational satisfaction prediction},
  journal   = PR,
  volume    = {138},
  year      = {2023},
  pages     = {109386},
  bibsource = {http://www.visionbib.com/bibliography/other1024sa1.html#TT373437}
}
@article{bb379345,
  author    = {Cheng, J.M. and Liang, R. and Zhao, L. and Huang, C.W. and Schuller, B.W.},
  title     = {Speech Denoising and Compensation for Hearing Aids Using an FTCRN-Based Metric GAN},
  journal   = SPLetters,
  volume    = {30},
  year      = {2023},
  pages     = {374-378},
  bibsource = {http://www.visionbib.com/bibliography/other1024sa1.html#TT373438}
}
@article{bb379346,
  author    = {Shu, Y.C. and Luo, H.N. and Zhang, S.L. and Wang, L.B. and Dang, J.W.},
  title     = {A CIF-Based Speech Segmentation Method for Streaming E2E ASR},
  journal   = SPLetters,
  volume    = {30},
  year      = {2023},
  pages     = {344-348},
  bibsource = {http://www.visionbib.com/bibliography/other1024sa1.html#TT373439}
}
@article{bb379347,
  author    = {Zhou, Y. and Wu, Z.Z. and Zhang, M.Y. and Tian, X.H. and Li, H.Z.},
  title     = {TTS-Guided Training for Accent Conversion Without Parallel Data},
  journal   = SPLetters,
  volume    = {30},
  year      = {2023},
  pages     = {533-537},
  bibsource = {http://www.visionbib.com/bibliography/other1024sa1.html#TT373440}
}
@article{bb379348,
  author    = {Koepke, A.S. and Oncescu, A.M. and Henriques, J.F. and Akata, Z. and Albanie, S.},
  title     = {Audio Retrieval With Natural Language Queries: A Benchmark Study},
  journal   = MultMed,
  volume    = {25},
  year      = {2023},
  pages     = {2675-2685},
  bibsource = {http://www.visionbib.com/bibliography/other1024sa1.html#TT373441}
}
@article{bb379349,
  author    = {Park, D. and Yu, Y. and Katabi, D. and Kim, H.K.},
  title     = {Adversarial Continual Learning to Transfer Self-Supervised Speech Representations for Voice Pathology Detection},
  journal   = SPLetters,
  volume    = {30},
  year      = {2023},
  pages     = {932-936},
  bibsource = {http://www.visionbib.com/bibliography/other1024sa1.html#TT373442}
}
@article{bb379350,
  author    = {Kim, H. and Shin, J.W.},
  title     = {On Training Speech Separation Models With Various Numbers of Speakers},
  journal   = SPLetters,
  volume    = {30},
  year      = {2023},
  pages     = {1202-1206},
  bibsource = {http://www.visionbib.com/bibliography/other1024sa1.html#TT373443}
}
@article{bb379351,
  author    = {Joglekar, A. and Hansen, J.H.L.},
  title     = {DeepComboSAD: Spectro-Temporal Correlation Based Speech Activity Detection for Naturalistic Audio Streams},
  journal   = SPLetters,
  volume    = {30},
  year      = {2023},
  pages     = {1472-1476},
  bibsource = {http://www.visionbib.com/bibliography/other1024sa1.html#TT373444}
}
@article{bb379352,
  author    = {Cai, Y.Q. and Li, L. and Abel, A. and Zhu, X.Y. and Wang, D.},
  title     = {Maximum Gaussianality training for deep speaker vector normalization},
  journal   = PR,
  volume    = {145},
  year      = {2024},
  pages     = {109977},
  bibsource = {http://www.visionbib.com/bibliography/other1024sa1.html#TT373445}
}
@article{bb379353,
  author    = {Raman, C. and Prabhu, N.R. and Hung, H.},
  title     = {Perceived Conversation Quality in Spontaneous Interactions},
  journal   = AffCom,
  volume    = {14},
  year      = {2023},
  number    = {4},
  month     = {October},
  pages     = {2901-2912},
  bibsource = {http://www.visionbib.com/bibliography/other1024sa1.html#TT373446}
}
@inproceedings{bb379354,
  author    = {Atito, S. and Awais, M. and Alex, T. and Kittler, J.V.},
  title     = {Group Masked Model Learning for General Audio Representation},
  booktitle = ICIP23,
  year      = {2023},
  pages     = {2600-2604},
  bibsource = {http://www.visionbib.com/bibliography/other1024sa1.html#TT373447}
}
@article{bb379355,
  author    = {Lee, H. and Saeed, A.},
  title     = {Distilled non-semantic speech embeddings with binary neural networks for low-resource devices},
  journal   = PRL,
  volume    = {177},
  year      = {2024},
  pages     = {15-19},
  bibsource = {http://www.visionbib.com/bibliography/other1024sa1.html#TT373448}
}
@article{bb379356,
  author    = {Ye, L.X. and Gao, C.F. and Cheng, G.F. and Luo, L.P. and Zhao, Q.W.},
  title     = {ASQ: An Ultra-Low Bit Rate ASR-Oriented Speech Quantization Method},
  journal   = SPLetters,
  volume    = {31},
  year      = {2024},
  pages     = {221-225},
  bibsource = {http://www.visionbib.com/bibliography/other1024sa1.html#TT373449}
}
@article{bb379357,
  author    = {Li, C.T. and Yang, F. and Yang, J.},
  title     = {Restoration of Bone-Conducted Speech With U-Net-Like Model and Energy Distance Loss},
  journal   = SPLetters,
  volume    = {31},
  year      = {2024},
  pages     = {166-170},
  bibsource = {http://www.visionbib.com/bibliography/other1024sa1.html#TT373450}
}
@article{bb379358,
  author    = {Rababaah, A.R.},
  title     = {Intelligent classification model for holy Quran recitation Maqams},
  journal   = IJCVR,
  volume    = {14},
  year      = {2024},
  number    = {2},
  pages     = {170-190},
  bibsource = {http://www.visionbib.com/bibliography/other1024sa1.html#TT373451}
}
% bb379359: the exported record listed the last author as "Kumar, R.K. .S.I.",
% which has a stray space and dot and looks like an extraction artefact.
% It is normalised below to "Kumar, R.K.S.".
% NOTE(review): confirm the initials against the publisher record.
@article{bb379359,
  author    = {Muraleedharan, K.M. and Kumar, K.T.B. and John, S.I. and Kumar, R.K.S.},
  title     = {Combined Use of Nonlinear Measures for Analyzing Pathological Voices},
  journal   = IJIG,
  volume    = {24},
  year      = {2024},
  number    = {3},
  month     = {May},
  pages     = {2450035},
  bibsource = {http://www.visionbib.com/bibliography/other1024sa1.html#TT373452}
}
@article{bb379360,
  author    = {Wang, Z.Q.},
  title     = {Mixture to Mixture: Leveraging Close-Talk Mixtures as Weak-Supervision for Speech Separation},
  journal   = SPLetters,
  volume    = {31},
  year      = {2024},
  pages     = {1715-1719},
  bibsource = {http://www.visionbib.com/bibliography/other1024sa1.html#TT373453}
}
@article{bb379361,
  author    = {Zhang, C. and Jiang, S.},
  title     = {Detection of QIM-Based Steganography in VoIP Streams: A MobileViT-Inspired Model},
  journal   = SPLetters,
  volume    = {31},
  year      = {2024},
  pages     = {1735-1739},
  bibsource = {http://www.visionbib.com/bibliography/other1024sa1.html#TT373454}
}
@article{bb379362,
  author    = {Wang, Z.C. and Chen, Y.Z. and Wang, X.S. and Xie, L. and Wang, Y.P.},
  title     = {StreamVoice+: Evolving Into End-to-End Streaming Zero-Shot Voice Conversion},
  journal   = SPLetters,
  volume    = {31},
  year      = {2024},
  pages     = {3000-3004},
  bibsource = {http://www.visionbib.com/bibliography/other1024sa1.html#TT373455}
}
@article{bb379363,
  author    = {Guo, N. and Edler, B.},
  title     = {Frequency Domain Prediction of Tonal Signals With Time-Varying Pitches},
  journal   = SPLetters,
  volume    = {32},
  year      = {2025},
  pages     = {31-35},
  bibsource = {http://www.visionbib.com/bibliography/other1024sa1.html#TT373456}
}
@article{bb379364,
  author    = {Lopez Espejo, I. and Rosello, E. and Edraki, A. and Harte, N. and Jensen, J.},
  title     = {Noise-Robust Hearing Aid Voice Control},
  journal   = SPLetters,
  volume    = {32},
  year      = {2025},
  pages     = {241-245},
  bibsource = {http://www.visionbib.com/bibliography/other1024sa1.html#TT373457}
}
@article{bb379365,
  author    = {Xie, H. and Khorrami, K. and Rasanen, O. and Virtanen, T.},
  title     = {Text-Based Audio Retrieval by Learning From Similarities Between Audio Captions},
  journal   = SPLetters,
  volume    = {32},
  year      = {2025},
  pages     = {221-225},
  bibsource = {http://www.visionbib.com/bibliography/other1024sa1.html#TT373458}
}
@article{bb379366,
  author    = {Yuan, C.S. and Chen, Y.F. and Zhou, Z. and Xia, Z.H. and Huang, Y.F.},
  title     = {Compressed Domain Invariant Adversarial Representation Learning for Robust Audio Deepfake Detection},
  journal   = SPLetters,
  volume    = {32},
  year      = {2025},
  pages     = {1111-1115},
  bibsource = {http://www.visionbib.com/bibliography/other1024sa1.html#TT373459}
}
@article{bb379367,
  author    = {Unoki, M. and Li, K. and Chaiwongyen, A. and Nguyen, Q.H. and Zaman, K.},
  title     = {Deepfake Speech Detection: Approaches from Acoustic Features to Deep Neural Networks},
  journal   = IEICE,
  volume    = {E108-D},
  year      = {2025},
  number    = {4},
  month     = {April},
  pages     = {300-310},
  bibsource = {http://www.visionbib.com/bibliography/other1024sa1.html#TT373460}
}
@article{bb379368,
  author    = {Shin, U.H. and Ku, B.H. and Park, H.M.},
  title     = {TF-CorrNet: Leveraging Spatial Correlation for Continuous Speech Separation},
  journal   = SPLetters,
  volume    = {32},
  year      = {2025},
  pages     = {1875-1879},
  bibsource = {http://www.visionbib.com/bibliography/other1024sa1.html#TT373461}
}
@article{bb379369,
  author    = {Ta, B.T. and Le, N.M. and Binh, H.T.T. and Do, V.H.},
  title     = {Exploring Non-Matching Multiple References for Speech Quality Assessment},
  journal   = SPLetters,
  volume    = {32},
  year      = {2025},
  pages     = {1610-1614},
  bibsource = {http://www.visionbib.com/bibliography/other1024sa1.html#TT373462}
}
@article{bb379370,
  author    = {Jin, L.B. and Min, D. and Yu, C. and Shin, J.E. and Kim, E.Y.},
  title     = {Detecting Hearing Impairment Through Localizing Abnormal Speech Patterns},
  journal   = SPLetters,
  volume    = {32},
  year      = {2025},
  pages     = {1945-1949},
  bibsource = {http://www.visionbib.com/bibliography/other1024sa1.html#TT373463}
}
@article{bb379371,
  author    = {Liu, D. and Zhang, T.Q. and Wei, Y. and Yi, C. and Christensen, M.G.},
  title     = {Speech Conv-Mamba: Selective Structured State Space Model With Temporal Dilated Convolution for Efficient Speech Separation},
  journal   = SPLetters,
  volume    = {32},
  year      = {2025},
  pages     = {2015-2019},
  bibsource = {http://www.visionbib.com/bibliography/other1024sa1.html#TT373464}
}
@article{bb379372,
  author    = {Liu, F. and Ai, Y. and Ling, Z.H.},
  title     = {Token-Prediction-Based Post-Processing for Low-Bitrate Speech Coding},
  journal   = SPLetters,
  volume    = {32},
  year      = {2025},
  pages     = {3235-3239},
  bibsource = {http://www.visionbib.com/bibliography/other1024sa1.html#TT373465}
}
@article{bb379373,
  author    = {Zhang, Z.X. and Xu, W.X. and Dong, Z. and Wang, K.L. and Wu, Y.M. and Peng, J. and Wang, R. and Huang, D.Y.},
  title     = {ParaLBench: A Large-Scale Benchmark for Computational Paralinguistics Over Acoustic Foundation Models},
  journal   = AffCom,
  volume    = {16},
  year      = {2025},
  number    = {3},
  month     = {July},
  pages     = {1290-1306},
  bibsource = {http://www.visionbib.com/bibliography/other1024sa1.html#TT373466}
}
@article{bb379374,
  author    = {Yang, Y. and Zhou, C.},
  title     = {DPARNet-RSE: Toward Angular Region-Customizable Speech Extraction},
  journal   = SPLetters,
  volume    = {32},
  year      = {2025},
  pages     = {3779-3783},
  bibsource = {http://www.visionbib.com/bibliography/other1024sa1.html#TT373467}
}
@article{bb379375,
  author    = {Zhao, Z.Y. and Peng, Y. and Camilleri, K. and Kong, W.Z. and Cichocki, A.},
  title     = {Imagined Speech Decoding by Learning Consensus Graph From RKHS-Based Multi-View EEG Features},
  journal   = SPLetters,
  volume    = {32},
  year      = {2025},
  pages     = {3944-3948},
  bibsource = {http://www.visionbib.com/bibliography/other1024sa1.html#TT373468}
}
@article{bb379376,
  author    = {Tan, Z.W. and Reju, V.G. and Tewari, R.C. and Ding, R.T. and Khong, A.W.H.},
  title     = {Joint Enhancement and Bandwidth Extension for Radar Through-Barrier Speech Acquisition},
  journal   = SPLetters,
  volume    = {33},
  year      = {2026},
  pages     = {176-180},
  bibsource = {http://www.visionbib.com/bibliography/other1024sa1.html#TT373469}
}
@article{bb379377,
  author    = {Fu, R. and Tang, L. and Tian, H. and Chang, C.C.},
  title     = {Fuzzy-Clustering-Based Domain Adaptation for Speech Steganalysis in Dynamic Scenarios},
  journal   = SPLetters,
  volume    = {33},
  year      = {2026},
  pages     = {366-370},
  bibsource = {http://www.visionbib.com/bibliography/other1024sa1.html#TT373470}
}
@article{bb379378,
  author    = {Wang, T. and Yi, J.Y. and Fu, R. and Qiang, C.Y. and Chong, D. and Wang, C. and Dai, D.Y. and Wen, Z.Q. and Tao, J.H.},
  title     = {SpeechPalette: A Comprehensive Speech Editing Method for Text-Based Speech Editing, One-Shot TTS and Attributes Editing},
  journal   = PAMI,
  volume    = {48},
  year      = {2026},
  number    = {3},
  month     = {March},
  pages     = {2596-2609},
  bibsource = {http://www.visionbib.com/bibliography/other1024sa1.html#TT373471}
}
@article{bb379379,
  author    = {Hu, H.Q. and Liao, Y. and Cai, S.Q. and Li, H.Z.},
  title     = {The effect of speech representations on EEG-based auditory attention detection},
  journal   = PRL,
  volume    = {203},
  year      = {2026},
  pages     = {146-151},
  bibsource = {http://www.visionbib.com/bibliography/other1024sa1.html#TT373472}
}
@article{bb379380,
  author    = {Kim, D. and Jung, S.K.},
  title     = {Bin-Wise Zone-Based Speech Presence Detection With Metric-Aligned DCF Optimization},
  journal   = SPLetters,
  volume    = {33},
  year      = {2026},
  pages     = {1471-1475},
  bibsource = {http://www.visionbib.com/bibliography/other1024sa1.html#TT373473}
}
@inproceedings{bb379381,
  author    = {Wani, T.M. and Amerini, I.},
  title     = {Deepfakes Audio Detection Leveraging Audio Spectrogram and Convolutional Neural Networks},
  booktitle = CIAP23,
  year      = {2023},
  pages     = {II:156-167},
  bibsource = {http://www.visionbib.com/bibliography/other1024sa1.html#TT373474}
}
@inproceedings{bb379382,
  author    = {Choi, S. and Oh, S. and Yang, J. and Lee, Y. and Kwak, I.Y.},
  title     = {Light-weight Frequency Information Aware Neural Network Architecture for Voice Spoofing Detection},
  booktitle = {ICPR22},
  year      = {2022},
  pages     = {477-483},
  bibsource = {http://www.visionbib.com/bibliography/other1024sa1.html#TT373475}
}
@inproceedings{bb379383,
  author    = {Li, X. and Hu, X. and Chen, X. and Pan, H. and Niu, K.},
  title     = {Deep Speaker Embedding Using Hybrid Network of Multi-Feature Aggregation and Multi-Loss Fusion for TI-SV},
  booktitle = {ICPR22},
  year      = {2022},
  pages     = {506-512},
  bibsource = {http://www.visionbib.com/bibliography/other1024sa1.html#TT373476}
}
@inproceedings{bb379384,
  author    = {Zhang, B. and Sim, T.},
  title     = {Localizing Fake Segments in Speech},
  booktitle = {ICPR22},
  year      = {2022},
  pages     = {3224-3230},
  bibsource = {http://www.visionbib.com/bibliography/other1024sa1.html#TT373477}
}
@inproceedings{bb379385,
  author    = {Teng, Z.W. and Fu, Q. and White, J. and Powell, M.E. and Schmidt, D.C.},
  title     = {ARawNet: A Lightweight Solution for Leveraging Raw Waveforms in Spoof Speech Detection},
  booktitle = {ICPR22},
  year      = {2022},
  pages     = {692-698},
  bibsource = {http://www.visionbib.com/bibliography/other1024sa1.html#TT373478}
}
@inproceedings{bb379386,
  author    = {Stefanov, K. and Adiban, M. and Salvi, G.},
  title     = {Spatial Bias in Vision-Based Voice Activity Detection},
  booktitle = ICPR21,
  year      = {2021},
  pages     = {10433-10440},
  bibsource = {http://www.visionbib.com/bibliography/other1024sa1.html#TT373479}
}
@inproceedings{bb379387,
  author    = {Barros, F. and Conde, A. and Soares, S.C. and Neves, A.J.R. and Silva, S.},
  title     = {Understanding Public Speakers' Performance: First Contributions to Support a Computational Approach},
  booktitle = ICIAR20,
  year      = {2020},
  pages     = {I:343-355},
  bibsource = {http://www.visionbib.com/bibliography/other1024sa1.html#TT373480}
}
@inproceedings{bb379388,
  author    = {Bilkova, Z. and Novozamsky, A. and Dominec, A. and Gresko, S. and Zitova, B. and Paroubkova, M.},
  title     = {Automatic Evaluation of Speech Therapy Exercises Based on Image Data},
  booktitle = ICIAR19,
  year      = {2019},
  pages     = {I:397-404},
  bibsource = {http://www.visionbib.com/bibliography/other1024sa1.html#TT373481}
}
@inproceedings{bb379389,
  author    = {Dai, J.J. and Dixon, S.},
  title     = {Understanding Intonation Trajectories and Patterns of Vocal Notes},
  booktitle = {MMMod19},
  year      = {2019},
  pages     = {II:243-253},
  bibsource = {http://www.visionbib.com/bibliography/other1024sa1.html#TT373482}
}
@inproceedings{bb379390,
  author    = {Zheng, S. and Wang, J. and Xiao, J. and Hsu, W. and Glass, J.},
  title     = {A Noise-Robust Self-Adaptive Multitarget Speaker Detection System},
  booktitle = ICPR18,
  year      = {2018},
  pages     = {1068-1072},
  bibsource = {http://www.visionbib.com/bibliography/other1024sa1.html#TT373483}
}
@inproceedings{bb379391,
  author    = {Athanasopoulos, G. and Hagihara, K. and Cierro, A. and Guerit, R. and Chatelain, J. and Lucas, C. and Macq, B.},
  title     = {3D immersive karaoke for the learning of foreign language pronunciation},
  booktitle = IC3D17,
  year      = {2017},
  pages     = {1-8},
  bibsource = {http://www.visionbib.com/bibliography/other1024sa1.html#TT373484}
}
@inproceedings{bb379392,
  author    = {Serras, M. and Torres, M.I. and del Pozo, A.},
  title     = {Online Learning of Attributed Bi-Automata for Dialogue Management in Spoken Dialogue Systems},
  booktitle = IbPRIA17,
  year      = {2017},
  pages     = {22-31},
  bibsource = {http://www.visionbib.com/bibliography/other1024sa1.html#TT373485}
}
@inproceedings{bb379393,
  author    = {Nagpal, A. and Patil, H.A.},
  title     = {Novel Gammatone Filterbank Based Spectro-Temporal Features for Robust Phoneme Recognition},
  booktitle = PReMI17,
  year      = {2017},
  pages     = {342-350},
  bibsource = {http://www.visionbib.com/bibliography/other1024sa1.html#TT373486}
}
@inproceedings{bb379394,
  author    = {Grachev, A.M. and Ignatov, D.I. and Savchenko, A.V.},
  title     = {Neural Networks Compression for Language Modeling},
  booktitle = PReMI17,
  year      = {2017},
  pages     = {351-357},
  bibsource = {http://www.visionbib.com/bibliography/other1024sa1.html#TT373487}
}
@inproceedings{bb379395,
  author    = {Zhang, L. and Chen, J.X. and Luo, Y. and Fu, J.F. and Ye, Z.F.},
  title     = {Supervised single-channel speech dereverberation and denoising using a two-stage processing},
  booktitle = ICIVC17,
  year      = {2017},
  pages     = {818-822},
  bibsource = {http://www.visionbib.com/bibliography/other1024sa1.html#TT373488}
}
@inproceedings{bb379396,
  author    = {Bedoui, A. and Ben Jebara, S.},
  title     = {On the use of opening phase slopes of the glottal signal to characterize unilateral vocal folds paralysis},
  booktitle = ISIVC16,
  year      = {2016},
  pages     = {41-46},
  bibsource = {http://www.visionbib.com/bibliography/other1024sa1.html#TT373489}
}
@inproceedings{bb379397,
  author    = {Ben Ali, F. and Djaziri Larbi, S.},
  title     = {A very low bit rate codec for wide band speech based on a long-term perceptual harmonic plus noise model},
  booktitle = ISIVC16,
  year      = {2016},
  pages     = {71-76},
  bibsource = {http://www.visionbib.com/bibliography/other1024sa1.html#TT373490}
}
@inproceedings{bb379398,
  author    = {Ferreira, A.},
  title     = {Implantation of voicing on whispered speech using frequency-domain parametric modelling of source and filter information},
  booktitle = ISIVC16,
  year      = {2016},
  pages     = {159-166},
  bibsource = {http://www.visionbib.com/bibliography/other1024sa1.html#TT373491}
}
% bb379399: pages keeps the volume-prefixed form used elsewhere in this file
% (e.g. "II:156-167"); the stray space after "II:" in the exported record
% was removed so the locator is written consistently.
@inproceedings{bb379399,
  author    = {Pozzebon, A. and Biliotti, F. and Calamai, S.},
  title     = {Places Speaking with Their Own Voices. A Case Study from the Gra.fo Archives},
  booktitle = EuroMed16,
  year      = {2016},
  pages     = {II:232-239},
  bibsource = {http://www.visionbib.com/bibliography/other1024sa1.html#TT373492}
}
Last update: May 24, 2026 at 14:46:09