@comment{
  Entries bb335400 through bb335499, one field per line.
  Venue names such as PR, PAMI, PRL, VISP, SPLetters, SPMag, ICPR16 or
  CIARP08 are bare string macros that are not defined in this section; they
  are presumably declared elsewhere in the database -- TODO confirm.
  MONTH uses the standard three-letter month macros (jan ... dec).
  A leading "I:" or "II:" in PAGES looks like a proceedings volume prefix and
  is kept as found -- TODO confirm.
  CHECKNOTE is a non-standard field, ignored by styles, that flags data needing
  manual verification against the publisher record.
}

@inproceedings{bb335400,
  AUTHOR    = "Li, C. and Zhu, L. and Xu, S. and Gao, P. and Xu, B.",
  TITLE     = "Recurrent Neural Network Based Small-footprint Wake-up-word Speech Recognition System with a Score Calibration Method",
  BOOKTITLE = ICPR18,
  YEAR      = "2018",
  PAGES     = "3222--3227",
  BIBSOURCE = "http://www.visionbib.com/bibliography/other1024snn1.html#TT329698"
}

@inproceedings{bb335401,
  AUTHOR    = "Li, C. and Zhu, L. and Xu, S. and Gao, P. and Xu, B.",
  TITLE     = "Compression of Acoustic Model via Knowledge Distillation and Pruning",
  BOOKTITLE = ICPR18,
  YEAR      = "2018",
  PAGES     = "2785--2790",
  BIBSOURCE = "http://www.visionbib.com/bibliography/other1024snn1.html#TT329699"
}

@inproceedings{bb335402,
  AUTHOR    = "Zhang, S. and Liu, W. and Qin, Y.",
  TITLE     = "Wake-up-word spotting using end-to-end deep neural network system",
  BOOKTITLE = ICPR16,
  YEAR      = "2016",
  PAGES     = "2878--2883",
  BIBSOURCE = "http://www.visionbib.com/bibliography/other1024snn1.html#TT329700"
}

@inproceedings{bb335403,
  AUTHOR    = "Zhang, S.L. and Qin, Y.",
  TITLE     = "Rapid feature space {MLLR} speaker adaptation for deep neural network acoustic modeling",
  BOOKTITLE = ICPR16,
  YEAR      = "2016",
  PAGES     = "2889--2894",
  BIBSOURCE = "http://www.visionbib.com/bibliography/other1024snn1.html#TT329701"
}

@inproceedings{bb335404,
  AUTHOR    = "Zheng, H. and Cai, W. and Zhou, T.Y. and Zhang, S.L. and Li, M.",
  TITLE     = "Text-independent voice conversion using deep neural network based phonetic level features",
  BOOKTITLE = ICPR16,
  YEAR      = "2016",
  PAGES     = "2872--2877",
  BIBSOURCE = "http://www.visionbib.com/bibliography/other1024snn1.html#TT329702"
}

@inproceedings{bb335405,
  AUTHOR    = "Zhang, B. and Gan, Y.Q. and Song, Y. and Tang, B.L.",
  TITLE     = "Application of pronunciation knowledge on phoneme recognition by {LSTM} neural network",
  BOOKTITLE = ICPR16,
  YEAR      = "2016",
  PAGES     = "2906--2911",
  BIBSOURCE = "http://www.visionbib.com/bibliography/other1024snn1.html#TT329703"
}

@inproceedings{bb335406,
  AUTHOR    = "Garcia, F. and Sanchis, E. and Hurtado, L.F. and Segarra, E.",
  TITLE     = "Adaptive Training for Robust Spoken Language Understanding",
  BOOKTITLE = CIARP15,
  YEAR      = "2015",
  PAGES     = "519--526",
  BIBSOURCE = "http://www.visionbib.com/bibliography/other1024snn1.html#TT329704"
}

@inproceedings{bb335407,
  AUTHOR    = "Pastor, J. and Hurtado, L.F. and Segarra, E. and Sanchis, E.",
  TITLE     = "Language Modelization and Categorization for Voice-Activated {QA}",
  BOOKTITLE = CIARP11,
  YEAR      = "2011",
  PAGES     = "475--482",
  BIBSOURCE = "http://www.visionbib.com/bibliography/other1024snn1.html#TT329705"
}

@inproceedings{bb335408,
  AUTHOR    = "Garcia, F. and Hurtado, L.F. and Sanchis, E. and Segarra, E.",
  TITLE     = "An Active Learning Approach for Statistical Spoken Language Understanding",
  BOOKTITLE = CIARP11,
  YEAR      = "2011",
  PAGES     = "565--572",
  BIBSOURCE = "http://www.visionbib.com/bibliography/other1024snn1.html#TT329706"
}

@inproceedings{bb335409,
  AUTHOR    = "Hurtado, L.F. and Griol, D. and Sanchis, E. and Segarra, E.",
  TITLE     = "A Statistical User Simulation Technique for the Improvement of a Spoken Dialog System",
  BOOKTITLE = CIARP07,
  YEAR      = "2007",
  PAGES     = "743--752",
  BIBSOURCE = "http://www.visionbib.com/bibliography/other1024snn1.html#TT329707"
}

@inproceedings{bb335410,
  AUTHOR    = "Griol, D. and Hurtado, L.F. and Segarra, E. and Sanchis, E.",
  TITLE     = "A Dialog Management Methodology Based on Neural Networks and Its Application to Different Domains",
  BOOKTITLE = CIARP08,
  YEAR      = "2008",
  PAGES     = "643--650",
  BIBSOURCE = "http://www.visionbib.com/bibliography/other1024snn1.html#TT329708"
}

@inproceedings{bb335411,
  AUTHOR    = "He, H.Y. and Wen, C.Y.",
  TITLE     = "{ART2}-based multiple {MLPs} neural network for speaker-independent recognition of isolated words",
  BOOKTITLE = ICPR92,
  YEAR      = "1992",
  PAGES     = "II:590--593",
  BIBSOURCE = "http://www.visionbib.com/bibliography/other1024snn1.html#TT329709"
}

@article{bb335412,
  AUTHOR    = "de Mori, R. and Laface, P. and Makhonine, V.A. and Mezzalama, M.",
  TITLE     = "A syntactic procedure for the recognition of glottal pulses in continuous speech",
  JOURNAL   = PR,
  VOLUME    = "9",
  YEAR      = "1977",
  NUMBER    = "4",
  PAGES     = "181--189",
  BIBSOURCE = "http://www.visionbib.com/bibliography/other1024sa1.html#TT329710"
}

@article{bb335413,
  AUTHOR    = "de Mori, R. and Giordano, G.",
  TITLE     = "Algorithms for syllabic hypothesization in continuous speech",
  JOURNAL   = PR,
  VOLUME    = "14",
  YEAR      = "1981",
  NUMBER    = "1-6",
  PAGES     = "245--260",
  BIBSOURCE = "http://www.visionbib.com/bibliography/other1024sa1.html#TT329711"
}

@article{bb335414,
  AUTHOR    = "Pal, S.K. and Datta, A.K. and Majumder, D.D.",
  TITLE     = "A self-supervised vowel recognition system",
  JOURNAL   = PR,
  VOLUME    = "12",
  YEAR      = "1980",
  NUMBER    = "1",
  PAGES     = "27--34",
  BIBSOURCE = "http://www.visionbib.com/bibliography/other1024sa1.html#TT329712"
}

@article{bb335415,
  AUTHOR    = "Pathak, A. and Pal, S.K.",
  TITLE     = "On the convergence of '{A} self-supervised vowel recognition system'",
  JOURNAL   = PR,
  VOLUME    = "20",
  YEAR      = "1987",
  NUMBER    = "2",
  PAGES     = "237--244",
  BIBSOURCE = "http://www.visionbib.com/bibliography/other1024sa1.html#TT329713"
}

@article{bb335416,
  AUTHOR    = "Howard, J.H.",
  TITLE     = "Feature selection in human auditory perception",
  JOURNAL   = PR,
  VOLUME    = "15",
  YEAR      = "1982",
  NUMBER    = "5",
  PAGES     = "397--403",
  BIBSOURCE = "http://www.visionbib.com/bibliography/other1024sa1.html#TT329714"
}

@article{bb335417,
  AUTHOR    = "Thomason, M.G. and Granum, E. and Blake, R.E.",
  TITLE     = "Experiments in dynamic programming inference of {Markov} networks with strings representing speech data",
  JOURNAL   = PR,
  VOLUME    = "19",
  YEAR      = "1986",
  NUMBER    = "5",
  PAGES     = "343--352",
  BIBSOURCE = "http://www.visionbib.com/bibliography/other1024sa1.html#TT329715"
}

@article{bb335418,
  AUTHOR    = "Tanaka, E. and Toyama, T. and Kawai, S.",
  TITLE     = "High speed error correction of phoneme sequences",
  JOURNAL   = PR,
  VOLUME    = "19",
  YEAR      = "1986",
  NUMBER    = "5",
  PAGES     = "407--412",
  BIBSOURCE = "http://www.visionbib.com/bibliography/other1024sa1.html#TT329716"
}

@article{bb335419,
  AUTHOR    = "Hochberg, J. and Mniszewski, S.M. and Calleja, T. and Papcun, G.J.",
  TITLE     = "A default hierarchy for pronouncing {English}",
  JOURNAL   = PAMI,
  VOLUME    = "13",
  YEAR      = "1991",
  NUMBER    = "9",
  MONTH     = sep,
  PAGES     = "957--964",
  BIBSOURCE = "http://www.visionbib.com/bibliography/other1024sa1.html#TT329717"
}

@article{bb335420,
  AUTHOR    = "Carlson, B.A. and Clements, M.A.",
  TITLE     = "A computationally compact divergence measure for speech processing",
  JOURNAL   = PAMI,
  VOLUME    = "13",
  YEAR      = "1991",
  NUMBER    = "12",
  MONTH     = dec,
  PAGES     = "1255--1260",
  BIBSOURCE = "http://www.visionbib.com/bibliography/other1024sa1.html#TT329718"
}

@article{bb335421,
  AUTHOR    = "Tacer, B. and Loughlin, P.J.",
  TITLE     = "Non-stationary signal classification using the joint moments of time-frequency distributions",
  JOURNAL   = PR,
  VOLUME    = "31",
  YEAR      = "1998",
  NUMBER    = "11",
  MONTH     = nov,
  PAGES     = "1635--1641",
  BIBSOURCE = "http://www.visionbib.com/bibliography/other1024sa1.html#TT329719"
}

@article{bb335422,
  AUTHOR    = "Li, M. and McAllister, H.G. and Black, N.D. and de Perez, T.A.",
  TITLE     = "Wavelet-based nonlinear {AGC} method for hearing aid loudness compensation",
  JOURNAL   = VISP,
  VOLUME    = "147",
  YEAR      = "2000",
  NUMBER    = "6",
  MONTH     = dec,
  PAGES     = "502--507",
  BIBSOURCE = "http://www.visionbib.com/bibliography/other1024sa1.html#TT329720"
}

@article{bb335423,
  AUTHOR    = "Gray, P. and Hollier, M.P. and Massara, R.E.",
  TITLE     = "Non-intrusive speech-quality assessment using vocal-tract models",
  JOURNAL   = VISP,
  VOLUME    = "147",
  YEAR      = "2000",
  NUMBER    = "6",
  MONTH     = dec,
  PAGES     = "493--501",
  BIBSOURCE = "http://www.visionbib.com/bibliography/other1024sa1.html#TT329721"
}

@article{bb335424,
  AUTHOR    = "Sarkar, S. and Poor, H.V.",
  TITLE     = "Multirate signal processing on finite fields",
  JOURNAL   = VISP,
  VOLUME    = "148",
  YEAR      = "2001",
  NUMBER    = "4",
  MONTH     = aug,
  PAGES     = "254--262",
  BIBSOURCE = "http://www.visionbib.com/bibliography/other1024sa1.html#TT329722"
}

@article{bb335425,
  AUTHOR    = "Mumolo, E.",
  TITLE     = "Spectral domain texture analysis for speech enhancement",
  JOURNAL   = PR,
  VOLUME    = "35",
  YEAR      = "2002",
  NUMBER    = "10",
  MONTH     = oct,
  PAGES     = "2181--2191",
  BIBSOURCE = "http://www.visionbib.com/bibliography/other1024sa1.html#TT329723"
}

@article{bb335426,
  AUTHOR    = "Ding, Z.O. and McLoughlin, I.V. and Tan, E.C.",
  TITLE     = "Extension of proposal of standards for intelligibility tests of {Chinese} speech: {CDRT}-tone",
  JOURNAL   = VISP,
  VOLUME    = "150",
  YEAR      = "2003",
  NUMBER    = "1",
  MONTH     = feb,
  PAGES     = "1--5",
  BIBSOURCE = "http://www.visionbib.com/bibliography/other1024sa1.html#TT329724"
}

@article{bb335427,
  AUTHOR    = "de Lamare, R.C. and Alcaim, A.",
  TITLE     = "Strategies to improve the performance of very low bit rate speech coders and application to a variable rate 1.2 kb/s codec",
  JOURNAL   = VISP,
  VOLUME    = "152",
  YEAR      = "2005",
  NUMBER    = "1",
  MONTH     = feb,
  PAGES     = "74--86",
  BIBSOURCE = "http://www.visionbib.com/bibliography/other1024sa1.html#TT329725"
}

@article{bb335428,
  AUTHOR    = "Vera Candeas, P. and Ruiz Reyes, N. and Rosa Zurera, M. and Lopez Ferreras, F. and Curpian Alonso, J.",
  TITLE     = "New matching pursuit based sinusoidal modelling method for audio coding",
  JOURNAL   = VISP,
  VOLUME    = "151",
  YEAR      = "2004",
  NUMBER    = "1",
  MONTH     = feb,
  PAGES     = "21--28",
  BIBSOURCE = "http://www.visionbib.com/bibliography/other1024sa1.html#TT329726"
}

@inproceedings{bb335429,
  AUTHOR    = "Vera Candeas, P. and Ruiz Reyes, N. and Rosa Zurera, M. and Cuevas Martinez, J.C. and Lopez Ferreras, F.",
  TITLE     = "Adaptive Signal Models for Wide-Band Speech and Audio Compression",
  BOOKTITLE = IbPRIA05,
  YEAR      = "2005",
  PAGES     = "II:571",
  BIBSOURCE = "http://www.visionbib.com/bibliography/other1024sa1.html#TT329727"
}

@article{bb335430,
  AUTHOR    = "Li, C. and Li, S. and Zhang, D. and Chen, G.",
  TITLE     = "Cryptanalysis of a data security protection scheme for {VoIP}",
  JOURNAL   = VISP,
  VOLUME    = "153",
  YEAR      = "2006",
  NUMBER    = "1",
  MONTH     = feb,
  PAGES     = "1--10",
  BIBSOURCE = "http://www.visionbib.com/bibliography/other1024sa1.html#TT329728"
}

@article{bb335431,
  AUTHOR    = "Sandler, M. and Black, D.",
  TITLE     = "Scalable audio coding for compression and loss resilient streaming",
  JOURNAL   = VISP,
  VOLUME    = "153",
  YEAR      = "2006",
  NUMBER    = "3",
  MONTH     = jun,
  PAGES     = "331--339",
  BIBSOURCE = "http://www.visionbib.com/bibliography/other1024sa1.html#TT329729"
}

@article{bb335432,
  AUTHOR    = "Guido, R.C. and Pereira, J.C. and Slaets, J.F.W.",
  TITLE     = "Introduction to the Special Issue: Advances on pattern recognition for speech and audio processing",
  JOURNAL   = PRL,
  VOLUME    = "28",
  YEAR      = "2007",
  NUMBER    = "11",
  MONTH     = aug,
  PAGES     = "1283--1284",
  BIBSOURCE = "http://www.visionbib.com/bibliography/other1024sa1.html#TT329730"
}

@article{bb335433,
  AUTHOR    = "Chang, J.H. and Gazor, S. and Kim, N.S. and Mitra, S.K.",
  TITLE     = "Multiple statistical models for soft decision in noisy speech enhancement",
  JOURNAL   = PR,
  VOLUME    = "40",
  YEAR      = "2007",
  NUMBER    = "3",
  MONTH     = mar,
  PAGES     = "1123--1134",
  BIBSOURCE = "http://www.visionbib.com/bibliography/other1024sa1.html#TT329731"
}

@article{bb335434,
  AUTHOR    = "Frankel, J. and King, S.",
  TITLE     = "Factoring {Gaussian} precision matrices for linear dynamic models",
  JOURNAL   = PRL,
  VOLUME    = "28",
  YEAR      = "2007",
  NUMBER    = "16",
  MONTH     = dec,
  PAGES     = "2264--2272",
  BIBSOURCE = "http://www.visionbib.com/bibliography/other1024sa1.html#TT329732"
}

@article{bb335435,
  AUTHOR    = "Arias Londono, J.D. and Godino Llorente, J.I. and Saenz Lechon, N. and Osma Ruiz, V. and Castellanos Dominguez, C.G.",
  TITLE     = "An improved method for voice pathology detection by means of a {HMM}-based feature space transformation",
  JOURNAL   = PR,
  VOLUME    = "43",
  YEAR      = "2010",
  NUMBER    = "9",
  MONTH     = sep,
  PAGES     = "3100--3112",
  BIBSOURCE = "http://www.visionbib.com/bibliography/other1024sa1.html#TT329733"
}

@article{bb335436,
  AUTHOR    = "Mahdi, A.E. and Picovici, D.",
  TITLE     = "New single-ended objective measure for non-intrusive speech quality evaluation",
  JOURNAL   = SIViP,
  VOLUME    = "4",
  YEAR      = "2010",
  NUMBER    = "1",
  MONTH     = mar,
  CHECKNOTE = "PAGES held the placeholder xx-yy in the source data and was dropped; look up the real page range.",
  BIBSOURCE = "http://www.visionbib.com/bibliography/other1024sa1.html#TT329734"
}

@article{bb335437,
  AUTHOR    = "Guijarrubia, V.G. and Torres, M.I.",
  TITLE     = "Text- and speech-based phonotactic models for spoken language identification of {Basque} and {Spanish}",
  JOURNAL   = PRL,
  VOLUME    = "31",
  YEAR      = "2010",
  NUMBER    = "6",
  MONTH     = apr,
  PAGES     = "523--532",
  BIBSOURCE = "http://www.visionbib.com/bibliography/other1024sa1.html#TT329735"
}

@inproceedings{bb335438,
  AUTHOR    = "Guijarrubia, V.G. and Torres, M.I.",
  TITLE     = "Comparative Study of Several Phonotactic-Based Approaches to {Spanish}-{Basque} Language Identification",
  BOOKTITLE = CIARP08,
  YEAR      = "2008",
  PAGES     = "128--135",
  BIBSOURCE = "http://www.visionbib.com/bibliography/other1024sa1.html#TT329736"
}

@inproceedings{bb335439,
  AUTHOR    = "Guijarrubia, V.G. and Torres, M.I.",
  TITLE     = "Phone-Segments Based Language Identification for {Spanish}, {Basque} and {English}",
  BOOKTITLE = CIARP07,
  YEAR      = "2007",
  PAGES     = "106--114",
  BIBSOURCE = "http://www.visionbib.com/bibliography/other1024sa1.html#TT329737"
}

@inproceedings{bb335440,
  AUTHOR    = "Guijarrubia, V.G. and Torres, M.I.",
  TITLE     = "Language Identification Based on Phone Decoding for {Basque} and {Spanish}",
  BOOKTITLE = IbPRIA07,
  YEAR      = "2007",
  PAGES     = "I:233--240",
  BIBSOURCE = "http://www.visionbib.com/bibliography/other1024sa1.html#TT329738"
}

@article{bb335441,
  AUTHOR    = "Shafiee, S. and Almasganj, F. and Vazirnezhad, B. and Jafari, A.",
  TITLE     = "A two-stage speech activity detection system considering fractal aspects of prosody",
  JOURNAL   = PRL,
  VOLUME    = "31",
  YEAR      = "2010",
  NUMBER    = "9",
  MONTH     = jul,
  PAGES     = "936--948",
  BIBSOURCE = "http://www.visionbib.com/bibliography/other1024sa1.html#TT329739"
}

@article{bb335442,
  AUTHOR    = "Yoon, J.Y. and Park, H.",
  TITLE     = "Improving the Speech Quality of {VoIP} by Packet Prioritization",
  JOURNAL   = SPLetters,
  VOLUME    = "18",
  YEAR      = "2011",
  NUMBER    = "12",
  MONTH     = dec,
  PAGES     = "725--728",
  BIBSOURCE = "http://www.visionbib.com/bibliography/other1024sa1.html#TT329740"
}

@article{bb335443,
  AUTHOR    = "Dennis, J. and Tran, H.D. and Li, H.",
  TITLE     = "Spectrogram Image Feature for Sound Event Classification in Mismatched Conditions",
  JOURNAL   = SPLetters,
  VOLUME    = "18",
  YEAR      = "2011",
  NUMBER    = "2",
  MONTH     = feb,
  PAGES     = "130--133",
  BIBSOURCE = "http://www.visionbib.com/bibliography/other1024sa1.html#TT329741"
}

@article{bb335444,
  AUTHOR    = "Liang, Y. and Liu, X.L. and Lou, Y.H. and Shan, B.S.",
  TITLE     = "An improved noise-robust voice activity detector based on hidden semi-{Markov} models",
  JOURNAL   = PRL,
  VOLUME    = "32",
  YEAR      = "2011",
  NUMBER    = "7",
  MONTH     = may,
  PAGES     = "1044--1053",
  BIBSOURCE = "http://www.visionbib.com/bibliography/other1024sa1.html#TT329742"
}

@inproceedings{bb335445,
  AUTHOR    = "Liu, X.L. and Liang, Y. and Lou, Y.H. and Li, H. and Shan, B.S.",
  TITLE     = "Noise-Robust Voice Activity Detector Based on Hidden Semi-{Markov} Models",
  BOOKTITLE = ICPR10,
  YEAR      = "2010",
  PAGES     = "81--84",
  BIBSOURCE = "http://www.visionbib.com/bibliography/other1024sa1.html#TT329743"
}

@article{bb335446,
  AUTHOR    = "Mohanty, M.N. and Jena, B.",
  TITLE     = "Analysis of stressed human speech",
  JOURNAL   = IJCVR,
  VOLUME    = "2",
  YEAR      = "2011",
  NUMBER    = "2",
  PAGES     = "180--187",
  BIBSOURCE = "http://www.visionbib.com/bibliography/other1024sa1.html#TT329744"
}

@article{bb335447,
  AUTHOR    = "Lopez Moreno, I. and Ramos, D. and Gonzalez Dominguez, J. and Gonzalez Rodriguez, J.",
  TITLE     = "Von {Mises}-{Fisher} Models in the Total Variability Subspace for Language Recognition",
  JOURNAL   = SPLetters,
  VOLUME    = "18",
  YEAR      = "2011",
  NUMBER    = "12",
  MONTH     = dec,
  PAGES     = "705--708",
  BIBSOURCE = "http://www.visionbib.com/bibliography/other1024sa1.html#TT329745"
}

@article{bb335448,
  AUTHOR    = "Jelassi, S. and Rubino, G.",
  TITLE     = "A study of artificial speech quality assessors of {VoIP} calls subject to limited bursty packet losses",
  JOURNAL   = JIVP,
  VOLUME    = "2011",
  YEAR      = "2011",
  NUMBER    = "1",
  CHECKNOTE = "NUMBER was '1 2011' (year repeated) and PAGES held the placeholder xx-yy in the source data; PAGES was dropped. Verify issue and page or article number.",
  BIBSOURCE = "http://www.visionbib.com/bibliography/other1024sa1.html#TT329746"
}

@article{bb335449,
  AUTHOR    = "Ben Aicha, A. and Ben Jebara, S.",
  TITLE     = "Reduction of musical residual noise using perceptual tools with classic speech denoising techniques",
  JOURNAL   = SIViP,
  VOLUME    = "6",
  YEAR      = "2012",
  NUMBER    = "1",
  MONTH     = mar,
  PAGES     = "85--97",
  BIBSOURCE = "http://www.visionbib.com/bibliography/other1024sa1.html#TT329747"
}

@article{bb335450,
  AUTHOR    = "Pulakka, H. and Laaksonen, L. and Myllyla, V. and Yrttiaho, Y. and Alku, P.",
  TITLE     = "Conversational Evaluation of Speech Bandwidth Extension Using a Mobile Handset",
  JOURNAL   = SPLetters,
  VOLUME    = "19",
  YEAR      = "2012",
  NUMBER    = "4",
  MONTH     = apr,
  PAGES     = "203--206",
  BIBSOURCE = "http://www.visionbib.com/bibliography/other1024sa1.html#TT329748"
}

@article{bb335451,
  AUTHOR    = "Liang, S. and Liu, W.J. and Jiang, W.",
  TITLE     = "Integrating Binary Mask Estimation With {MRF} Priors of Cochleagram for Speech Separation",
  JOURNAL   = SPLetters,
  VOLUME    = "19",
  YEAR      = "2012",
  NUMBER    = "10",
  MONTH     = oct,
  PAGES     = "627--630",
  BIBSOURCE = "http://www.visionbib.com/bibliography/other1024sa1.html#TT329749"
}

@article{bb335452,
  AUTHOR    = "Esch, T. and Rungeler, M. and Heese, F. and Vary, P.",
  TITLE     = "Estimation of Rapidly Time-Varying Harmonic Noise for Speech Enhancement",
  JOURNAL   = SPLetters,
  VOLUME    = "19",
  YEAR      = "2012",
  NUMBER    = "10",
  MONTH     = oct,
  PAGES     = "659--662",
  BIBSOURCE = "http://www.visionbib.com/bibliography/other1024sa1.html#TT329750"
}

@article{bb335453,
  AUTHOR    = "Safavi, S. and Hanani, A. and Russell, M. and Jancovic, P. and Carey, M.J.",
  TITLE     = "Contrasting the Effects of Different Frequency Bands on Speaker and Accent Identification",
  JOURNAL   = SPLetters,
  VOLUME    = "19",
  YEAR      = "2012",
  NUMBER    = "12",
  MONTH     = dec,
  PAGES     = "829--832",
  BIBSOURCE = "http://www.visionbib.com/bibliography/other1024sa1.html#TT329751"
}

@article{bb335454,
  AUTHOR    = "Safavi, S. and Khan, U.A.",
  TITLE     = "Revisiting Finite-Time Distributed Algorithms via Successive Nulling of Eigenvalues",
  JOURNAL   = SPLetters,
  VOLUME    = "22",
  YEAR      = "2015",
  NUMBER    = "1",
  MONTH     = jan,
  PAGES     = "54--57",
  BIBSOURCE = "http://www.visionbib.com/bibliography/other1024sa1.html#TT329752"
}

@article{bb335455,
  AUTHOR    = "Wu, Z.Z. and Kinnunen, T. and Chng, E.S. and Li, H.Z.",
  TITLE     = "Mixture of Factor Analyzers Using Priors From Non-Parallel Speech for Voice Conversion",
  JOURNAL   = SPLetters,
  VOLUME    = "19",
  YEAR      = "2012",
  NUMBER    = "12",
  MONTH     = dec,
  PAGES     = "914--917",
  BIBSOURCE = "http://www.visionbib.com/bibliography/other1024sa1.html#TT329753"
}

@article{bb335456,
  AUTHOR    = "Valero, X. and Alias, F.",
  TITLE     = "Gammatone Cepstral Coefficients: Biologically Inspired Features for Non-Speech Audio Classification",
  JOURNAL   = MultMed,
  VOLUME    = "14",
  YEAR      = "2012",
  NUMBER    = "6",
  PAGES     = "1684--1689",
  BIBSOURCE = "http://www.visionbib.com/bibliography/other1024sa1.html#TT329754"
}

@article{bb335457,
  AUTHOR    = "Weninger, F. and Krajewski, J. and Batliner, A. and Schuller, B.",
  TITLE     = "The Voice of Leadership: Models and Performances of Automatic Analysis in Online Speeches",
  JOURNAL   = AffCom,
  VOLUME    = "3",
  YEAR      = "2012",
  NUMBER    = "4",
  PAGES     = "496--508",
  CHECKNOTE = "NUMBER was '4 2012' (year repeated) in the source data; reduced to the issue number.",
  BIBSOURCE = "http://www.visionbib.com/bibliography/other1024sa1.html#TT329755"
}

@article{bb335458,
  AUTHOR    = "Gerkmann, T. and Krawczyk, M.",
  TITLE     = "{MMSE}-Optimal Spectral Amplitude Estimation Given the {STFT}-Phase",
  JOURNAL   = SPLetters,
  VOLUME    = "20",
  YEAR      = "2013",
  NUMBER    = "2",
  MONTH     = feb,
  PAGES     = "129--132",
  BIBSOURCE = "http://www.visionbib.com/bibliography/other1024sa1.html#TT329756"
}

@article{bb335459,
  AUTHOR    = "Kim, H.G. and Jang, G.J. and Park, J.S. and Kim, J.H. and Oh, Y.H.",
  TITLE     = "Particle filtering based pitch sequence correction for monaural speech segregation",
  JOURNAL   = IJIST,
  VOLUME    = "23",
  YEAR      = "2013",
  NUMBER    = "1",
  MONTH     = mar,
  PAGES     = "64--70",
  BIBSOURCE = "http://www.visionbib.com/bibliography/other1024sa1.html#TT329757"
}

@article{bb335460,
  AUTHOR    = "Dessein, A. and Cont, A.",
  TITLE     = "An Information-Geometric Approach to Real-Time Audio Segmentation",
  JOURNAL   = SPLetters,
  VOLUME    = "20",
  YEAR      = "2013",
  NUMBER    = "4",
  MONTH     = apr,
  PAGES     = "331--334",
  BIBSOURCE = "http://www.visionbib.com/bibliography/other1024sa1.html#TT329758"
}

@article{bb335461,
  AUTHOR    = "Drugman, T.",
  TITLE     = "Residual Excitation Skewness for Automatic Speech Polarity Detection",
  JOURNAL   = SPLetters,
  VOLUME    = "20",
  YEAR      = "2013",
  NUMBER    = "4",
  MONTH     = apr,
  PAGES     = "387--390",
  BIBSOURCE = "http://www.visionbib.com/bibliography/other1024sa1.html#TT329759"
}

@article{bb335462,
  AUTHOR    = "Yadav, J. and Rao, K.S.",
  TITLE     = "Detection of Vowel Offset Point From Speech Signal",
  JOURNAL   = SPLetters,
  VOLUME    = "20",
  YEAR      = "2013",
  NUMBER    = "4",
  MONTH     = apr,
  PAGES     = "299--302",
  BIBSOURCE = "http://www.visionbib.com/bibliography/other1024sa1.html#TT329760"
}

@article{bb335463,
  AUTHOR    = "Mohammadiha, N. and Martin, R. and Leijon, A.",
  TITLE     = "Spectral Domain Speech Enhancement Using {HMM} State-Dependent Super-{Gaussian} Priors",
  JOURNAL   = SPLetters,
  VOLUME    = "20",
  YEAR      = "2013",
  NUMBER    = "3",
  MONTH     = mar,
  PAGES     = "253--256",
  BIBSOURCE = "http://www.visionbib.com/bibliography/other1024sa1.html#TT329761"
}

@article{bb335464,
  AUTHOR    = "Taal, C.H. and Jensen, J. and Leijon, A.",
  TITLE     = "On Optimal Linear Filtering of Speech for Near-End Listening Enhancement",
  JOURNAL   = SPLetters,
  VOLUME    = "20",
  YEAR      = "2013",
  NUMBER    = "3",
  MONTH     = mar,
  PAGES     = "225--228",
  BIBSOURCE = "http://www.visionbib.com/bibliography/other1024sa1.html#TT329762"
}

@article{bb335465,
  AUTHOR    = "Teng, P. and Jia, Y.",
  TITLE     = "Voice Activity Detection Via Noise Reducing Using Non-Negative Sparse Coding",
  JOURNAL   = SPLetters,
  VOLUME    = "20",
  YEAR      = "2013",
  NUMBER    = "5",
  MONTH     = may,
  PAGES     = "475--478",
  BIBSOURCE = "http://www.visionbib.com/bibliography/other1024sa1.html#TT329763"
}

@article{bb335466,
  AUTHOR    = "Romoli, L. and Cecchi, S. and Piazza, F.",
  TITLE     = "A Combined Approach for Channel Decorrelation in Stereo Acoustic Echo Cancellation Exploiting Time-Varying Frequency Shifting",
  JOURNAL   = SPLetters,
  VOLUME    = "20",
  YEAR      = "2013",
  NUMBER    = "7",
  PAGES     = "717--720",
  BIBSOURCE = "http://www.visionbib.com/bibliography/other1024sa1.html#TT329764"
}

@article{bb335467,
  AUTHOR    = "Szurley, J. and Bertrand, A. and Moonen, M.",
  TITLE     = "On the Use of Time-Domain Widely Linear Filtering for Binaural Speech Enhancement",
  JOURNAL   = SPLetters,
  VOLUME    = "20",
  YEAR      = "2013",
  NUMBER    = "7",
  PAGES     = "649--652",
  BIBSOURCE = "http://www.visionbib.com/bibliography/other1024sa1.html#TT329765"
}

@article{bb335468,
  AUTHOR    = "Sarria Paja, M. and Falk, T.H.",
  TITLE     = "Whispered Speech Detection in Noise Using Auditory-Inspired Modulation Spectrum Features",
  JOURNAL   = SPLetters,
  VOLUME    = "20",
  YEAR      = "2013",
  NUMBER    = "8",
  PAGES     = "783--786",
  BIBSOURCE = "http://www.visionbib.com/bibliography/other1024sa1.html#TT329766"
}

@article{bb335469,
  AUTHOR    = "Ramirez, M.A.",
  TITLE     = "Intra-Predictive Switched Split Vector Quantization of Speech Spectra",
  JOURNAL   = SPLetters,
  VOLUME    = "20",
  YEAR      = "2013",
  NUMBER    = "8",
  PAGES     = "791--794",
  BIBSOURCE = "http://www.visionbib.com/bibliography/other1024sa1.html#TT329767"
}

@article{bb335470,
  AUTHOR    = "Ying, D. and Yan, Y.",
  TITLE     = "Robust and Fast Localization of Single Speech Source Using a Planar Array",
  JOURNAL   = SPLetters,
  VOLUME    = "20",
  YEAR      = "2013",
  NUMBER    = "9",
  PAGES     = "909--912",
  BIBSOURCE = "http://www.visionbib.com/bibliography/other1024sa1.html#TT329768"
}

@article{bb335471,
  AUTHOR    = "Moller, S. and Heusdens, R.",
  TITLE     = "Objective Estimation of Speech Quality for Communication Systems",
  JOURNAL   = PIEEE,
  VOLUME    = "101",
  YEAR      = "2013",
  NUMBER    = "9",
  PAGES     = "1955--1967",
  BIBSOURCE = "http://www.visionbib.com/bibliography/other1024sa1.html#TT329769"
}

@article{bb335472,
  AUTHOR    = "Mowlaee, P. and Saeidi, R.",
  TITLE     = "Iterative Closed-Loop Phase-Aware Single-Channel Speech Enhancement",
  JOURNAL   = SPLetters,
  VOLUME    = "20",
  YEAR      = "2013",
  NUMBER    = "12",
  PAGES     = "1235--1239",
  BIBSOURCE = "http://www.visionbib.com/bibliography/other1024sa1.html#TT329770"
}

@article{bb335473,
  AUTHOR    = "Kulmer, J. and Mowlaee, P.",
  TITLE     = "Phase Estimation in Single Channel Speech Enhancement Using Phase Decomposition",
  JOURNAL   = SPLetters,
  VOLUME    = "22",
  YEAR      = "2015",
  NUMBER    = "5",
  MONTH     = may,
  PAGES     = "598--602",
  BIBSOURCE = "http://www.visionbib.com/bibliography/other1024sa1.html#TT329771"
}

@article{bb335474,
  AUTHOR    = "Ganapathy, S. and Pelecanos, J.",
  TITLE     = "Enhancing Frequency Shifted Speech Signals in Single Side-Band Communication",
  JOURNAL   = SPLetters,
  VOLUME    = "20",
  YEAR      = "2013",
  NUMBER    = "12",
  PAGES     = "1231--1234",
  BIBSOURCE = "http://www.visionbib.com/bibliography/other1024sa1.html#TT329772"
}

@article{bb335475,
  AUTHOR    = "Traa, J. and Smaragdis, P.",
  TITLE     = "A Wrapped {Kalman} Filter for Azimuthal Speaker Tracking",
  JOURNAL   = SPLetters,
  VOLUME    = "20",
  YEAR      = "2013",
  NUMBER    = "12",
  PAGES     = "1257--1260",
  BIBSOURCE = "http://www.visionbib.com/bibliography/other1024sa1.html#TT329773"
}

@article{bb335476,
  AUTHOR    = "Hu, P.F. and Liu, W.J. and Jiang, W. and Yang, Z.L.",
  TITLE     = "Latent topic model for audio retrieval",
  JOURNAL   = PR,
  VOLUME    = "47",
  YEAR      = "2014",
  NUMBER    = "3",
  PAGES     = "1138--1143",
  BIBSOURCE = "http://www.visionbib.com/bibliography/other1024sa1.html#TT329774"
}

@article{bb335477,
  AUTHOR    = "Drugman, T.",
  TITLE     = "Maximum Phase Modeling for Sparse Linear Prediction of Speech",
  JOURNAL   = SPLetters,
  VOLUME    = "21",
  YEAR      = "2014",
  NUMBER    = "2",
  MONTH     = feb,
  PAGES     = "185--189",
  BIBSOURCE = "http://www.visionbib.com/bibliography/other1024sa1.html#TT329775"
}

@article{bb335478,
  AUTHOR    = "Xu, Y. and Du, J. and Dai, L.R. and Lee, C.H.",
  TITLE     = "An Experimental Study on Speech Enhancement Based on Deep Neural Networks",
  JOURNAL   = SPLetters,
  VOLUME    = "21",
  YEAR      = "2014",
  NUMBER    = "1",
  MONTH     = jan,
  PAGES     = "65--68",
  BIBSOURCE = "http://www.visionbib.com/bibliography/other1024sa1.html#TT329776"
}

@article{bb335479,
  AUTHOR    = "Jin, Y.G. and Shin, J.W. and Kim, N.S.",
  TITLE     = "Spectro-Temporal Filtering for Multichannel Speech Enhancement in Short-Time {Fourier} Transform Domain",
  JOURNAL   = SPLetters,
  VOLUME    = "21",
  YEAR      = "2014",
  NUMBER    = "3",
  MONTH     = mar,
  PAGES     = "352--355",
  BIBSOURCE = "http://www.visionbib.com/bibliography/other1024sa1.html#TT329777"
}

@article{bb335480,
  AUTHOR    = "Kwon, K. and Shin, J.W. and Kim, N.S.",
  TITLE     = "{NMF}-Based Speech Enhancement Using Bases Update",
  JOURNAL   = SPLetters,
  VOLUME    = "22",
  YEAR      = "2015",
  NUMBER    = "4",
  MONTH     = apr,
  PAGES     = "450--454",
  BIBSOURCE = "http://www.visionbib.com/bibliography/other1024sa1.html#TT329778"
}

@article{bb335481,
  AUTHOR    = "Arsikere, H. and Lulich, S.M. and Alwan, A.",
  TITLE     = "Estimating Speaker Height and Subglottal Resonances Using {MFCCs} and {GMMs}",
  JOURNAL   = SPLetters,
  VOLUME    = "21",
  YEAR      = "2014",
  NUMBER    = "2",
  MONTH     = feb,
  PAGES     = "159--162",
  BIBSOURCE = "http://www.visionbib.com/bibliography/other1024sa1.html#TT329779"
}

@article{bb335482,
  AUTHOR    = "He, L. and Zhang, J. and Liu, Q. and Yin, H. and Lech, M.",
  TITLE     = "Automatic Evaluation of Hypernasality and Consonant Misarticulation in Cleft Palate Speech",
  JOURNAL   = SPLetters,
  VOLUME    = "21",
  YEAR      = "2014",
  NUMBER    = "10",
  MONTH     = oct,
  PAGES     = "1298--1301",
  BIBSOURCE = "http://www.visionbib.com/bibliography/other1024sa1.html#TT329780"
}

@article{bb335483,
  AUTHOR    = "Nathwani, K. and Pandit, P. and Hegde, R.M.",
  TITLE     = "Group Delay Based Methods for Speaker Segregation and its Application in Multimedia Information Retrieval",
  JOURNAL   = MultMed,
  VOLUME    = "15",
  YEAR      = "2013",
  NUMBER    = "6",
  PAGES     = "1326--1339",
  BIBSOURCE = "http://www.visionbib.com/bibliography/other1024sa1.html#TT329781"
}

@article{bb335484,
  AUTHOR    = "Xie, D. and Zhang, W.B.",
  TITLE     = "Estimating Speech Spectral Amplitude Based on the {Nakagami} Approximation",
  JOURNAL   = SPLetters,
  VOLUME    = "21",
  YEAR      = "2014",
  NUMBER    = "11",
  MONTH     = nov,
  PAGES     = "1375--1379",
  BIBSOURCE = "http://www.visionbib.com/bibliography/other1024sa1.html#TT329782"
}

@article{bb335485,
  AUTHOR    = "Drugman, T. and Stylianou, Y.",
  TITLE     = "Fast Inter-Harmonic Reconstruction for Spectral Envelope Estimation in High-Pitched Voices",
  JOURNAL   = SPLetters,
  VOLUME    = "21",
  YEAR      = "2014",
  NUMBER    = "11",
  MONTH     = nov,
  PAGES     = "1418--1422",
  BIBSOURCE = "http://www.visionbib.com/bibliography/other1024sa1.html#TT329783"
}

@article{bb335486,
  AUTHOR    = "Drugman, T. and Stylianou, Y. and Kida, Y. and Akamine, M.",
  TITLE     = "Voice Activity Detection: Merging Source and Filter-based Information",
  JOURNAL   = SPLetters,
  VOLUME    = "23",
  YEAR      = "2016",
  NUMBER    = "2",
  MONTH     = feb,
  PAGES     = "252--256",
  BIBSOURCE = "http://www.visionbib.com/bibliography/other1024sa1.html#TT329784"
}

@article{bb335487,
  AUTHOR    = "Zheng, C.S. and Peng, R.H. and Li, J. and Li, X.D.",
  TITLE     = "A Constrained {MMSE} {LP} Residual Estimator for Speech Dereverberation in Noisy Environments",
  JOURNAL   = SPLetters,
  VOLUME    = "21",
  YEAR      = "2014",
  NUMBER    = "12",
  MONTH     = dec,
  PAGES     = "1462--1466",
  BIBSOURCE = "http://www.visionbib.com/bibliography/other1024sa1.html#TT329785"
}

@article{bb335488,
  AUTHOR    = "Sarma, B.D. and Prasanna, S.R.M.",
  TITLE     = "Analysis of Vocal Tract Constrictions using Zero Frequency Filtering",
  JOURNAL   = SPLetters,
  VOLUME    = "21",
  YEAR      = "2014",
  NUMBER    = "12",
  MONTH     = dec,
  PAGES     = "1481--1485",
  BIBSOURCE = "http://www.visionbib.com/bibliography/other1024sa1.html#TT329786"
}

@article{bb335489,
  AUTHOR    = "Kim, M. and Smaragdis, P.",
  TITLE     = "Mixtures of Local Dictionaries for Unsupervised Speech Enhancement",
  JOURNAL   = SPLetters,
  VOLUME    = "22",
  YEAR      = "2015",
  NUMBER    = "3",
  MONTH     = mar,
  PAGES     = "293--297",
  BIBSOURCE = "http://www.visionbib.com/bibliography/other1024sa1.html#TT329787"
}

@article{bb335490,
  AUTHOR    = "Kleijn, W.B. and Hendriks, R.C.",
  TITLE     = "A Simple Model of Speech Communication and its Application to Intelligibility Enhancement",
  JOURNAL   = SPLetters,
  VOLUME    = "22",
  YEAR      = "2015",
  NUMBER    = "3",
  MONTH     = mar,
  PAGES     = "303--307",
  BIBSOURCE = "http://www.visionbib.com/bibliography/other1024sa1.html#TT329788"
}

@article{bb335491,
  AUTHOR    = "Ko, Y.J.",
  TITLE     = "New feature weighting approaches for speech-act classification",
  JOURNAL   = PRL,
  VOLUME    = "51",
  YEAR      = "2015",
  NUMBER    = "1",
  PAGES     = "107--111",
  BIBSOURCE = "http://www.visionbib.com/bibliography/other1024sa1.html#TT329789"
}

@article{bb335492,
  AUTHOR    = "Degottex, G.",
  TITLE     = "A Time Regularization Technique for Discrete Spectral Envelopes Through Frequency Derivative",
  JOURNAL   = SPLetters,
  VOLUME    = "22",
  YEAR      = "2015",
  NUMBER    = "7",
  MONTH     = jul,
  PAGES     = "978--982",
  BIBSOURCE = "http://www.visionbib.com/bibliography/other1024sa1.html#TT329790"
}

@article{bb335493,
  AUTHOR    = "Mysore, G.J.",
  TITLE     = "Can we Automatically Transform Speech Recorded on Common Consumer Devices in Real-World Environments into Professional Production Quality Speech?: A Dataset, Insights, and Challenges",
  JOURNAL   = SPLetters,
  VOLUME    = "22",
  YEAR      = "2015",
  NUMBER    = "8",
  MONTH     = aug,
  PAGES     = "1006--1010",
  BIBSOURCE = "http://www.visionbib.com/bibliography/other1024sa1.html#TT329791"
}

@article{bb335494,
  AUTHOR    = "Doclo, S. and Kellermann, W. and Makino, S. and Nordholm, S.E.",
  TITLE     = "Multichannel Signal Enhancement Algorithms for Assisted Listening Devices: Exploiting spatial diversity using multiple microphones",
  JOURNAL   = SPMag,
  VOLUME    = "32",
  YEAR      = "2015",
  NUMBER    = "2",
  MONTH     = mar,
  PAGES     = "18--30",
  BIBSOURCE = "http://www.visionbib.com/bibliography/other1024sa1.html#TT329792"
}

@article{bb335495,
  AUTHOR    = "Kowalczyk, K. and Thiergart, O. and Taseska, M. and del Galdo, G. and Pulkki, V. and Habets, E.A.P.",
  TITLE     = "Parametric Spatial Sound Processing: A flexible and efficient solution to sound scene acquisition, modification, and reproduction",
  JOURNAL   = SPMag,
  VOLUME    = "32",
  YEAR      = "2015",
  NUMBER    = "2",
  MONTH     = mar,
  PAGES     = "31--42",
  BIBSOURCE = "http://www.visionbib.com/bibliography/other1024sa1.html#TT329793"
}

@article{bb335496,
  AUTHOR    = "Kleijn, W.B. and Crespo, J.B. and Hendriks, R.C. and Petkov, P. and Sauert, B. and Vary, P.",
  TITLE     = "Optimizing Speech Intelligibility in a Noisy Environment: A unified view",
  JOURNAL   = SPMag,
  VOLUME    = "32",
  YEAR      = "2015",
  NUMBER    = "2",
  MONTH     = mar,
  PAGES     = "43--54",
  BIBSOURCE = "http://www.visionbib.com/bibliography/other1024sa1.html#TT329794"
}

@article{bb335497,
  AUTHOR    = "Gerkmann, T. and Krawczyk Becker, M. and Le Roux, J.",
  TITLE     = "Phase Processing for Single-Channel Speech Enhancement: History and recent advances",
  JOURNAL   = SPMag,
  VOLUME    = "32",
  YEAR      = "2015",
  NUMBER    = "2",
  MONTH     = mar,
  PAGES     = "55--66",
  BIBSOURCE = "http://www.visionbib.com/bibliography/other1024sa1.html#TT329795"
}

@article{bb335498,
  AUTHOR    = "Wouters, J. and McDermott, H.J. and Francart, T.",
  TITLE     = "Sound Coding in Cochlear Implants: From electric pulses to hearing",
  JOURNAL   = SPMag,
  VOLUME    = "32",
  YEAR      = "2015",
  NUMBER    = "2",
  MONTH     = mar,
  PAGES     = "67--80",
  BIBSOURCE = "http://www.visionbib.com/bibliography/other1024sa1.html#TT329796"
}

@article{bb335499,
  AUTHOR    = "Betlehem, T. and Zhang, W. and Poletti, M.A. and Abhayapala, T.D.",
  TITLE     = "Personal Sound Zones: Delivering interface-free audio to multiple listeners",
  JOURNAL   = SPMag,
  VOLUME    = "32",
  YEAR      = "2015",
  NUMBER    = "2",
  MONTH     = mar,
  PAGES     = "81--91",
  BIBSOURCE = "http://www.visionbib.com/bibliography/other1024sa1.html#TT329797"
}