@inproceedings{bb368600,
  author    = {Tanaka, K. and Kojima, H. and Fujimura, N. and Itoh, Y.},
  title     = {Constructing speech processing systems on universal phonetic codes accompanied with reference acoustic models},
  booktitle = ICPR02,
  year      = {2002},
  pages     = {III: 728-731},
  bibsource = {http://www.visionbib.com/bibliography/other1023.html#TT362758},
}
@inproceedings{bb368601,
  author    = {Katz, M. and Meier, H.G. and Dolfing, H. and Klakow, D.},
  title     = {Robustness of linear discriminant analysis in automatic speech recognition},
  booktitle = ICPR02,
  year      = {2002},
  pages     = {III: 371-374},
  bibsource = {http://www.visionbib.com/bibliography/other1023.html#TT362759},
}
@inproceedings{bb368602,
  author    = {Vande Wouwer, G. and Scheunders, P. and van Dyck, D.},
  title     = {Wavelet-{FILVQ} classifier for speech analysis},
  booktitle = ICPR96,
  year      = {1996},
  pages     = {IV: 214-218},
  bibsource = {http://www.visionbib.com/bibliography/other1023.html#TT362760},
}
@inproceedings{bb368603,
  author    = {Uma, S. and Sridhar, V. and Krishna, G.},
  title     = {Time-normalization techniques for speaker-independent isolated word recognition},
  booktitle = ICPR92,
  year      = {1992},
  pages     = {III: 537-540},
  bibsource = {http://www.visionbib.com/bibliography/other1023.html#TT362761},
}
@inproceedings{bb368604,
  author    = {Ishikawa, Y. and Nakajima, K.},
  title     = {A real time connected word recognition system},
  booktitle = ICPR90,
  year      = {1990},
  pages     = {II: 215-217},
  bibsource = {http://www.visionbib.com/bibliography/other1023.html#TT362762},
}
@article{bb368605,
  author    = {Huo, Q.A. and Chan, C.},
  title     = {Contextual vector quantization for speech recognition with discrete hidden {Markov} model},
  journal   = PR,
  volume    = {28},
  year      = {1995},
  number    = {4},
  month     = {April},
  pages     = {513-517},
  bibsource = {http://www.visionbib.com/bibliography/other1024hmm2.html#TT362763},
}
@article{bb368606,
  author    = {Kenny, P. and Lennig, M. and Mermelstein, P.},
  title     = {Speaker adaptation in a large-vocabulary {Gaussian} {HMM} recognizer},
  journal   = PAMI,
  volume    = {12},
  year      = {1990},
  number    = {9},
  month     = {September},
  pages     = {917-920},
  bibsource = {http://www.visionbib.com/bibliography/other1024hmm2.html#TT362764},
}
@article{bb368607,
  author    = {Kwong, S. and He, Q.H. and Man, K.F. and Tang, K.S.},
  title     = {A maximum model distance approach for {HMM}-based speech recognition},
  journal   = PR,
  volume    = {31},
  year      = {1998},
  number    = {3},
  month     = {March},
  pages     = {219-229},
  bibsource = {http://www.visionbib.com/bibliography/other1024hmm2.html#TT362765},
}
@article{bb368608,
  author    = {He, Q.H. and Kwong, S. and Man, K.F. and Tang, K.S.},
  title     = {An improved maximum model distance approach for {HMM}-based speech recognition systems},
  journal   = PR,
  volume    = {33},
  year      = {2000},
  number    = {10},
  month     = {October},
  pages     = {1749-1758},
  bibsource = {http://www.visionbib.com/bibliography/other1024hmm2.html#TT362766},
}
@article{bb368609,
  author    = {Ding, I.J.},
  title     = {Incremental {MLLR} speaker adaptation by fuzzy logic control},
  journal   = PR,
  volume    = {40},
  year      = {2007},
  number    = {11},
  month     = {November},
  pages     = {3110-3119},
  bibsource = {http://www.visionbib.com/bibliography/other1024hmm2.html#TT362767},
}
@article{bb368610,
  author    = {Liu, J.W. and Wang, Z.Y. and Xiao, X.},
  title     = {A hybrid {SVM/DDBHMM} decision fusion modeling for robust continuous digital speech recognition},
  journal   = PRL,
  volume    = {28},
  year      = {2007},
  number    = {8},
  month     = {June},
  pages     = {912-920},
  bibsource = {http://www.visionbib.com/bibliography/other1024hmm2.html#TT362768},
}
@article{bb368611,
  author    = {O'Shaughnessy, D.},
  title     = {Invited paper: Automatic speech recognition: History, methods and challenges},
  journal   = PR,
  volume    = {41},
  year      = {2008},
  number    = {10},
  month     = {October},
  pages     = {2965-2979},
  bibsource = {http://www.visionbib.com/bibliography/other1024hmm2.html#TT362769},
}
@article{bb368612,
  author    = {Zeng, J. and Xie, L. and Liu, Z.Q.},
  title     = {Type-2 fuzzy {Gaussian} mixture models},
  journal   = PR,
  volume    = {41},
  year      = {2008},
  number    = {12},
  month     = {December},
  pages     = {3636-3643},
  bibsource = {http://www.visionbib.com/bibliography/other1024hmm2.html#TT362770},
}
@inproceedings{bb368613,
  author    = {Zeng, J. and Liu, Z.Q.},
  title     = {Type-2 fuzzy hidden {Markov} models to phoneme recognition},
  booktitle = ICPR04,
  year      = {2004},
  pages     = {I: 192-195},
  bibsource = {http://www.visionbib.com/bibliography/other1024hmm2.html#TT362771},
}
@article{bb368614,
  author    = {Milone, D.H. and di Persia, L.E. and Torres, M.E.},
  title     = {Denoising and recognition using hidden {Markov} models with observation distributions modeled by hidden {Markov} trees},
  journal   = PR,
  volume    = {43},
  year      = {2010},
  number    = {4},
  month     = {April},
  pages     = {1577-1589},
  bibsource = {http://www.visionbib.com/bibliography/other1024hmm2.html#TT362772},
}
@article{bb368615,
  author    = {Heracleous, P. and Badin, P. and Bailly, G. and Hagita, N.},
  title     = {A pilot study on augmented speech communication based on Electro-Magnetic Articulography},
  journal   = PRL,
  volume    = {32},
  year      = {2011},
  number    = {8},
  month     = {June},
  pages     = {1119-1125},
  bibsource = {http://www.visionbib.com/bibliography/other1024hmm2.html#TT362773},
}
@article{bb368616,
  author    = {Zamani, B. and Akbari, A. and Nasersharif, B. and Jalalvand, A.},
  title     = {Optimized discriminative transformations for speech features based on minimum classification error},
  journal   = PRL,
  volume    = {32},
  year      = {2011},
  number    = {7},
  month     = {May},
  pages     = {948-955},
  bibsource = {http://www.visionbib.com/bibliography/other1024hmm2.html#TT362774},
}
@article{bb368617,
  author    = {Im, J.H. and Lee, S.Y.},
  title     = {Unified Training of Feature Extractor and {HMM} Classifier for Speech Recognition},
  journal   = SPLetters,
  volume    = {19},
  year      = {2012},
  number    = {2},
  month     = {February},
  pages     = {111-114},
  bibsource = {http://www.visionbib.com/bibliography/other1024hmm2.html#TT362775},
}
@article{bb368618,
  author    = {Lee, L.M. and Jean, F.R.},
  title     = {Adaptation of Hidden {Markov} Models for Recognizing Speech of Reduced Frame Rate},
  journal   = Cyber,
  volume    = {43},
  year      = {2013},
  number    = {6},
  pages     = {2114-2121},
  bibsource = {http://www.visionbib.com/bibliography/other1024hmm2.html#TT362776},
}
@article{bb368619,
  author    = {Cho, J.W. and Park, H.M.},
  title     = {An Efficient {HMM}-Based Feature Enhancement Method With Filter Estimation for Reverberant Speech Recognition},
  journal   = SPLetters,
  volume    = {20},
  year      = {2013},
  number    = {12},
  pages     = {1199-1202},
  bibsource = {http://www.visionbib.com/bibliography/other1024hmm2.html#TT362777},
}
@article{bb368620,
  author    = {Chung, Y.J.},
  title     = {Vector {Taylor} series based model adaptation using noisy speech trained hidden {Markov} models},
  journal   = PRL,
  volume    = {75},
  year      = {2016},
  number    = {1},
  pages     = {36-40},
  bibsource = {http://www.visionbib.com/bibliography/other1024hmm2.html#TT362778},
}
@article{bb368621,
  author    = {Shahnawazuddin, S. and Adiga, N. and Kathania, H.K.},
  title     = {Effect of Prosody Modification on Children's {ASR}},
  journal   = SPLetters,
  volume    = {24},
  year      = {2017},
  number    = {11},
  month     = {November},
  pages     = {1749-1753},
  bibsource = {http://www.visionbib.com/bibliography/other1024hmm2.html#TT362779},
}
@article{bb368622,
  author    = {Baltrusaitis, T. and Ahuja, C. and Morency, L.P.},
  title     = {Multimodal Machine Learning: A Survey and Taxonomy},
  journal   = PAMI,
  volume    = {41},
  year      = {2019},
  number    = {2},
  month     = {February},
  pages     = {423-443},
  bibsource = {http://www.visionbib.com/bibliography/other1024hmm2.html#TT362780},
}
@article{bb368623,
  author    = {Hsiao, R. and Can, D. and Ng, T. and Travadi, R. and Ghoshal, A.},
  title     = {Online Automatic Speech Recognition With {Listen, Attend and Spell} Model},
  journal   = SPLetters,
  volume    = {27},
  year      = {2020},
  pages     = {1889-1893},
  bibsource = {http://www.visionbib.com/bibliography/other1024hmm2.html#TT362781},
}
@article{bb368624,
  author    = {Qiu, J.Y. and Wang, X.C. and Fua, P. and Tao, D.C.},
  title     = {Matching Seqlets: An Unsupervised Approach for Locality Preserving Sequence Matching},
  journal   = PAMI,
  volume    = {43},
  year      = {2021},
  number    = {2},
  month     = {February},
  pages     = {745-752},
  bibsource = {http://www.visionbib.com/bibliography/other1024hmm2.html#TT362782},
}
@article{bb368625,
  author    = {de Souza, D.B. and Bakri, K.J. and de Souza Ferreira, F. and Inacio, J.},
  title     = {Multitaper-Mel Spectrograms for Keyword Spotting},
  journal   = SPLetters,
  volume    = {29},
  year      = {2022},
  pages     = {2028-2032},
  bibsource = {http://www.visionbib.com/bibliography/other1024hmm2.html#TT362783},
}
@inproceedings{bb368626,
  author    = {Ezzine, A. and Satori, H. and Hamidi, M. and Satori, K.},
  title     = {{Moroccan} Dialect Speech Recognition System Based on {CMU} {SphinxTools}},
  booktitle = ISCV20,
  year      = {2020},
  pages     = {1-5},
  bibsource = {http://www.visionbib.com/bibliography/other1024hmm2.html#TT362784},
}
@inproceedings{bb368627,
  author    = {Shahin, M. and Ji, J.X. and Ahmed, B.},
  title     = {One-Class {SVMs} Based Pronunciation Verification Approach},
  booktitle = ICPR18,
  year      = {2018},
  pages     = {2881-2886},
  bibsource = {http://www.visionbib.com/bibliography/other1024hmm2.html#TT362785},
}
@inproceedings{bb368628,
  author    = {Addarrazi, I. and Satori, H. and Satori, K.},
  title     = {Amazigh audiovisual speech recognition system design},
  booktitle = ISCV17,
  year      = {2017},
  pages     = {1-5},
  bibsource = {http://www.visionbib.com/bibliography/other1024hmm2.html#TT362786},
}
@inproceedings{bb368629,
  author    = {Wu, C. and Ng, R.W.M. and Torralba, O.S. and Hain, T.},
  title     = {Analysing acoustic model changes for active learning in automatic speech recognition},
  booktitle = WSSIP17,
  year      = {2017},
  pages     = {1-5},
  bibsource = {http://www.visionbib.com/bibliography/other1024hmm2.html#TT362787},
}
@inproceedings{bb368630,
  author    = {Asadullah and Shaukat, A. and Ali, H. and Akram, U.},
  title     = {Automatic {Urdu} Speech Recognition using Hidden {Markov} Model},
  booktitle = ICIVC16,
  year      = {2016},
  pages     = {135-139},
  bibsource = {http://www.visionbib.com/bibliography/other1024hmm2.html#TT362788},
}
@inproceedings{bb368631,
  author    = {Conka, D. and Viszlay, P. and Juhar, J.},
  title     = {Fuzzy clustering in {HMM}-based triphone classes of {2DLDA} in {Slovak} {LVCSR}},
  booktitle = WSSIP16,
  year      = {2016},
  pages     = {1-4},
  bibsource = {http://www.visionbib.com/bibliography/other1024hmm2.html#TT362789},
}
@inproceedings{bb368632,
  author    = {Kacur, J. and Kozicka, R. and Vargic, R.},
  title     = {Semi-tight covariance matrices implementation in {MASPER} {HMM} training procedure},
  booktitle = WSSIP16,
  year      = {2016},
  pages     = {1-4},
  bibsource = {http://www.visionbib.com/bibliography/other1024hmm2.html#TT362790},
}
@inproceedings{bb368633,
  author    = {Kacur, J. and Trnovsky, T. and Vargic, R.},
  title     = {Discriminative training of {HMM} using {MASPER} procedure},
  booktitle = WSSIP15,
  year      = {2015},
  pages     = {93-96},
  bibsource = {http://www.visionbib.com/bibliography/other1024hmm2.html#TT362791},
}
@inproceedings{bb368634,
  author    = {Perez Maldonado, Y. and Caballero Morales, S.O. and Cruz Ortega, R.O.},
  title     = {{GA} Approaches to {HMM} Optimization for Automatic Speech Recognition},
  booktitle = MCPR12,
  year      = {2012},
  pages     = {313-322},
  bibsource = {http://www.visionbib.com/bibliography/other1024hmm2.html#TT362792},
}
@inproceedings{bb368635,
  author    = {Swietojanski, P. and Wielgat, R. and Zielinski, T.},
  title     = {Automatic Selection of {Pareto}-Optimal Topologies of Hidden {Markov} Models Using Multicriteria Evolutionary Algorithms},
  booktitle = EvoIASP11,
  year      = {2011},
  pages     = {224-233},
  bibsource = {http://www.visionbib.com/bibliography/other1024hmm2.html#TT362793},
}
@inproceedings{bb368636,
  author    = {Ravinder, K.},
  title     = {Comparison of {HMM} and {DTW} for Isolated Word Recognition System of {Punjabi} Language},
  booktitle = CIARP10,
  year      = {2010},
  pages     = {244-252},
  bibsource = {http://www.visionbib.com/bibliography/other1024hmm2.html#TT362794},
}
@inproceedings{bb368637,
  author    = {Duan, Q.S. and Kang, S.Y. and Wu, Z.Y. and Cai, L.H. and Shuang, Z.W. and Qin, Y.},
  title     = {Comparison of Syllable/Phone {HMM} Based {Mandarin} {TTS}},
  booktitle = ICPR10,
  year      = {2010},
  pages     = {4496-4499},
  bibsource = {http://www.visionbib.com/bibliography/other1024hmm2.html#TT362795},
}
@inproceedings{bb368638,
  author    = {Kacur, J. and Rozinaj, G.},
  title     = {Adding Voicing Features into Speech Recognition Based on {HMM} in {Slovak}},
  booktitle = WSSIP09,
  year      = {2009},
  pages     = {1-4},
  bibsource = {http://www.visionbib.com/bibliography/other1024hmm2.html#TT362796},
}
@inproceedings{bb368639,
  author    = {Kruger, S.E. and Schaffoner, M. and Katz, M. and Andelic, E. and Wendemuth, A.},
  title     = {Mixture of Support Vector Machines for {HMM} based Speech Recognition},
  booktitle = ICPR06,
  year      = {2006},
  pages     = {IV: 326-329},
  bibsource = {http://www.visionbib.com/bibliography/other1024hmm2.html#TT362797},
}
@inproceedings{bb368640,
  author    = {Andelic, E. and Schaffoner, M. and Katz, M. and Kruger, S.E.},
  title     = {A Hybrid {HMM}-Based Speech Recognizer Using Kernel-Based Discriminants as Acoustic Models},
  booktitle = ICPR06,
  year      = {2006},
  pages     = {II: 1158-1161},
  bibsource = {http://www.visionbib.com/bibliography/other1024hmm2.html#TT362798},
}
@inproceedings{bb368641,
  author    = {Demirekler, M. and Karahan, F. and Ciloglu, T.},
  title     = {Fusing length and voicing information, and {HMM} decision using a {Bayesian} causal tree against insufficient training data},
  booktitle = ICPR00,
  year      = {2000},
  pages     = {III: 102-105},
  bibsource = {http://www.visionbib.com/bibliography/other1024hmm2.html#TT362799},
}
@inproceedings{bb368642,
  author    = {Steidl, S. and Stemmer, G. and Hacker, C. and Noth, E. and Niemann, H.},
  title     = {Improving Children's Speech Recognition by {HMM} Interpolation with an Adults' Speech Recognizer},
  booktitle = DAGM03,
  year      = {2003},
  pages     = {600-607},
  bibsource = {http://www.visionbib.com/bibliography/other1024hmm2.html#TT362800},
}
@inproceedings{bb368643,
  author    = {Nouza, J.},
  title     = {Feature selection methods for hidden {Markov} model-based speech recognition},
  booktitle = ICPR96,
  year      = {1996},
  pages     = {II: 186-190},
  bibsource = {http://www.visionbib.com/bibliography/other1024hmm2.html#TT362801},
}
@inproceedings{bb368644,
  author    = {Rieck, S. and Schukat Talamazzini, E.G. and Niemann, H.},
  title     = {Speaker adaptation using semi-continuous hidden {Markov} models},
  booktitle = ICPR92,
  year      = {1992},
  pages     = {III: 541-544},
  bibsource = {http://www.visionbib.com/bibliography/other1024hmm2.html#TT362802},
}
@article{bb368645,
  author    = {Wu, J.X. and Chan, C.},
  title     = {Isolated word recognition by neural network models with cross-correlation coefficients for speech dynamics},
  journal   = PAMI,
  volume    = {15},
  year      = {1993},
  number    = {11},
  month     = {November},
  pages     = {1174-1185},
  bibsource = {http://www.visionbib.com/bibliography/other1024snn1.html#TT362803},
}
@article{bb368646,
  author    = {Chen, W.Y. and Liao, Y.F. and Chen, S.H.},
  title     = {Speech recognition with hierarchical recurrent neural networks},
  journal   = PR,
  volume    = {28},
  year      = {1995},
  number    = {6},
  month     = {June},
  pages     = {795-805},
  bibsource = {http://www.visionbib.com/bibliography/other1024snn1.html#TT362804},
}
@article{bb368647,
  author    = {Lee, T. and Ching, P.C. and Chan, L.W.},
  title     = {Isolated word recognition using modular recurrent neural networks},
  journal   = PR,
  volume    = {31},
  year      = {1998},
  number    = {6},
  month     = {June},
  pages     = {751-760},
  bibsource = {http://www.visionbib.com/bibliography/other1024snn1.html#TT362805},
}
@article{bb368648,
  author    = {Stavrakoudis, D.G. and Theocharis, J.B.},
  title     = {Pipelined Recurrent Fuzzy Neural Networks for Nonlinear Adaptive Speech Prediction},
  journal   = SMC-B,
  volume    = {37},
  year      = {2007},
  number    = {5},
  month     = {October},
  pages     = {1305-1320},
  bibsource = {http://www.visionbib.com/bibliography/other1024snn1.html#TT362806},
}
@article{bb368649,
  author    = {Kay, S.},
  title     = {A New Approach to {Fourier} Synthesis With Application to Neural Encoding and Speech Classification},
  journal   = SPLetters,
  volume    = {17},
  year      = {2010},
  number    = {10},
  month     = {October},
  pages     = {855-858},
  bibsource = {http://www.visionbib.com/bibliography/other1024snn1.html#TT362807},
}
@article{bb368650,
  author    = {Kay, S.},
  title     = {A New Proof of the {Neyman-Pearson} Theorem Using the {EEF} and the Vindication of {Sir R. Fisher}},
  journal   = SPLetters,
  volume    = {19},
  year      = {2012},
  number    = {8},
  month     = {August},
  pages     = {451-454},
  bibsource = {http://www.visionbib.com/bibliography/other1024snn1.html#TT362808},
}
@article{bb368651,
  author    = {Scanzio, S. and Cumani, S. and Gemello, R. and Mana, F. and Laface, P.},
  title     = {Parallel implementation of Artificial Neural Network training for speech recognition},
  journal   = PRL,
  volume    = {31},
  year      = {2010},
  number    = {11},
  month     = {August},
  pages     = {1302-1309},
  bibsource = {http://www.visionbib.com/bibliography/other1024snn1.html#TT362809},
}
@article{bb368652,
  author    = {Siniscalchi, S.M. and Yu, D. and Deng, L. and Lee, C.H.},
  title     = {Speech Recognition Using Long-Span Temporal Patterns in a Deep Network Model},
  journal   = SPLetters,
  volume    = {20},
  year      = {2013},
  number    = {3},
  month     = {March},
  pages     = {201-204},
  bibsource = {http://www.visionbib.com/bibliography/other1024snn1.html#TT362810},
}
@article{bb368653,
  author    = {Hutchinson, B. and Deng, L. and Yu, D.},
  title     = {Tensor Deep Stacking Networks},
  journal   = PAMI,
  volume    = {35},
  year      = {2013},
  number    = {8},
  pages     = {1944-1957},
  bibsource = {http://www.visionbib.com/bibliography/other1024snn1.html#TT362811},
}
@article{bb368654,
  author    = {Bengio, Y. and Courville, A. and Vincent, P.},
  title     = {Representation Learning: A Review and New Perspectives},
  journal   = PAMI,
  volume    = {35},
  year      = {2013},
  number    = {8},
  pages     = {1798-1828},
  bibsource = {http://www.visionbib.com/bibliography/other1024snn1.html#TT362812},
}
@article{bb368655,
  author    = {Swietojanski, P. and Ghoshal, A. and Renals, S.},
  title     = {Convolutional Neural Networks for Distant Speech Recognition},
  journal   = SPLetters,
  volume    = {21},
  year      = {2014},
  number    = {9},
  month     = {September},
  pages     = {1120-1124},
  bibsource = {http://www.visionbib.com/bibliography/other1024snn1.html#TT362813},
}
@article{bb368656,
  author    = {Espi, M. and Fujimoto, M. and Nakatani, T.},
  title     = {Acoustic Event Detection in Speech Overlapping Scenarios Based on High-Resolution Spectral Input and Deep Learning},
  journal   = IEICE,
  volume    = {E98-D},
  year      = {2015},
  number    = {10},
  month     = {October},
  pages     = {1799-1807},
  bibsource = {http://www.visionbib.com/bibliography/other1024snn1.html#TT362814},
}
@article{bb368657,
  author    = {Richardson, F. and Reynolds, D. and Dehak, N.},
  title     = {Deep Neural Network Approaches to Speaker and Language Recognition},
  journal   = SPLetters,
  volume    = {22},
  year      = {2015},
  number    = {10},
  month     = {October},
  pages     = {1671-1675},
  bibsource = {http://www.visionbib.com/bibliography/other1024snn1.html#TT362815},
}
@article{bb368658,
  author    = {Trentin, E.},
  title     = {Maximum-likelihood normalization of features increases the robustness of neural-based spoken human-computer interaction},
  journal   = PRL,
  volume    = {66},
  year      = {2015},
  number    = {1},
  pages     = {71-80},
  bibsource = {http://www.visionbib.com/bibliography/other1024snn1.html#TT362816},
}
@article{bb368659,
  author    = {Lee, H.Y. and Cho, J.W. and Kim, M. and Park, H.M.},
  title     = {{DNN}-Based Feature Enhancement Using {DOA}-Constrained {ICA} for Robust Speech Recognition},
  journal   = SPLetters,
  volume    = {23},
  year      = {2016},
  number    = {8},
  month     = {August},
  pages     = {1091-1095},
  bibsource = {http://www.visionbib.com/bibliography/other1024snn1.html#TT362817},
}
@article{bb368660,
  author    = {Sangeetha, J. and Jothilakshmi, S.},
  title     = {Automatic continuous speech recogniser for {Dravidian} languages using the auto associative neural network},
  journal   = IJCVR,
  volume    = {6},
  year      = {2016},
  number    = {1-2},
  pages     = {113-126},
  bibsource = {http://www.visionbib.com/bibliography/other1024snn1.html#TT362818},
}
@article{bb368661,
  author    = {Fredes, J. and Novoa, J. and King, S. and Stern, R.M. and Yoma, N.B.},
  title     = {Locally Normalized Filter Banks Applied to Deep Neural-Network-Based Robust Speech Recognition},
  journal   = SPLetters,
  volume    = {24},
  year      = {2017},
  number    = {4},
  month     = {April},
  pages     = {377-381},
  bibsource = {http://www.visionbib.com/bibliography/other1024snn1.html#TT362819},
}
@article{bb368662,
  author    = {Shahnawazuddin, S. and Sinha, R. and Pradhan, G.},
  title     = {Pitch-Normalized Acoustic Features for Robust Children's Speech Recognition},
  journal   = SPLetters,
  volume    = {24},
  year      = {2017},
  number    = {8},
  month     = {August},
  pages     = {1128-1132},
  bibsource = {http://www.visionbib.com/bibliography/other1024snn1.html#TT362820},
}
@article{bb368663,
  author    = {Gosztolya, G. and Toth, L.},
  title     = {{DNN}-Based Feature Extraction for Conflict Intensity Estimation From Speech},
  journal   = SPLetters,
  volume    = {24},
  year      = {2017},
  number    = {12},
  month     = {December},
  pages     = {1837-1841},
  bibsource = {http://www.visionbib.com/bibliography/other1024snn1.html#TT362821},
}
@inproceedings{bb368664,
  author    = {Gosztolya, G. and Banhalmi, A. and Toth, L.},
  title     = {Using One-Class Classification Techniques in the Anti-phoneme Problem},
  booktitle = IbPRIA09,
  year      = {2009},
  pages     = {433-440},
  bibsource = {http://www.visionbib.com/bibliography/other1024snn1.html#TT362822},
}
@article{bb368665,
  author    = {Kim, M. and Kim, H.},
  title     = {Integrated neural network model for identifying speech acts, predicators, and sentiments of dialogue utterances},
  journal   = PRL,
  volume    = {101},
  year      = {2018},
  number    = {1},
  pages     = {1-5},
  bibsource = {http://www.visionbib.com/bibliography/other1024snn1.html#TT362823},
}
@article{bb368666,
  author    = {Affonso, E.T. and Rosa, R.L. and Rodriguez, D.Z.},
  title     = {Speech Quality Assessment Over Lossy Transmission Channels Using Deep Belief Networks},
  journal   = SPLetters,
  volume    = {25},
  year      = {2018},
  number    = {1},
  month     = {January},
  pages     = {70-74},
  bibsource = {http://www.visionbib.com/bibliography/other1024snn1.html#TT362824},
}
@article{bb368667,
  author    = {Kim, H.G. and Lee, H. and Kim, G. and Oh, S.H. and Lee, S.Y.},
  title     = {Rescoring of {N}-Best Hypotheses Using Top-Down Selective Attention for Automatic Speech Recognition},
  journal   = SPLetters,
  volume    = {25},
  year      = {2018},
  number    = {2},
  month     = {February},
  pages     = {199-203},
  bibsource = {http://www.visionbib.com/bibliography/other1024snn1.html#TT362825},
}
@article{bb368668,
  author    = {Kaushik, L. and Sangwan, A. and Hansen, J.H.L.},
  title     = {Speech Activity Detection in Naturalistic Audio Environments: {Fearless Steps Apollo} Corpus},
  journal   = SPLetters,
  volume    = {25},
  year      = {2018},
  number    = {9},
  month     = {September},
  pages     = {1290-1294},
  bibsource = {http://www.visionbib.com/bibliography/other1024snn1.html#TT362826},
}
@article{bb368669,
  author    = {Heracleous, P. and Even, J. and Sugaya, F. and Hashimoto, M. and Yoneyama, A.},
  title     = {Exploiting alternative acoustic sensors for improved noise robustness in speech communication},
  journal   = PRL,
  volume    = {112},
  year      = {2018},
  pages     = {191-197},
  bibsource = {http://www.visionbib.com/bibliography/other1024snn1.html#TT362827},
}
@article{bb368670,
  author    = {Takahashi, N. and Gygli, M. and Van Gool, L.J.},
  title     = {{AENet}: Learning Deep Audio Features for Video Analysis},
  journal   = MultMed,
  volume    = {20},
  year      = {2018},
  number    = {3},
  month     = {March},
  pages     = {513-524},
  bibsource = {http://www.visionbib.com/bibliography/other1024snn1.html#TT362828},
}
@article{bb368671,
  author    = {Cho, B.J. and Lee, J. and Park, H.},
  title     = {A Beamforming Algorithm Based on Maximum Likelihood of a Complex {Gaussian} Distribution With Time-Varying Variances for Robust Speech Recognition},
  journal   = SPLetters,
  volume    = {26},
  year      = {2019},
  number    = {9},
  month     = {September},
  pages     = {1398-1402},
  bibsource = {http://www.visionbib.com/bibliography/other1024snn1.html#TT362829},
}
@article{bb368672,
  author    = {Gundogdu, B. and Yusuf, B. and Saraclar, M.},
  title     = {Generative {RNNs} for {OOV} Keyword Search},
  journal   = SPLetters,
  volume    = {26},
  year      = {2019},
  number    = {1},
  month     = {January},
  pages     = {124-128},
  bibsource = {http://www.visionbib.com/bibliography/other1024snn1.html#TT362830},
}
@article{bb368673,
  author    = {Seshadri, S. and Rasanen, O.},
  title     = {{SylNet}: An Adaptable End-to-End Syllable Count Estimator for Speech},
  journal   = SPLetters,
  volume    = {26},
  year      = {2019},
  number    = {9},
  month     = {September},
  pages     = {1359-1363},
  bibsource = {http://www.visionbib.com/bibliography/other1024snn1.html#TT362831},
}
@article{bb368674,
  author    = {Last, P. and Engelbrecht, H.A. and Kamper, H.},
  title     = {Unsupervised Feature Learning for Speech Using Correspondence and {Siamese} Networks},
  journal   = SPLetters,
  volume    = {27},
  year      = {2020},
  pages     = {421-425},
  bibsource = {http://www.visionbib.com/bibliography/other1024snn1.html#TT362832},
}
@article{bb368675,
  author    = {John Wesley, R. and Nayeemulla Khan, A. and Shahina, A.},
  title     = {Phoneme classification in reconstructed phase space with convolutional neural networks},
  journal   = PRL,
  volume    = {135},
  year      = {2020},
  pages     = {299-306},
  bibsource = {http://www.visionbib.com/bibliography/other1024snn1.html#TT362833},
}
@article{bb368676,
  author    = {Phan, H. and McLoughlin, I.V. and Pham, L. and Chen, O.Y. and Koch, P. and de Vos, M. and Mertins, A.},
  title     = {Improving {GANs} for Speech Enhancement},
  journal   = SPLetters,
  volume    = {27},
  year      = {2020},
  pages     = {1700-1704},
  bibsource = {http://www.visionbib.com/bibliography/other1024snn1.html#TT362834},
}
@article{bb368677,
  author    = {Wei, W. and Wang, Z. and Mao, X.L. and Zhou, G.Y. and Zhou, P. and Jiang, S.},
  title     = {Position-aware self-attention based neural sequence labeling},
  journal   = PR,
  volume    = {110},
  year      = {2021},
  pages     = {107636},
  bibsource = {http://www.visionbib.com/bibliography/other1024snn1.html#TT362835},
}
@article{bb368678,
  author    = {Gu, R.Z. and Zhang, S.X. and Zou, Y.X. and Yu, D.},
  title     = {Complex Neural Spatial Filter: Enhancing Multi-Channel Target Speech Separation in Complex Domain},
  journal   = SPLetters,
  volume    = {28},
  year      = {2021},
  pages     = {1370-1374},
  bibsource = {http://www.visionbib.com/bibliography/other1024snn1.html#TT362836},
}
@article{bb368679,
  author    = {Li, Y.X. and Wang, W. and Liu, M. and Jiang, Z.J. and He, Q.H.},
  title     = {Speaker Clustering by Co-Optimizing Deep Representation Learning and Cluster Estimation},
  journal   = MultMed,
  volume    = {23},
  year      = {2021},
  pages     = {3377-3387},
  bibsource = {http://www.visionbib.com/bibliography/other1024snn1.html#TT362837},
}
@article{bb368680,
  author    = {Esmaeilpour, M. and Chaalia, N. and Cardinal, P.},
  title     = {{RSD-GAN}: Regularized {Sobolev} Defense {GAN} Against Speech-to-Text Adversarial Attacks},
  journal   = SPLetters,
  volume    = {29},
  year      = {2022},
  pages     = {1998-2002},
  bibsource = {http://www.visionbib.com/bibliography/other1024snn1.html#TT362838},
}
@article{bb368681,
  author    = {Tian, J.C. and Yu, J.W. and Weng, C. and Zou, Y.X. and Yu, D.},
  title     = {Improving {Mandarin} End-to-End Speech Recognition With Word {N}-Gram Language Model},
  journal   = SPLetters,
  volume    = {29},
  year      = {2022},
  pages     = {812-816},
  bibsource = {http://www.visionbib.com/bibliography/other1024snn1.html#TT362839},
}
@article{bb368682,
  author    = {Mai, S.J. and Hu, H.F. and Xing, S.L.},
  title     = {A Unimodal Representation Learning and Recurrent Decomposition Fusion Structure for Utterance-Level Multimodal Embedding Learning},
  journal   = MultMed,
  volume    = {24},
  year      = {2022},
  pages     = {2488-2501},
  bibsource = {http://www.visionbib.com/bibliography/other1024snn1.html#TT362840},
}
@article{bb368683,
  author    = {Yang, R. and Cheng, G.F. and Zhang, P.Y. and Yan, Y.H.},
  title     = {An {E2E-ASR}-Based Iteratively-Trained Timestamp Estimator},
  journal   = SPLetters,
  volume    = {29},
  year      = {2022},
  pages     = {1654-1658},
  bibsource = {http://www.visionbib.com/bibliography/other1024snn1.html#TT362841},
}
@article{bb368684,
  author    = {Muralikrishna, H. and Aroor Dinesh, D.},
  title     = {Spoken language identification in unseen channel conditions using modified within-sample similarity loss},
  journal   = PRL,
  volume    = {158},
  year      = {2022},
  pages     = {16-23},
  bibsource = {http://www.visionbib.com/bibliography/other1024snn1.html#TT362842},
}
@article{bb368685,
  author    = {Nasir, M. and Baucom, B. and Bryan, C. and Narayanan, S. and Georgiou, P.},
  title     = {Modeling Vocal Entrainment in Conversational Speech Using Deep Unsupervised Learning},
  journal   = AffCom,
  volume    = {13},
  year      = {2022},
  number    = {3},
  month     = {July},
  pages     = {1651-1663},
  bibsource = {http://www.visionbib.com/bibliography/other1024snn1.html#TT362843},
}
@article{bb368686,
  author    = {Lian, Z. and Chen, L. and Sun, L. and Liu, B. and Tao, J.H.},
  title     = {{GCNet}: Graph Completion Network for Incomplete Multimodal Learning in Conversation},
  journal   = PAMI,
  volume    = {45},
  year      = {2023},
  number    = {7},
  month     = {July},
  pages     = {8419-8432},
  bibsource = {http://www.visionbib.com/bibliography/other1024snn1.html#TT362844},
}
@article{bb368687,
  author    = {Sun, H.R. and Wang, D. and Li, L. and Chen, C. and Zheng, T.F.},
  title     = {Random Cycle Loss and Its Application to Voice Conversion},
  journal   = PAMI,
  volume    = {45},
  year      = {2023},
  number    = {8},
  month     = {August},
  pages     = {10331-10345},
  bibsource = {http://www.visionbib.com/bibliography/other1024snn1.html#TT362845},
}
@article{bb368688,
  author    = {Li, L. and Wang, A. and Xu, M. and Dong, Y.F. and Li, X.},
  title     = {Abductive natural language inference by interactive model with structural loss},
  journal   = PRL,
  volume    = {177},
  year      = {2024},
  pages     = {82-88},
  bibsource = {http://www.visionbib.com/bibliography/other1024snn1.html#TT362846},
}
@article{bb368689,
  author    = {Wang, Q.Q. and Lee, K.A.},
  title     = {Cosine Scoring With Uncertainty for Neural Speaker Embedding},
  journal   = SPLetters,
  volume    = {31},
  year      = {2024},
  pages     = {845-849},
  bibsource = {http://www.visionbib.com/bibliography/other1024snn1.html#TT362847},
}
@article{bb368690,
  author    = {Singh, S. and Steinmetz, C.J. and Benetos, E. and Phan, H. and Stowell, D.},
  title     = {{ATGNN}: Audio Tagging Graph Neural Network},
  journal   = SPLetters,
  volume    = {31},
  year      = {2024},
  pages     = {825-829},
  bibsource = {http://www.visionbib.com/bibliography/other1024snn1.html#TT362848},
}
@article{bb368691,
  author    = {Wang, S. and Ni, L. and Zhang, Z. and Li, X.X. and Zheng, X. and Liu, J.},
  title     = {Multimodal prediction of student performance: A fusion of signed graph neural networks and large language models},
  journal   = PRL,
  volume    = {181},
  year      = {2024},
  pages     = {1-8},
  bibsource = {http://www.visionbib.com/bibliography/other1024snn1.html#TT362849},
}
@article{bb368692,
  author    = {Song, Y.H. and Guo, L. and Man, M. and Wu, Y.X.},
  title     = {The spiking neural network based on {fMRI} for speech recognition},
  journal   = PR,
  volume    = {155},
  year      = {2024},
  pages     = {110672},
  bibsource = {http://www.visionbib.com/bibliography/other1024snn1.html#TT362850},
}
@article{bb368693,
  author    = {Ma, D. and Yue, X.H. and Ao, J. and Gao, X.X. and Li, H.Z.},
  title     = {Text-Guided {HuBERT}: Self-Supervised Speech Pre-Training via Generative Adversarial Networks},
  journal   = SPLetters,
  volume    = {31},
  year      = {2024},
  pages     = {2055-2059},
  bibsource = {http://www.visionbib.com/bibliography/other1024snn1.html#TT362851},
}
@article{bb368694,
  author    = {Kim, S.S. and Lee, D. and Kang, J.Y. and Jeong, M. and Kim, N.S.},
  title     = {Sampling-Based Pruned Knowledge Distillation for Training Lightweight {RNN-T}},
  journal   = SPLetters,
  volume    = {32},
  year      = {2025},
  pages     = {631-635},
  bibsource = {http://www.visionbib.com/bibliography/other1024snn1.html#TT362852},
}
@inproceedings{bb368695,
  author    = {Burchi, M. and Timofte, R.},
  title     = {Audio-Visual Efficient {Conformer} for Robust Speech Recognition},
  booktitle = WACV23,
  year      = {2023},
  pages     = {2257-2266},
  bibsource = {http://www.visionbib.com/bibliography/other1024snn1.html#TT362853},
}
@inproceedings{bb368696,
  author    = {Aitoulghazi, O. and Jaafari, A. and Mourhir, A.},
  title     = {{DarSpeech}: An Automatic Speech Recognition System for the {Moroccan} Dialect},
  booktitle = ISCV22,
  year      = {2022},
  pages     = {1-6},
  bibsource = {http://www.visionbib.com/bibliography/other1024snn1.html#TT362854},
}
@inproceedings{bb368697,
  author    = {Zhai, M.E. and Dong, L.H. and Qin, Y. and Yu, F.F.},
  title     = {The Research of Chain Model Based on {CNN-TDNNF} in {Yulin} Dialect Speech Recognition},
  booktitle = ICIVC22,
  year      = {2022},
  pages     = {883-888},
  bibsource = {http://www.visionbib.com/bibliography/other1024snn1.html#TT362855},
}
% NOTE(review): booktitle below is a literal string, whereas sibling entries use bare string macros (e.g. ICPR21); confirm whether an ICPR22 macro is defined before switching to it.
@inproceedings{bb368698,
  author    = {Vedvyasan, K. and Nathwani, K. and Hegde, R.M.},
  title     = {Group Delay based Methods for Detection and Recognition of Whispered Speech},
  booktitle = {ICPR22},
  year      = {2022},
  pages     = {499-505},
  bibsource = {http://www.visionbib.com/bibliography/other1024snn1.html#TT362856},
}
@inproceedings{bb368699,
  author    = {Toufa, A.S. and Kotropoulos, C.},
  title     = {Digit Recognition Applied to Reconstructed Audio Signals Using Deep Learning},
  booktitle = ICPR21,
  year      = {2021},
  pages     = {3050-3057},
  bibsource = {http://www.visionbib.com/bibliography/other1024snn1.html#TT362857},
}
Last update: Nov 2, 2025 at 14:03:07