Keith Price Bibliography Bibtex Entry (ANCHOR 368600 URL http://dx.doi.org/10.1109/ICPR.2002.1048079 TYPE CONFERENCE PAGES III: 728-731 YEAR 2002 MONTH NIL BIBSOURCE http://www.visionbib.com/bibliography/other1023.html#TT362758 VOLUME NIL JOURNAL ICPR02 AUTHOR Tanaka, K. and Kojima, H. and Fujimura, N. and Itoh, Y. TITLE Constructing speech processing systems on universal phonetic codes accompanied with reference acoustic models)


@inproceedings{bb368600,
  author    = {Tanaka, K. and Kojima, H. and Fujimura, N. and Itoh, Y.},
  title     = {Constructing speech processing systems on universal phonetic codes
               accompanied with reference acoustic models},
  booktitle = ICPR02,
  year      = {2002},
  pages     = {III: 728--731},
  bibsource = {http://www.visionbib.com/bibliography/other1023.html#TT362758},
}

@inproceedings{bb368601,
  author    = {Katz, M. and Meier, H. G. and Dolfing, H. and Klakow, D.},
  title     = {Robustness of linear discriminant analysis in automatic speech
               recognition},
  booktitle = ICPR02,
  year      = {2002},
  pages     = {III: 371--374},
  bibsource = {http://www.visionbib.com/bibliography/other1023.html#TT362759},
}

@inproceedings{bb368602,
  author    = {Vande Wouwer, G. and Scheunders, P. and van Dyck, D.},
  title     = {Wavelet-{FILVQ} classifier for speech analysis},
  booktitle = ICPR96,
  year      = {1996},
  pages     = {IV: 214--218},
  bibsource = {http://www.visionbib.com/bibliography/other1023.html#TT362760},
}

@inproceedings{bb368603,
  author    = {Uma, S. and Sridhar, V. and Krishna, G.},
  title     = {Time-normalization techniques for speaker-independent isolated word
               recognition},
  booktitle = ICPR92,
  year      = {1992},
  pages     = {III: 537--540},
  bibsource = {http://www.visionbib.com/bibliography/other1023.html#TT362761},
}

@inproceedings{bb368604,
  author    = {Ishikawa, Y. and Nakajima, K.},
  title     = {A real time connected word recognition system},
  booktitle = ICPR90,
  year      = {1990},
  pages     = {II: 215--217},
  bibsource = {http://www.visionbib.com/bibliography/other1023.html#TT362762},
}

@article{bb368605,
  author    = {Huo, Q. A. and Chan, C.},
  title     = {Contextual vector quantization for speech recognition with discrete
               hidden {Markov} model},
  journal   = PR,
  volume    = {28},
  year      = {1995},
  number    = {4},
  month     = apr,
  pages     = {513--517},
  bibsource = {http://www.visionbib.com/bibliography/other1024hmm2.html#TT362763},
}

@article{bb368606,
  author    = {Kenny, P. and Lennig, M. and Mermelstein, P.},
  title     = {Speaker adaptation in a large-vocabulary {Gaussian} {HMM} recognizer},
  journal   = PAMI,
  volume    = {12},
  year      = {1990},
  number    = {9},
  month     = sep,
  pages     = {917--920},
  bibsource = {http://www.visionbib.com/bibliography/other1024hmm2.html#TT362764},
}

@article{bb368607,
  author    = {Kwong, S. and He, Q. H. and Man, K. F. and Tang, K. S.},
  title     = {A maximum model distance approach for {HMM}-based speech recognition},
  journal   = PR,
  volume    = {31},
  year      = {1998},
  number    = {3},
  month     = mar,
  pages     = {219--229},
  bibsource = {http://www.visionbib.com/bibliography/other1024hmm2.html#TT362765},
}

@article{bb368608,
  author    = {He, Q. H. and Kwong, S. and Man, K. F. and Tang, K. S.},
  title     = {An improved maximum model distance approach for {HMM}-based speech
               recognition systems},
  journal   = PR,
  volume    = {33},
  year      = {2000},
  number    = {10},
  month     = oct,
  pages     = {1749--1758},
  bibsource = {http://www.visionbib.com/bibliography/other1024hmm2.html#TT362766},
}

@article{bb368609,
  author    = {Ding, I. J.},
  title     = {Incremental {MLLR} speaker adaptation by fuzzy logic control},
  journal   = PR,
  volume    = {40},
  year      = {2007},
  number    = {11},
  month     = nov,
  pages     = {3110--3119},
  bibsource = {http://www.visionbib.com/bibliography/other1024hmm2.html#TT362767},
}

@article{bb368610,
  author    = {Liu, J. W. and Wang, Z. Y. and Xiao, X.},
  title     = {A hybrid {SVM/DDBHMM} decision fusion modeling for robust continuous
               digital speech recognition},
  journal   = PRL,
  volume    = {28},
  year      = {2007},
  number    = {8},
  month     = jun,
  pages     = {912--920},
  bibsource = {http://www.visionbib.com/bibliography/other1024hmm2.html#TT362768},
}

@article{bb368611,
  author    = {O'Shaughnessy, D.},
  title     = {Invited paper: Automatic speech recognition: History, methods and
               challenges},
  journal   = PR,
  volume    = {41},
  year      = {2008},
  number    = {10},
  month     = oct,
  pages     = {2965--2979},
  bibsource = {http://www.visionbib.com/bibliography/other1024hmm2.html#TT362769},
}

@article{bb368612,
  author    = {Zeng, J. and Xie, L. and Liu, Z. Q.},
  title     = {Type-2 fuzzy {Gaussian} mixture models},
  journal   = PR,
  volume    = {41},
  year      = {2008},
  number    = {12},
  month     = dec,
  pages     = {3636--3643},
  bibsource = {http://www.visionbib.com/bibliography/other1024hmm2.html#TT362770},
}

@inproceedings{bb368613,
  author    = {Zeng, J. and Liu, Z. Q.},
  title     = {Type-2 fuzzy hidden {Markov} models to phoneme recognition},
  booktitle = ICPR04,
  year      = {2004},
  pages     = {I: 192--195},
  bibsource = {http://www.visionbib.com/bibliography/other1024hmm2.html#TT362771},
}

@article{bb368614,
  author    = {Milone, D. H. and di Persia, L. E. and Torres, M. E.},
  title     = {Denoising and recognition using hidden {Markov} models with observation
               distributions modeled by hidden {Markov} trees},
  journal   = PR,
  volume    = {43},
  year      = {2010},
  number    = {4},
  month     = apr,
  pages     = {1577--1589},
  bibsource = {http://www.visionbib.com/bibliography/other1024hmm2.html#TT362772},
}

@article{bb368615,
  author    = {Heracleous, P. and Badin, P. and Bailly, G. and Hagita, N.},
  title     = {A pilot study on augmented speech communication based on
               Electro-Magnetic Articulography},
  journal   = PRL,
  volume    = {32},
  year      = {2011},
  number    = {8},
  month     = jun,
  pages     = {1119--1125},
  bibsource = {http://www.visionbib.com/bibliography/other1024hmm2.html#TT362773},
}

@article{bb368616,
  author    = {Zamani, B. and Akbari, A. and Nasersharif, B. and Jalalvand, A.},
  title     = {Optimized discriminative transformations for speech features based on
               minimum classification error},
  journal   = PRL,
  volume    = {32},
  year      = {2011},
  number    = {7},
  month     = may,
  pages     = {948--955},
  bibsource = {http://www.visionbib.com/bibliography/other1024hmm2.html#TT362774},
}

@article{bb368617,
  author    = {Im, J. H. and Lee, S. Y.},
  title     = {Unified Training of Feature Extractor and {HMM} Classifier for Speech
               Recognition},
  journal   = SPLetters,
  volume    = {19},
  year      = {2012},
  number    = {2},
  month     = feb,
  pages     = {111--114},
  bibsource = {http://www.visionbib.com/bibliography/other1024hmm2.html#TT362775},
}

@article{bb368618,
  author    = {Lee, L. M. and Jean, F. R.},
  title     = {Adaptation of Hidden {Markov} Models for Recognizing Speech of Reduced
               Frame Rate},
  journal   = Cyber,
  volume    = {43},
  year      = {2013},
  number    = {6},
  pages     = {2114--2121},
  bibsource = {http://www.visionbib.com/bibliography/other1024hmm2.html#TT362776},
}

@article{bb368619,
  author    = {Cho, J. W. and Park, H. M.},
  title     = {An Efficient {HMM}-Based Feature Enhancement Method With Filter
               Estimation for Reverberant Speech Recognition},
  journal   = SPLetters,
  volume    = {20},
  year      = {2013},
  number    = {12},
  pages     = {1199--1202},
  bibsource = {http://www.visionbib.com/bibliography/other1024hmm2.html#TT362777},
}

@article{bb368620,
  author    = {Chung, Y. J.},
  title     = {Vector {Taylor} series based model adaptation using noisy speech
               trained hidden {Markov} models},
  journal   = PRL,
  volume    = {75},
  year      = {2016},
  number    = {1},
  pages     = {36--40},
  bibsource = {http://www.visionbib.com/bibliography/other1024hmm2.html#TT362778},
}

@article{bb368621,
  author    = {Shahnawazuddin, S. and Adiga, N. and Kathania, H. K.},
  title     = {Effect of Prosody Modification on Children's {ASR}},
  journal   = SPLetters,
  volume    = {24},
  year      = {2017},
  number    = {11},
  month     = nov,
  pages     = {1749--1753},
  bibsource = {http://www.visionbib.com/bibliography/other1024hmm2.html#TT362779},
}

@article{bb368622,
  author    = {Baltrusaitis, T. and Ahuja, C. and Morency, L. P.},
  title     = {Multimodal Machine Learning: A Survey and Taxonomy},
  journal   = PAMI,
  volume    = {41},
  year      = {2019},
  number    = {2},
  month     = feb,
  pages     = {423--443},
  bibsource = {http://www.visionbib.com/bibliography/other1024hmm2.html#TT362780},
}

@article{bb368623,
  author    = {Hsiao, R. and Can, D. and Ng, T. and Travadi, R. and Ghoshal, A.},
  title     = {Online Automatic Speech Recognition With {Listen, Attend and Spell}
               Model},
  journal   = SPLetters,
  volume    = {27},
  year      = {2020},
  pages     = {1889--1893},
  bibsource = {http://www.visionbib.com/bibliography/other1024hmm2.html#TT362781},
}

@article{bb368624,
  author    = {Qiu, J. Y. and Wang, X. C. and Fua, P. and Tao, D. C.},
  title     = {Matching Seqlets: An Unsupervised Approach for Locality Preserving
               Sequence Matching},
  journal   = PAMI,
  volume    = {43},
  year      = {2021},
  number    = {2},
  month     = feb,
  pages     = {745--752},
  bibsource = {http://www.visionbib.com/bibliography/other1024hmm2.html#TT362782},
}

@article{bb368625,
  author    = {de Souza, D. B. and Bakri, K. J. and de Souza Ferreira, F. and Inacio, J.},
  title     = {Multitaper-Mel Spectrograms for Keyword Spotting},
  journal   = SPLetters,
  volume    = {29},
  year      = {2022},
  pages     = {2028--2032},
  bibsource = {http://www.visionbib.com/bibliography/other1024hmm2.html#TT362783},
}

@inproceedings{bb368626,
  author    = {Ezzine, A. and Satori, H. and Hamidi, M. and Satori, K.},
  title     = {Moroccan Dialect Speech Recognition System Based on {CMU} {SphinxTools}},
  booktitle = ISCV20,
  year      = {2020},
  pages     = {1--5},
  bibsource = {http://www.visionbib.com/bibliography/other1024hmm2.html#TT362784},
}

@inproceedings{bb368627,
  author    = {Shahin, M. and Ji, J. X. and Ahmed, B.},
  title     = {One-Class {SVMs} Based Pronunciation Verification Approach},
  booktitle = ICPR18,
  year      = {2018},
  pages     = {2881--2886},
  bibsource = {http://www.visionbib.com/bibliography/other1024hmm2.html#TT362785},
}

@inproceedings{bb368628,
  author    = {Addarrazi, I. and Satori, H. and Satori, K.},
  title     = {Amazigh audiovisual speech recognition system design},
  booktitle = ISCV17,
  year      = {2017},
  pages     = {1--5},
  bibsource = {http://www.visionbib.com/bibliography/other1024hmm2.html#TT362786},
}

@inproceedings{bb368629,
  author    = {Wu, C. and Ng, R. W. M. and Torralba, O. S. and Hain, T.},
  title     = {Analysing acoustic model changes for active learning in automatic
               speech recognition},
  booktitle = WSSIP17,
  year      = {2017},
  pages     = {1--5},
  bibsource = {http://www.visionbib.com/bibliography/other1024hmm2.html#TT362787},
}

@inproceedings{bb368630,
  author    = {Asadullah and Shaukat, A. and Ali, H. and Akram, U.},
  title     = {Automatic {Urdu} Speech Recognition using Hidden {Markov} Model},
  booktitle = ICIVC16,
  year      = {2016},
  pages     = {135--139},
  bibsource = {http://www.visionbib.com/bibliography/other1024hmm2.html#TT362788},
}

@inproceedings{bb368631,
  author    = {Conka, D. and Viszlay, P. and Juhar, J.},
  title     = {Fuzzy clustering in {HMM}-based triphone classes of {2DLDA} in {Slovak}
               {LVCSR}},
  booktitle = WSSIP16,
  year      = {2016},
  pages     = {1--4},
  bibsource = {http://www.visionbib.com/bibliography/other1024hmm2.html#TT362789},
}

@inproceedings{bb368632,
  author    = {Kacur, J. and Kozicka, R. and Vargic, R.},
  title     = {Semi-tight covariance matrices implementation in {MASPER} {HMM} training
               procedure},
  booktitle = WSSIP16,
  year      = {2016},
  pages     = {1--4},
  bibsource = {http://www.visionbib.com/bibliography/other1024hmm2.html#TT362790},
}

@inproceedings{bb368633,
  author    = {Kacur, J. and Trnovsky, T. and Vargic, R.},
  title     = {Discriminative training of {HMM} using {MASPER} procedure},
  booktitle = WSSIP15,
  year      = {2015},
  pages     = {93--96},
  bibsource = {http://www.visionbib.com/bibliography/other1024hmm2.html#TT362791},
}

@inproceedings{bb368634,
  author    = {Perez Maldonado, Y. and Caballero Morales, S. O. and Cruz Ortega, R. O.},
  title     = {{GA} Approaches to {HMM} Optimization for Automatic Speech Recognition},
  booktitle = MCPR12,
  year      = {2012},
  pages     = {313--322},
  bibsource = {http://www.visionbib.com/bibliography/other1024hmm2.html#TT362792},
}

@inproceedings{bb368635,
  author    = {Swietojanski, P. and Wielgat, R. and Zielinski, T.},
  title     = {Automatic Selection of {Pareto}-Optimal Topologies of Hidden {Markov}
               Models Using Multicriteria Evolutionary Algorithms},
  booktitle = EvoIASP11,
  year      = {2011},
  pages     = {224--233},
  bibsource = {http://www.visionbib.com/bibliography/other1024hmm2.html#TT362793},
}

@inproceedings{bb368636,
  author    = {Ravinder, K.},
  title     = {Comparison of {HMM} and {DTW} for Isolated Word Recognition System of
               {Punjabi} Language},
  booktitle = CIARP10,
  year      = {2010},
  pages     = {244--252},
  bibsource = {http://www.visionbib.com/bibliography/other1024hmm2.html#TT362794},
}

@inproceedings{bb368637,
  author    = {Duan, Q. S. and Kang, S. Y. and Wu, Z. Y. and Cai, L. H. and Shuang, Z. W. and Qin, Y.},
  title     = {Comparison of Syllable/Phone {HMM} Based {Mandarin} {TTS}},
  booktitle = ICPR10,
  year      = {2010},
  pages     = {4496--4499},
  bibsource = {http://www.visionbib.com/bibliography/other1024hmm2.html#TT362795},
}

@inproceedings{bb368638,
  author    = {Kacur, J. and Rozinaj, G.},
  title     = {Adding Voicing Features into Speech Recognition Based on {HMM} in {Slovak}},
  booktitle = WSSIP09,
  year      = {2009},
  pages     = {1--4},
  bibsource = {http://www.visionbib.com/bibliography/other1024hmm2.html#TT362796},
}

@inproceedings{bb368639,
  author    = {Kruger, S. E. and Schaffoner, M. and Katz, M. and Andelic, E. and Wendemuth, A.},
  title     = {Mixture of Support Vector Machines for {HMM} based Speech Recognition},
  booktitle = ICPR06,
  year      = {2006},
  pages     = {IV: 326--329},
  bibsource = {http://www.visionbib.com/bibliography/other1024hmm2.html#TT362797},
}

@inproceedings{bb368640,
  author    = {Andelic, E. and Schaffoner, M. and Katz, M. and Kruger, S. E.},
  title     = {A Hybrid {HMM}-Based Speech Recognizer Using Kernel-Based Discriminants
               as Acoustic Models},
  booktitle = ICPR06,
  year      = {2006},
  pages     = {II: 1158--1161},
  bibsource = {http://www.visionbib.com/bibliography/other1024hmm2.html#TT362798},
}

@inproceedings{bb368641,
  author    = {Demirekler, M. and Karahan, F. and Ciloglu, T.},
  title     = {Fusing length and voicing information, and {HMM} decision using a
               {Bayesian} causal tree against insufficient training data},
  booktitle = ICPR00,
  year      = {2000},
  pages     = {III: 102--105},
  bibsource = {http://www.visionbib.com/bibliography/other1024hmm2.html#TT362799},
}

@inproceedings{bb368642,
  author    = {Steidl, S. and Stemmer, G. and Hacker, C. and Noth, E. and Niemann, H.},
  title     = {Improving Children's Speech Recognition by {HMM} Interpolation with an
               Adults' Speech Recognizer},
  booktitle = DAGM03,
  year      = {2003},
  pages     = {600--607},
  bibsource = {http://www.visionbib.com/bibliography/other1024hmm2.html#TT362800},
}

@inproceedings{bb368643,
  author    = {Nouza, J.},
  title     = {Feature selection methods for hidden {Markov} model-based speech
               recognition},
  booktitle = ICPR96,
  year      = {1996},
  pages     = {II: 186--190},
  bibsource = {http://www.visionbib.com/bibliography/other1024hmm2.html#TT362801},
}

@inproceedings{bb368644,
  author    = {Rieck, S. and Schukat Talamazzini, E. G. and Niemann, H.},
  title     = {Speaker adaptation using semi-continuous hidden {Markov} models},
  booktitle = ICPR92,
  year      = {1992},
  pages     = {III: 541--544},
  bibsource = {http://www.visionbib.com/bibliography/other1024hmm2.html#TT362802},
}

@article{bb368645,
  author    = {Wu, J. X. and Chan, C.},
  title     = {Isolated word recognition by neural network models with
               cross-correlation coefficients for speech dynamics},
  journal   = PAMI,
  volume    = {15},
  year      = {1993},
  number    = {11},
  month     = nov,
  pages     = {1174--1185},
  bibsource = {http://www.visionbib.com/bibliography/other1024snn1.html#TT362803},
}

@article{bb368646,
  author    = {Chen, W. Y. and Liao, Y. F. and Chen, S. H.},
  title     = {Speech recognition with hierarchical recurrent neural networks},
  journal   = PR,
  volume    = {28},
  year      = {1995},
  number    = {6},
  month     = jun,
  pages     = {795--805},
  bibsource = {http://www.visionbib.com/bibliography/other1024snn1.html#TT362804},
}

@article{bb368647,
  author    = {Lee, T. and Ching, P. C. and Chan, L. W.},
  title     = {Isolated word recognition using modular recurrent neural networks},
  journal   = PR,
  volume    = {31},
  year      = {1998},
  number    = {6},
  month     = jun,
  pages     = {751--760},
  bibsource = {http://www.visionbib.com/bibliography/other1024snn1.html#TT362805},
}

@article{bb368648,
  author    = {Stavrakoudis, D. G. and Theocharis, J. B.},
  title     = {Pipelined Recurrent Fuzzy Neural Networks for Nonlinear Adaptive Speech
               Prediction},
  journal   = SMC-B,
  volume    = {37},
  year      = {2007},
  number    = {5},
  month     = oct,
  pages     = {1305--1320},
  bibsource = {http://www.visionbib.com/bibliography/other1024snn1.html#TT362806},
}

@article{bb368649,
  author    = {Kay, S.},
  title     = {A New Approach to {Fourier} Synthesis With Application to Neural Encoding
               and Speech Classification},
  journal   = SPLetters,
  volume    = {17},
  year      = {2010},
  number    = {10},
  month     = oct,
  pages     = {855--858},
  bibsource = {http://www.visionbib.com/bibliography/other1024snn1.html#TT362807},
}

@article{bb368650,
  author    = {Kay, S.},
  title     = {A New Proof of the {Neyman-Pearson} Theorem Using the {EEF} and the
               Vindication of {Sir R. Fisher}},
  journal   = SPLetters,
  volume    = {19},
  year      = {2012},
  number    = {8},
  month     = aug,
  pages     = {451--454},
  bibsource = {http://www.visionbib.com/bibliography/other1024snn1.html#TT362808},
}

@article{bb368651,
  author    = {Scanzio, S. and Cumani, S. and Gemello, R. and Mana, F. and Laface, P.},
  title     = {Parallel implementation of Artificial Neural Network training for
               speech recognition},
  journal   = PRL,
  volume    = {31},
  year      = {2010},
  number    = {11},
  month     = aug,
  pages     = {1302--1309},
  bibsource = {http://www.visionbib.com/bibliography/other1024snn1.html#TT362809},
}

@article{bb368652,
  author    = {Siniscalchi, S. M. and Yu, D. and Deng, L. and Lee, C. H.},
  title     = {Speech Recognition Using Long-Span Temporal Patterns in a Deep Network
               Model},
  journal   = SPLetters,
  volume    = {20},
  year      = {2013},
  number    = {3},
  month     = mar,
  pages     = {201--204},
  bibsource = {http://www.visionbib.com/bibliography/other1024snn1.html#TT362810},
}

@article{bb368653,
  author    = {Hutchinson, B. and Deng, L. and Yu, D.},
  title     = {Tensor Deep Stacking Networks},
  journal   = PAMI,
  volume    = {35},
  year      = {2013},
  number    = {8},
  pages     = {1944--1957},
  bibsource = {http://www.visionbib.com/bibliography/other1024snn1.html#TT362811},
}

@article{bb368654,
  author    = {Bengio, Y. and Courville, A. and Vincent, P.},
  title     = {Representation Learning: A Review and New Perspectives},
  journal   = PAMI,
  volume    = {35},
  year      = {2013},
  number    = {8},
  pages     = {1798--1828},
  bibsource = {http://www.visionbib.com/bibliography/other1024snn1.html#TT362812},
}

@article{bb368655,
  author    = {Swietojanski, P. and Ghoshal, A. and Renals, S.},
  title     = {Convolutional Neural Networks for Distant Speech Recognition},
  journal   = SPLetters,
  volume    = {21},
  year      = {2014},
  number    = {9},
  month     = sep,
  pages     = {1120--1124},
  bibsource = {http://www.visionbib.com/bibliography/other1024snn1.html#TT362813},
}

@article{bb368656,
  author    = {Espi, M. and Fujimoto, M. and Nakatani, T.},
  title     = {Acoustic Event Detection in Speech Overlapping Scenarios Based on
               High-Resolution Spectral Input and Deep Learning},
  journal   = IEICE,
  volume    = {E98-D},
  year      = {2015},
  number    = {10},
  month     = oct,
  pages     = {1799--1807},
  bibsource = {http://www.visionbib.com/bibliography/other1024snn1.html#TT362814},
}

@article{bb368657,
  author    = {Richardson, F. and Reynolds, D. and Dehak, N.},
  title     = {Deep Neural Network Approaches to Speaker and Language Recognition},
  journal   = SPLetters,
  volume    = {22},
  year      = {2015},
  number    = {10},
  month     = oct,
  pages     = {1671--1675},
  bibsource = {http://www.visionbib.com/bibliography/other1024snn1.html#TT362815},
}

@article{bb368658,
  author    = {Trentin, E.},
  title     = {Maximum-likelihood normalization of features increases the robustness
               of neural-based spoken human-computer interaction},
  journal   = PRL,
  volume    = {66},
  year      = {2015},
  number    = {1},
  pages     = {71--80},
  bibsource = {http://www.visionbib.com/bibliography/other1024snn1.html#TT362816},
}

@article{bb368659,
  author    = {Lee, H. Y. and Cho, J. W. and Kim, M. and Park, H. M.},
  title     = {{DNN}-Based Feature Enhancement Using {DOA}-Constrained {ICA} for Robust
               Speech Recognition},
  journal   = SPLetters,
  volume    = {23},
  year      = {2016},
  number    = {8},
  month     = aug,
  pages     = {1091--1095},
  bibsource = {http://www.visionbib.com/bibliography/other1024snn1.html#TT362817},
}

@article{bb368660,
  author    = {Sangeetha, J. and Jothilakshmi, S.},
  title     = {Automatic continuous speech recogniser for {Dravidian} languages using
               the auto associative neural network},
  journal   = IJCVR,
  volume    = {6},
  year      = {2016},
  number    = {1-2},
  pages     = {113--126},
  bibsource = {http://www.visionbib.com/bibliography/other1024snn1.html#TT362818},
}

@article{bb368661,
  author    = {Fredes, J. and Novoa, J. and King, S. and Stern, R. M. and Yoma, N. B.},
  title     = {Locally Normalized Filter Banks Applied to Deep Neural-Network-Based
               Robust Speech Recognition},
  journal   = SPLetters,
  volume    = {24},
  year      = {2017},
  number    = {4},
  month     = apr,
  pages     = {377--381},
  bibsource = {http://www.visionbib.com/bibliography/other1024snn1.html#TT362819},
}

@article{bb368662,
  author    = {Shahnawazuddin, S. and Sinha, R. and Pradhan, G.},
  title     = {Pitch-Normalized Acoustic Features for Robust Children's Speech
               Recognition},
  journal   = SPLetters,
  volume    = {24},
  year      = {2017},
  number    = {8},
  month     = aug,
  pages     = {1128--1132},
  bibsource = {http://www.visionbib.com/bibliography/other1024snn1.html#TT362820},
}

@article{bb368663,
  author    = {Gosztolya, G. and Toth, L.},
  title     = {{DNN}-Based Feature Extraction for Conflict Intensity Estimation From
               Speech},
  journal   = SPLetters,
  volume    = {24},
  year      = {2017},
  number    = {12},
  month     = dec,
  pages     = {1837--1841},
  bibsource = {http://www.visionbib.com/bibliography/other1024snn1.html#TT362821},
}

@inproceedings{bb368664,
  author    = {Gosztolya, G. and Banhalmi, A. and Toth, L.},
  title     = {Using One-Class Classification Techniques in the Anti-phoneme Problem},
  booktitle = IbPRIA09,
  year      = {2009},
  pages     = {433--440},
  bibsource = {http://www.visionbib.com/bibliography/other1024snn1.html#TT362822},
}

@article{bb368665,
  author    = {Kim, M. and Kim, H.},
  title     = {Integrated neural network model for identifying speech acts,
               predicators, and sentiments of dialogue utterances},
  journal   = PRL,
  volume    = {101},
  year      = {2018},
  number    = {1},
  pages     = {1--5},
  bibsource = {http://www.visionbib.com/bibliography/other1024snn1.html#TT362823},
}

@article{bb368666,
  author    = {Affonso, E. T. and Rosa, R. L. and Rodriguez, D. Z.},
  title     = {Speech Quality Assessment Over Lossy Transmission Channels Using Deep
               Belief Networks},
  journal   = SPLetters,
  volume    = {25},
  year      = {2018},
  number    = {1},
  month     = jan,
  pages     = {70--74},
  bibsource = {http://www.visionbib.com/bibliography/other1024snn1.html#TT362824},
}

@article{bb368667,
  author    = {Kim, H. G. and Lee, H. and Kim, G. and Oh, S. H. and Lee, S. Y.},
  title     = {Rescoring of N-Best Hypotheses Using Top-Down Selective Attention for
               Automatic Speech Recognition},
  journal   = SPLetters,
  volume    = {25},
  year      = {2018},
  number    = {2},
  month     = feb,
  pages     = {199--203},
  bibsource = {http://www.visionbib.com/bibliography/other1024snn1.html#TT362825},
}

@article{bb368668,
  author    = {Kaushik, L. and Sangwan, A. and Hansen, J. H. L.},
  title     = {Speech Activity Detection in Naturalistic Audio Environments:
               {Fearless Steps Apollo} Corpus},
  journal   = SPLetters,
  volume    = {25},
  year      = {2018},
  number    = {9},
  month     = sep,
  pages     = {1290--1294},
  bibsource = {http://www.visionbib.com/bibliography/other1024snn1.html#TT362826},
}

@article{bb368669,
  author    = {Heracleous, P. and Even, J. and Sugaya, F. and Hashimoto, M. and Yoneyama, A.},
  title     = {Exploiting alternative acoustic sensors for improved noise robustness
               in speech communication},
  journal   = PRL,
  volume    = {112},
  year      = {2018},
  pages     = {191--197},
  bibsource = {http://www.visionbib.com/bibliography/other1024snn1.html#TT362827},
}

@article{bb368670,
  author    = {Takahashi, N. and Gygli, M. and Van Gool, L. J.},
  title     = {{AENet}: Learning Deep Audio Features for Video Analysis},
  journal   = MultMed,
  volume    = {20},
  year      = {2018},
  number    = {3},
  month     = mar,
  pages     = {513--524},
  bibsource = {http://www.visionbib.com/bibliography/other1024snn1.html#TT362828},
}

@article{bb368671,
  author    = {Cho, B. J. and Lee, J. and Park, H.},
  title     = {A Beamforming Algorithm Based on Maximum Likelihood of a Complex
               {Gaussian} Distribution With Time-Varying Variances for Robust Speech
               Recognition},
  journal   = SPLetters,
  volume    = {26},
  year      = {2019},
  number    = {9},
  month     = sep,
  pages     = {1398--1402},
  bibsource = {http://www.visionbib.com/bibliography/other1024snn1.html#TT362829},
}

@article{bb368672,
  author    = {Gundogdu, B. and Yusuf, B. and Saraclar, M.},
  title     = {Generative {RNNs} for {OOV} Keyword Search},
  journal   = SPLetters,
  volume    = {26},
  year      = {2019},
  number    = {1},
  month     = jan,
  pages     = {124--128},
  bibsource = {http://www.visionbib.com/bibliography/other1024snn1.html#TT362830},
}

@article{bb368673,
  author    = {Seshadri, S. and Rasanen, O.},
  title     = {{SylNet}: An Adaptable End-to-End Syllable Count Estimator for Speech},
  journal   = SPLetters,
  volume    = {26},
  year      = {2019},
  number    = {9},
  month     = sep,
  pages     = {1359--1363},
  bibsource = {http://www.visionbib.com/bibliography/other1024snn1.html#TT362831},
}

@article{bb368674,
  author    = {Last, P. and Engelbrecht, H. A. and Kamper, H.},
  title     = {Unsupervised Feature Learning for Speech Using Correspondence and
               {Siamese} Networks},
  journal   = SPLetters,
  volume    = {27},
  year      = {2020},
  pages     = {421--425},
  bibsource = {http://www.visionbib.com/bibliography/other1024snn1.html#TT362832},
}

@article{bb368675,
  author    = {John Wesley, R. and Nayeemulla Khan, A. and Shahina, A.},
  title     = {Phoneme classification in reconstructed phase space with
               convolutional neural networks},
  journal   = PRL,
  volume    = {135},
  year      = {2020},
  pages     = {299--306},
  bibsource = {http://www.visionbib.com/bibliography/other1024snn1.html#TT362833},
}

@article{bb368676,
  author    = {Phan, H. and McLoughlin, I. V. and Pham, L. and Chen, O. Y. and Koch, P. and de Vos, M. and Mertins, A.},
  title     = {Improving {GANs} for Speech Enhancement},
  journal   = SPLetters,
  volume    = {27},
  year      = {2020},
  pages     = {1700--1704},
  bibsource = {http://www.visionbib.com/bibliography/other1024snn1.html#TT362834},
}

@article{bb368677,
  author    = {Wei, W. and Wang, Z. and Mao, X. L. and Zhou, G. Y. and Zhou, P. and Jiang, S.},
  title     = {Position-aware self-attention based neural sequence labeling},
  journal   = PR,
  volume    = {110},
  year      = {2021},
  pages     = {107636},
  bibsource = {http://www.visionbib.com/bibliography/other1024snn1.html#TT362835},
}

@article{bb368678,
  author    = {Gu, R. Z. and Zhang, S. X. and Zou, Y. X. and Yu, D.},
  title     = {Complex Neural Spatial Filter: Enhancing Multi-Channel Target Speech
               Separation in Complex Domain},
  journal   = SPLetters,
  volume    = {28},
  year      = {2021},
  pages     = {1370--1374},
  bibsource = {http://www.visionbib.com/bibliography/other1024snn1.html#TT362836},
}

@article{bb368679,
  author    = {Li, Y. X. and Wang, W. and Liu, M. and Jiang, Z. J. and He, Q. H.},
  title     = {Speaker Clustering by Co-Optimizing Deep Representation Learning and
               Cluster Estimation},
  journal   = MultMed,
  volume    = {23},
  year      = {2021},
  pages     = {3377--3387},
  bibsource = {http://www.visionbib.com/bibliography/other1024snn1.html#TT362837},
}

@article{bb368680,
  author    = {Esmaeilpour, M. and Chaalia, N. and Cardinal, P.},
  title     = {{RSD-GAN}: Regularized {Sobolev} Defense {GAN} Against Speech-to-Text
               Adversarial Attacks},
  journal   = SPLetters,
  volume    = {29},
  year      = {2022},
  pages     = {1998--2002},
  bibsource = {http://www.visionbib.com/bibliography/other1024snn1.html#TT362838},
}

@article{bb368681,
        AUTHOR = "Tian, J. C. and Yu, J. W. and Weng, C. and Zou, Y. X. and Yu, D.",
        TITLE = "Improving {Mandarin} End-to-End Speech Recognition With Word N-Gram
Language Model",
        JOURNAL = SPLetters,
        VOLUME = "29",
        YEAR = "2022",
        PAGES = "812--816",
        BIBSOURCE = "http://www.visionbib.com/bibliography/other1024snn1.html#TT362839"}

@article{bb368682,
        AUTHOR = "Mai, S. J. and Hu, H. F. and Xing, S. L.",
        TITLE = "A Unimodal Representation Learning and Recurrent Decomposition Fusion
Structure for Utterance-Level Multimodal Embedding Learning",
        JOURNAL = MultMed,
        VOLUME = "24",
        YEAR = "2022",
        PAGES = "2488--2501",
        BIBSOURCE = "http://www.visionbib.com/bibliography/other1024snn1.html#TT362840"}

@article{bb368683,
        AUTHOR = "Yang, R. and Cheng, G. F. and Zhang, P. Y. and Yan, Y. H.",
        TITLE = "An {E2E-ASR}-Based Iteratively-Trained Timestamp Estimator",
        JOURNAL = SPLetters,
        VOLUME = "29",
        YEAR = "2022",
        PAGES = "1654--1658",
        BIBSOURCE = "http://www.visionbib.com/bibliography/other1024snn1.html#TT362841"}

@article{bb368684,
        AUTHOR = "Muralikrishna, H. and Aroor Dinesh, D.",
        TITLE = "Spoken language identification in unseen channel conditions using
modified within-sample similarity loss",
        JOURNAL = PRL,
        VOLUME = "158",
        YEAR = "2022",
        PAGES = "16--23",
        BIBSOURCE = "http://www.visionbib.com/bibliography/other1024snn1.html#TT362842"}

@article{bb368685,
        AUTHOR = "Nasir, M. and Baucom, B. and Bryan, C. and Narayanan, S. and Georgiou, P.",
        TITLE = "Modeling Vocal Entrainment in Conversational Speech Using Deep
Unsupervised Learning",
        JOURNAL = AffCom,
        VOLUME = "13",
        YEAR = "2022",
        NUMBER = "3",
        MONTH = jul,
        PAGES = "1651--1663",
        BIBSOURCE = "http://www.visionbib.com/bibliography/other1024snn1.html#TT362843"}

@article{bb368686,
        AUTHOR = "Lian, Z. and Chen, L. and Sun, L. and Liu, B. and Tao, J. H.",
        TITLE = "{GCNet}: Graph Completion Network for Incomplete Multimodal Learning in
Conversation",
        JOURNAL = PAMI,
        VOLUME = "45",
        YEAR = "2023",
        NUMBER = "7",
        MONTH = jul,
        PAGES = "8419--8432",
        BIBSOURCE = "http://www.visionbib.com/bibliography/other1024snn1.html#TT362844"}

@article{bb368687,
        AUTHOR = "Sun, H. R. and Wang, D. and Li, L. and Chen, C. and Zheng, T. F.",
        TITLE = "Random Cycle Loss and Its Application to Voice Conversion",
        JOURNAL = PAMI,
        VOLUME = "45",
        YEAR = "2023",
        NUMBER = "8",
        MONTH = aug,
        PAGES = "10331--10345",
        BIBSOURCE = "http://www.visionbib.com/bibliography/other1024snn1.html#TT362845"}

@article{bb368688,
        AUTHOR = "Li, L. and Wang, A. and Xu, M. and Dong, Y. F. and Li, X.",
        TITLE = "Abductive natural language inference by interactive model with
structural loss",
        JOURNAL = PRL,
        VOLUME = "177",
        YEAR = "2024",
        PAGES = "82--88",
        BIBSOURCE = "http://www.visionbib.com/bibliography/other1024snn1.html#TT362846"}

@article{bb368689,
        AUTHOR = "Wang, Q. Q. and Lee, K. A.",
        TITLE = "Cosine Scoring With Uncertainty for Neural Speaker Embedding",
        JOURNAL = SPLetters,
        VOLUME = "31",
        YEAR = "2024",
        PAGES = "845--849",
        BIBSOURCE = "http://www.visionbib.com/bibliography/other1024snn1.html#TT362847"}

@article{bb368690,
        AUTHOR = "Singh, S. and Steinmetz, C. J. and Benetos, E. and Phan, H. and Stowell, D.",
        TITLE = "{ATGNN}: Audio Tagging Graph Neural Network",
        JOURNAL = SPLetters,
        VOLUME = "31",
        YEAR = "2024",
        PAGES = "825--829",
        BIBSOURCE = "http://www.visionbib.com/bibliography/other1024snn1.html#TT362848"}

@article{bb368691,
        AUTHOR = "Wang, S. and Ni, L. and Zhang, Z. and Li, X. X. and Zheng, X. and Liu, J.",
        TITLE = "Multimodal prediction of student performance: A fusion of signed
graph neural networks and large language models",
        JOURNAL = PRL,
        VOLUME = "181",
        YEAR = "2024",
        PAGES = "1--8",
        BIBSOURCE = "http://www.visionbib.com/bibliography/other1024snn1.html#TT362849"}

@article{bb368692,
        AUTHOR = "Song, Y. H. and Guo, L. and Man, M. and Wu, Y. X.",
        TITLE = "The spiking neural network based on {fMRI} for speech recognition",
        JOURNAL = PR,
        VOLUME = "155",
        YEAR = "2024",
        PAGES = "110672",
        BIBSOURCE = "http://www.visionbib.com/bibliography/other1024snn1.html#TT362850"}

@article{bb368693,
        AUTHOR = "Ma, D. and Yue, X. H. and Ao, J. and Gao, X. X. and Li, H. Z.",
        TITLE = "Text-Guided {HuBERT}: Self-Supervised Speech Pre-Training via
Generative Adversarial Networks",
        JOURNAL = SPLetters,
        VOLUME = "31",
        YEAR = "2024",
        PAGES = "2055--2059",
        BIBSOURCE = "http://www.visionbib.com/bibliography/other1024snn1.html#TT362851"}

@article{bb368694,
        AUTHOR = "Kim, S. S. and Lee, D. and Kang, J. Y. and Jeong, M. and Kim, N. S.",
        TITLE = "Sampling-Based Pruned Knowledge Distillation for Training Lightweight
{RNN-T}",
        JOURNAL = SPLetters,
        VOLUME = "32",
        YEAR = "2025",
        PAGES = "631--635",
        BIBSOURCE = "http://www.visionbib.com/bibliography/other1024snn1.html#TT362852"}

@inproceedings{bb368695,
        AUTHOR = "Burchi, M. and Timofte, R.",
        TITLE = "Audio-Visual Efficient Conformer for Robust Speech Recognition",
        BOOKTITLE = WACV23,
        YEAR = "2023",
        PAGES = "2257--2266",
        BIBSOURCE = "http://www.visionbib.com/bibliography/other1024snn1.html#TT362853"}

@inproceedings{bb368696,
        AUTHOR = "Aitoulghazi, O. and Jaafari, A. and Mourhir, A.",
        TITLE = "{DarSpeech}: An Automatic Speech Recognition System for the {Moroccan}
Dialect",
        BOOKTITLE = ISCV22,
        YEAR = "2022",
        PAGES = "1--6",
        BIBSOURCE = "http://www.visionbib.com/bibliography/other1024snn1.html#TT362854"}

@inproceedings{bb368697,
        AUTHOR = "Zhai, M. E. and Dong, L. H. and Qin, Y. and Yu, F. F.",
        TITLE = "The Research of Chain Model Based on {CNN-TDNNF} in {Yulin} Dialect
Speech Recognition",
        BOOKTITLE = ICIVC22,
        YEAR = "2022",
        PAGES = "883--888",
        BIBSOURCE = "http://www.visionbib.com/bibliography/other1024snn1.html#TT362855"}

@inproceedings{bb368698,
        AUTHOR = "Vedvyasan, K. and Nathwani, K. and Hegde, R. M.",
        TITLE = "Group Delay based Methods for Detection and Recognition of Whispered
Speech",
        BOOKTITLE = "ICPR22",
        YEAR = "2022",
        PAGES = "499--505",
        BIBSOURCE = "http://www.visionbib.com/bibliography/other1024snn1.html#TT362856"}

@inproceedings{bb368699,
        AUTHOR = "Toufa, A. S. and Kotropoulos, C.",
        TITLE = "Digit Recognition Applied to Reconstructed Audio Signals Using Deep
Learning",
        BOOKTITLE = ICPR21,
        YEAR = "2021",
        PAGES = "3050--3057",
        BIBSOURCE = "http://www.visionbib.com/bibliography/other1024snn1.html#TT362857"}
Last update: Nov 2, 2025 at 14:03:07