% NOTE(review): PAGES carries a chapter label rather than page numbers; kept verbatim until the real range is confirmed.
@inproceedings{bb288400,
AUTHOR = "Bregler, C. and Omohundro, S. M.",
TITLE = "Learning Visual Models for Lipreading",
BOOKTITLE = MBR97,
YEAR = "1997",
PAGES = "Chapter 13",
BIBSOURCE = "http://www.visionbib.com/bibliography/people915.html#TT283036"}
% Page numbers were an xx-yy placeholder in the source data; the field is omitted until the real range is known.
@inproceedings{bb288401,
AUTHOR = "Bregler, C. and Covell, M. and Slaney, M.",
TITLE = "Video Rewrite: Driving Visual Speech with Audio",
BOOKTITLE = "SIGGraph-97",
YEAR = "1997",
BIBSOURCE = "http://www.visionbib.com/bibliography/people915.html#TT283037"}
@inproceedings{bb288402,
AUTHOR = "Bregler, C. and Omohundro, S.",
TITLE = "Nonlinear Manifold Learning for Visual Speech Recognition",
BOOKTITLE = ICCV95,
YEAR = "1995",
PAGES = "494--499",
BIBSOURCE = "http://www.visionbib.com/bibliography/people915.html#TT283038"}
@inproceedings{bb288403,
AUTHOR = "Stork, D. G. and Hennecke, M. E.",
TITLE = "Speechreading: an overview of image processing, feature extraction,
sensory integration and pattern recognition techniques",
BOOKTITLE = AFGR96,
YEAR = "1996",
PAGES = "xvi--xxvi",
BIBSOURCE = "http://www.visionbib.com/bibliography/people915.html#TT283039"}
@article{bb288404,
AUTHOR = "Wu, J. X. and Chan, C.",
TITLE = "Recognition of phonetic labels of the {TIMIT} speech corpus by means of
an artificial neural network",
JOURNAL = PR,
VOLUME = "24",
YEAR = "1991",
NUMBER = "11",
PAGES = "1085--1091",
BIBSOURCE = "http://www.visionbib.com/bibliography/people916.html#TT283040"}
@article{bb288405,
AUTHOR = "Wu, J. T. and Tamura, S. and Mitsumoto, H. and Kawai, H. and Kurosu, K. and Okazaki, K.",
TITLE = "Neural network vowel-recognition jointly using voice features and mouth
shape image",
JOURNAL = PR,
VOLUME = "24",
YEAR = "1991",
NUMBER = "10",
PAGES = "921--927",
BIBSOURCE = "http://www.visionbib.com/bibliography/people916.html#TT283041"}
@article{bb288406,
AUTHOR = "Movellan, J. R. and Mineiro, P.",
TITLE = "Robust Sensor Fusion:
Analysis and Application to Audio-Visual Speech Recognition",
JOURNAL = MachLearn,
VOLUME = "32",
YEAR = "1998",
NUMBER = "2",
MONTH = aug,
PAGES = "85--100",
BIBSOURCE = "http://www.visionbib.com/bibliography/people916.html#TT283042"}
% Page numbers were an xx-yy placeholder in the source data; the field is omitted until the real range is known.
@article{bb288407,
AUTHOR = "Wachsmuth, S. and Socher, G. and Brandt Pook, H. and Kummert, F. and Sagerer, G. F.",
TITLE = "Integration of Vision and Speech Understanding Using {Bayesian} Networks",
JOURNAL = Videre,
VOLUME = "1",
YEAR = "2000",
NUMBER = "4",
BIBSOURCE = "http://www.visionbib.com/bibliography/people916.html#TT283043"}
@inproceedings{bb288408,
AUTHOR = "Wachsmuth, S. and Brandt Pook, H. and Socher, G. and Kummert, F. and Sagerer, G. F.",
TITLE = "Multilevel Integration of Vision and Speech Understanding Using
{Bayesian} Networks",
BOOKTITLE = CVS99,
YEAR = "1999",
PAGES = "231 ff.",
BIBSOURCE = "http://www.visionbib.com/bibliography/people916.html#TT283044"}
@article{bb288409,
AUTHOR = "Patel, D. and Turner, L. F.",
TITLE = "Effects of {ATM} network impairments on audio-visual broadcast
applications",
JOURNAL = VISP,
VOLUME = "147",
YEAR = "2000",
NUMBER = "5",
MONTH = oct,
PAGES = "436--444",
BIBSOURCE = "http://www.visionbib.com/bibliography/people916.html#TT283045"}
@article{bb288410,
AUTHOR = "Aleksic, P. S. and Williams, J. J. and Wu, Z. L. and Katsaggelos, A. K.",
TITLE = "Audio-Visual Speech Recognition Using {MPEG-4} Compliant Visual Features",
JOURNAL = JASP,
VOLUME = "2002",
YEAR = "2002",
NUMBER = "11",
MONTH = nov,
PAGES = "1213",
BIBSOURCE = "http://www.visionbib.com/bibliography/people916.html#TT283046"}
@inproceedings{bb288411,
AUTHOR = "Aleksic, P. S. and Williams, J. J. and Wu, Z. L. and Katsaggelos, A. K.",
TITLE = "Audio-visual continuous speech recognition using {MPEG-4} compliant
visual features",
BOOKTITLE = ICIP02,
YEAR = "2002",
PAGES = "I: 960--963",
BIBSOURCE = "http://www.visionbib.com/bibliography/people916.html#TT283047"}
@article{bb288412,
AUTHOR = "Aleksic, P. S. and Katsaggelos, A. K.",
TITLE = "Audio-Visual Biometrics",
JOURNAL = PIEEE,
VOLUME = "94",
YEAR = "2006",
NUMBER = "11",
MONTH = nov,
PAGES = "2025--2044",
BIBSOURCE = "http://www.visionbib.com/bibliography/people916.html#TT283048"}
@article{bb288413,
AUTHOR = "Aleksic, P. S. and Katsaggelos, A. K.",
TITLE = "Speech-to-video synthesis using {MPEG-4} compliant visual features",
JOURNAL = CirSysVideo,
VOLUME = "14",
YEAR = "2004",
NUMBER = "5",
MONTH = may,
PAGES = "682--692",
BIBSOURCE = "http://www.visionbib.com/bibliography/people916.html#TT283049"}
@inproceedings{bb288414,
AUTHOR = "Aleksic, P. S. and Katsaggelos, A. K.",
TITLE = "Comparison of {MPEG-4} Facial Animation Parameter Groups with Respect to
Audio-Visual Speech Recognition Performance",
BOOKTITLE = ICIP05,
YEAR = "2005",
PAGES = "III: 501--504",
BIBSOURCE = "http://www.visionbib.com/bibliography/people916.html#TT283050"}
@article{bb288415,
AUTHOR = "Sodoyer, D. and Schwartz, J. L. and Girin, L. and Klinkisch, J. and Jutten, C.",
TITLE = "Separation of Audio-Visual Speech Sources: A New Approach Exploiting
the Audio-Visual Coherence of Speech Stimuli",
JOURNAL = JASP,
VOLUME = "2002",
YEAR = "2002",
NUMBER = "11",
MONTH = nov,
PAGES = "1165",
BIBSOURCE = "http://www.visionbib.com/bibliography/people916.html#TT283051"}
@article{bb288416,
AUTHOR = "Heckmann, M. and Berthommier, F. and Kroschel, K.",
TITLE = "Noise Adaptive Stream Weighting in Audio-Visual Speech Recognition",
JOURNAL = JASP,
VOLUME = "2002",
YEAR = "2002",
NUMBER = "11",
MONTH = nov,
PAGES = "1260",
BIBSOURCE = "http://www.visionbib.com/bibliography/people916.html#TT283052"}
@article{bb288417,
AUTHOR = "Nefian, A. V. and Liang, L. H. and Pi, X. B. and Liu, X. X. and Murphy, K. P.",
TITLE = "Dynamic {Bayesian} Networks for Audio-Visual Speech Recognition",
JOURNAL = JASP,
VOLUME = "2002",
YEAR = "2002",
NUMBER = "11",
MONTH = nov,
PAGES = "1274",
BIBSOURCE = "http://www.visionbib.com/bibliography/people916.html#TT283053"}
@inproceedings{bb288418,
AUTHOR = "Nefian, A. V. and Liang, L. H. and Fu, T. Y. and Liu, X. X.",
TITLE = "A {Bayesian} Approach to Audio-Visual Speaker Identification",
BOOKTITLE = AVBPA03,
YEAR = "2003",
PAGES = "761--769",
BIBSOURCE = "http://www.visionbib.com/bibliography/people916.html#TT283054"}
@article{bb288419,
AUTHOR = "Patterson, E. K. and Gurbuz, S. and Tufekci, Z. and Gowdy, J. N.",
TITLE = "Moving-Talker, Speaker-Independent Feature Study, and Baseline Results
Using the {CUAVE} Multimodal Speech Corpus",
JOURNAL = JASP,
VOLUME = "2002",
YEAR = "2002",
NUMBER = "11",
MONTH = nov,
PAGES = "1189",
BIBSOURCE = "http://www.visionbib.com/bibliography/people916.html#TT283055"}
@inproceedings{bb288420,
AUTHOR = "Gurbuz, S. and Patterson, E. K. and Tufekci, Z. and Gowdy, J. N.",
TITLE = "Affine-Invariant Visual Features Contain Supplementary Information to
Enhance Speech Recognition",
BOOKTITLE = AVBPA01,
YEAR = "2001",
PAGES = "175",
BIBSOURCE = "http://www.visionbib.com/bibliography/people916.html#TT283056"}
@article{bb288421,
AUTHOR = "Kalberer, G. A. and Muller, P. and Van Gool, L. J.",
TITLE = "Visual speech, a trajectory in viseme space",
JOURNAL = IJIST,
VOLUME = "13",
YEAR = "2003",
NUMBER = "1",
PAGES = "74--84",
BIBSOURCE = "http://www.visionbib.com/bibliography/people916.html#TT283057"}
@article{bb288422,
AUTHOR = "Sharma, R. and Yeasin, M. and Krahnstoever, N. and Rauschert, I. and Cai, G. and Brewer, I. and MacEachren, A. M. and Sengupta, K.",
TITLE = "Speech-gesture driven multimodal interfaces for crisis management",
JOURNAL = PIEEE,
VOLUME = "91",
YEAR = "2003",
NUMBER = "9",
MONTH = sep,
PAGES = "1327--1354",
BIBSOURCE = "http://www.visionbib.com/bibliography/people916.html#TT283058"}
@article{bb288423,
AUTHOR = "Potamianos, G. and Neti, C. and Gravier, G. and Garg, A. and Senior, A. W.",
TITLE = "Recent advances in the automatic recognition of audiovisual speech",
JOURNAL = PIEEE,
VOLUME = "91",
YEAR = "2003",
NUMBER = "9",
MONTH = sep,
PAGES = "1306--1326",
BIBSOURCE = "http://www.visionbib.com/bibliography/people916.html#TT283059"}
@article{bb288424,
AUTHOR = "Kaynak, M. N. and Zhi, Q. and Cheok, A. D. and Sengupta, K. and Jian, Z. and Chung, K. C.",
TITLE = "Analysis of Lip Geometric Features for Audio-Visual Speech Recognition",
JOURNAL = SMC-A,
VOLUME = "34",
YEAR = "2004",
NUMBER = "4",
MONTH = jul,
PAGES = "564--570",
BIBSOURCE = "http://www.visionbib.com/bibliography/people916.html#TT283060"}
@article{bb288425,
AUTHOR = "Foo, S. W. and Lian, Y. and Dong, L.",
TITLE = "Recognition of visual speech elements using adaptively boosted hidden
{Markov} models",
JOURNAL = CirSysVideo,
VOLUME = "14",
YEAR = "2004",
NUMBER = "5",
MONTH = may,
PAGES = "693--705",
BIBSOURCE = "http://www.visionbib.com/bibliography/people916.html#TT283061"}
@article{bb288426,
AUTHOR = "Albiol, A. and Torres, L. and Delp, E. J.",
TITLE = "Fully automatic face recognition system using a combined audio-visual
approach",
JOURNAL = VISP,
VOLUME = "152",
YEAR = "2005",
NUMBER = "3",
MONTH = jun,
PAGES = "318--326",
BIBSOURCE = "http://www.visionbib.com/bibliography/people916.html#TT283062"}
@inproceedings{bb288427,
AUTHOR = "Albiol, A. and Torres, L. and Delp, E. J.",
TITLE = "A Fast Anchor Person Searching Scheme in News Sequences",
BOOKTITLE = AVBPA01,
YEAR = "2001",
PAGES = "366",
BIBSOURCE = "http://www.visionbib.com/bibliography/people916.html#TT283063"}
@inproceedings{bb288428,
AUTHOR = "Albiol, A. and Torres, L. and Delp, E. J.",
TITLE = "An Unsupervised Color Image Segmentation Algorithm for Face Detection
Applications",
BOOKTITLE = ICIP01,
YEAR = "2001",
PAGES = "II: 681--684",
BIBSOURCE = "http://www.visionbib.com/bibliography/people916.html#TT283064"}
@inproceedings{bb288429,
AUTHOR = "Albiol, A. and Torres, L. and Delp, E. J.",
TITLE = "Optimum Color Spaces for Skin Detection",
BOOKTITLE = ICIP01,
YEAR = "2001",
PAGES = "I: 122--124",
BIBSOURCE = "http://www.visionbib.com/bibliography/people916.html#TT283065"}
@article{bb288430,
AUTHOR = "Kleindienst, J. and Macek, T. and Seredi, L. and Sedivy, J.",
TITLE = "Interaction framework for home environment using speech and vision",
JOURNAL = IVC,
VOLUME = "25",
YEAR = "2007",
NUMBER = "12",
MONTH = dec,
PAGES = "1836--1847",
BIBSOURCE = "http://www.visionbib.com/bibliography/people916.html#TT283066"}
@inproceedings{bb288431,
AUTHOR = "Kleindienst, J. and Macek, T. and Seredi, L. and Sedivy, J.",
TITLE = "Djinn: Interaction Framework for Home Environment Using Speech and
Vision",
BOOKTITLE = CVHCI04,
YEAR = "2004",
PAGES = "153--164",
BIBSOURCE = "http://www.visionbib.com/bibliography/people916.html#TT283067"}
@article{bb288432,
AUTHOR = "Palanivel, S. and Yegnanarayana, B.",
TITLE = "Multimodal person authentication using speech, face and visual speech",
JOURNAL = CVIU,
VOLUME = "109",
YEAR = "2008",
NUMBER = "1",
MONTH = jan,
PAGES = "44--55",
BIBSOURCE = "http://www.visionbib.com/bibliography/people916.html#TT283068"}
@article{bb288433,
AUTHOR = "Chetty, G. and Wagner, M.",
TITLE = "Robust face-voice based speaker identity verification using multilevel
fusion",
JOURNAL = IVC,
VOLUME = "26",
YEAR = "2008",
NUMBER = "9",
MONTH = sep,
PAGES = "1249--1260",
BIBSOURCE = "http://www.visionbib.com/bibliography/people916.html#TT283069"}
@inproceedings{bb288434,
AUTHOR = "Chetty, G. and Wagner, M.",
TITLE = "Audio Visual Speaker Verification Based on Hybrid Fusion of Cross Modal
Features",
BOOKTITLE = PReMI07,
YEAR = "2007",
PAGES = "469--478",
BIBSOURCE = "http://www.visionbib.com/bibliography/people916.html#TT283070"}
@inproceedings{bb288435,
AUTHOR = "Chetty, G. and Wagner, M.",
TITLE = "Face-Voice Authentication Based on {3D} Face Models",
BOOKTITLE = ACCV06,
YEAR = "2006",
PAGES = "I: 559--568",
BIBSOURCE = "http://www.visionbib.com/bibliography/people916.html#TT283071"}
@article{bb288436,
AUTHOR = "Delakis, M. and Gravier, G. and Gros, P.",
TITLE = "Audiovisual integration with Segment Models for tennis video parsing",
JOURNAL = CVIU,
VOLUME = "111",
YEAR = "2008",
NUMBER = "2",
MONTH = aug,
PAGES = "142--154",
BIBSOURCE = "http://www.visionbib.com/bibliography/people916.html#TT283072"}
% Page numbers were an xx-yy placeholder in the source data; the field is omitted until the real range is known.
% NOTE(review): NUMBER repeats the VOLUME value (2011) -- confirm the actual issue or article number.
@article{bb288437,
AUTHOR = "Gravier, G. and Guinaudeau, C. and Lecorve, G. and Sebillot, P.",
TITLE = "Exploiting Speech for Automatic {TV} Delinearization:
From Streams to Cross-Media Semantic Navigation",
JOURNAL = JIVP,
VOLUME = "2011",
YEAR = "2011",
NUMBER = "2011",
BIBSOURCE = "http://www.visionbib.com/bibliography/people916.html#TT283073"}
@article{bb288438,
AUTHOR = "Hospedales, T. M. and Vijayakumar, S.",
TITLE = "Structure Inference for {Bayesian} Multisensory Scene Understanding",
JOURNAL = PAMI,
VOLUME = "30",
YEAR = "2008",
NUMBER = "12",
MONTH = dec,
PAGES = "2140--2157",
BIBSOURCE = "http://www.visionbib.com/bibliography/people916.html#TT283074"}
@article{bb288439,
AUTHOR = "Liu, Z. C. and Cohen, M. and Bhatnagar, D. and Cutler, R. and Zhang, Z. Y.",
TITLE = "Head-Size Equalization for Improved Visual Perception in Video
Conferencing",
JOURNAL = MultMed,
VOLUME = "9",
YEAR = "2007",
NUMBER = "7",
MONTH = nov,
PAGES = "1520--1527",
BIBSOURCE = "http://www.visionbib.com/bibliography/people916.html#TT283075"}
% Patent record: the standard BibTeX styles have no patent type, so this is typed as misc
% with the US_Patent macro in HOWPUBLISHED instead of being rendered as a conference paper.
@misc{bb288440,
AUTHOR = "Liu, Z. C. and Cutler, R. and Cohen, M. and Zhang, Z. Y.",
TITLE = "System and method for head size equalization in 360
degree panoramic images",
HOWPUBLISHED = US_Patent,
YEAR = "2007",
BIBSOURCE = "http://www.visionbib.com/bibliography/people916.html#TT283076"}
% Patent record: the standard BibTeX styles have no patent type, so this is typed as misc
% with the US_Patent macro in HOWPUBLISHED instead of being rendered as a conference paper.
@misc{bb288441,
AUTHOR = "Cutler, R.",
TITLE = "User interface for a system and method for head size
equalization in 360 degree panoramic images",
HOWPUBLISHED = US_Patent,
YEAR = "2006",
BIBSOURCE = "http://www.visionbib.com/bibliography/people916.html#TT283077"}
% Patent record: the standard BibTeX styles have no patent type, so this is typed as misc
% with the US_Patent macro in HOWPUBLISHED instead of being rendered as a conference paper.
@misc{bb288442,
AUTHOR = "Cutler, R. and Kapoor, A.",
TITLE = "System and method for audio/video speaker detection",
HOWPUBLISHED = US_Patent,
YEAR = "2008",
BIBSOURCE = "http://www.visionbib.com/bibliography/people916.html#TT283078"}
@article{bb288443,
AUTHOR = "Heracleous, P. and Aboutabit, N. and Beautemps, D.",
TITLE = "Lip Shape and Hand Position Fusion for Automatic Vowel Recognition in
Cued Speech for {French}",
JOURNAL = SPLetters,
VOLUME = "16",
YEAR = "2009",
NUMBER = "5",
MONTH = may,
PAGES = "339--342",
BIBSOURCE = "http://www.visionbib.com/bibliography/people916.html#TT283079"}
@article{bb288444,
AUTHOR = "Zhang, C. and Yin, P. and Rui, Y. and Cutler, R. and Viola, P. and Sun, X. D. and Pinto, N. and Zhang, Z. Y.",
TITLE = "Boosting-Based Multimodal Speaker Detection for Distributed Meeting
Videos",
JOURNAL = MultMed,
VOLUME = "10",
YEAR = "2008",
NUMBER = "8",
MONTH = dec,
PAGES = "1541--1552",
BIBSOURCE = "http://www.visionbib.com/bibliography/people916.html#TT283080"}
@article{bb288445,
AUTHOR = "Lee, J. S. and Park, C. H.",
TITLE = "Robust Audio-Visual Speech Recognition Based on Late Integration",
JOURNAL = MultMed,
VOLUME = "10",
YEAR = "2008",
NUMBER = "5",
MONTH = aug,
PAGES = "767--779",
BIBSOURCE = "http://www.visionbib.com/bibliography/people916.html#TT283081"}
@article{bb288446,
AUTHOR = "Schuller, B. and Muller, R. and Eyben, F. and Gast, J. and Hornler, B. and Wollmer, M. and Rigoll, G. and Hothker, A. and Konosu, H.",
TITLE = "Being bored? Recognising natural interest by extensive audiovisual
integration for real-life application",
JOURNAL = IVC,
VOLUME = "27",
YEAR = "2009",
NUMBER = "12",
MONTH = nov,
PAGES = "1760--1774",
BIBSOURCE = "http://www.visionbib.com/bibliography/people916.html#TT283082"}
@inproceedings{bb288447,
AUTHOR = "Eyben, F. and Wollmer, M. and Valstar, M. F. and Gunes, H. and Schuller, B. and Pantic, M.",
TITLE = "String-based audiovisual fusion of behavioural events for the
assessment of dimensional affect",
BOOKTITLE = FG11,
YEAR = "2011",
PAGES = "322--329",
BIBSOURCE = "http://www.visionbib.com/bibliography/people916.html#TT283083"}
@inproceedings{bb288448,
AUTHOR = "Althoff, F. and McGlaun, G. and Lang, M. K. and Rigoll, G.",
TITLE = "Evaluating Multimodal Interaction Patterns in Various Application
Scenarios",
BOOKTITLE = GW03,
YEAR = "2003",
PAGES = "421--435",
BIBSOURCE = "http://www.visionbib.com/bibliography/people916.html#TT283084"}
@article{bb288449,
AUTHOR = "Casanovas, A. L. and Monaci, G. and Vandergheynst, P. and Gribonval, R.",
TITLE = "Blind Audiovisual Source Separation Based on Sparse Redundant
Representations",
JOURNAL = MultMed,
VOLUME = "12",
YEAR = "2010",
NUMBER = "5",
PAGES = "358--371",
BIBSOURCE = "http://www.visionbib.com/bibliography/people916.html#TT283085"}
@inproceedings{bb288450,
AUTHOR = "Casanovas, A. L. and Monaci, G. and Vandergheynst, P.",
TITLE = "Blind Audiovisual Source Separation using Sparse Representations",
BOOKTITLE = ICIP07,
YEAR = "2007",
PAGES = "III: 301--304",
BIBSOURCE = "http://www.visionbib.com/bibliography/people916.html#TT283086"}
% NOTE(review): TITLE is identical to the survey in bb288452, which starts on the next page of the same issue;
% this two-page item is presumably a prolog/introduction to that survey -- confirm the exact title.
@article{bb288451,
AUTHOR = "Esch, J.",
TITLE = "Audiovisual Information Fusion in Human-Computer Interfaces and
Intelligent Environments: A Survey",
JOURNAL = PIEEE,
VOLUME = "98",
YEAR = "2010",
NUMBER = "10",
MONTH = oct,
PAGES = "1690--1691",
BIBSOURCE = "http://www.visionbib.com/bibliography/people916.html#TT283087"}
@article{bb288452,
AUTHOR = "Shivappa, S. T. and Trivedi, M. M. and Rao, B. D.",
TITLE = "Audiovisual Information Fusion in Human-Computer Interfaces and
Intelligent Environments: A Survey",
JOURNAL = PIEEE,
VOLUME = "98",
YEAR = "2010",
NUMBER = "10",
MONTH = oct,
PAGES = "1692--1715",
BIBSOURCE = "http://www.visionbib.com/bibliography/people916.html#TT283088"}
@article{bb288453,
AUTHOR = "Claussen, H. and Rosca, J. and Damper, R. I.",
TITLE = "Signature extraction using mutual interdependencies",
JOURNAL = PR,
VOLUME = "44",
YEAR = "2011",
NUMBER = "3",
MONTH = mar,
PAGES = "650--661",
BIBSOURCE = "http://www.visionbib.com/bibliography/people916.html#TT283089"}
@inproceedings{bb288454,
AUTHOR = "Higgins, J. E. and Damper, R. I.",
TITLE = "An {HMM}-Based Subband Processing Approach to Speaker Identification",
BOOKTITLE = AVBPA01,
YEAR = "2001",
PAGES = "169",
BIBSOURCE = "http://www.visionbib.com/bibliography/people916.html#TT283090"}
@article{bb288455,
AUTHOR = "Petridis, S. and Pantic, M.",
TITLE = "Audiovisual Discrimination Between Speech and Laughter:
Why and When Visual Information Might Help",
JOURNAL = MultMed,
VOLUME = "13",
YEAR = "2011",
NUMBER = "2",
PAGES = "216--234",
BIBSOURCE = "http://www.visionbib.com/bibliography/people916.html#TT283091"}
@article{bb288456,
AUTHOR = "Petridis, S. and Pantic, M.",
TITLE = "Prediction-Based Audiovisual Fusion for Classification of
Non-Linguistic Vocalisations",
JOURNAL = AffCom,
VOLUME = "7",
YEAR = "2016",
NUMBER = "1",
MONTH = jan,
PAGES = "45--58",
BIBSOURCE = "http://www.visionbib.com/bibliography/people916.html#TT283092"}
@inproceedings{bb288457,
AUTHOR = "Petridis, S. and Pantic, M.",
TITLE = "Fusion of audio and visual cues for laughter detection",
BOOKTITLE = CIVR08,
YEAR = "2008",
PAGES = "329--338",
BIBSOURCE = "http://www.visionbib.com/bibliography/people916.html#TT283093"}
@inproceedings{bb288458,
AUTHOR = "Petridis, S. and Pantic, M. and Cohn, J. F.",
TITLE = "Prediction-based classification for audiovisual discrimination between
laughter and speech",
BOOKTITLE = FG11,
YEAR = "2011",
PAGES = "619--626",
BIBSOURCE = "http://www.visionbib.com/bibliography/people916.html#TT283094"}
@article{bb288459,
AUTHOR = "Moustakas, K. and Tzovaras, D. and Dybkjaer, L. and Bernsen, N. and Aran, O.",
TITLE = "Using Modality Replacement to Facilitate Communication between Visually
and Hearing-Impaired People",
JOURNAL = MultMedMag,
VOLUME = "18",
YEAR = "2011",
NUMBER = "2",
MONTH = apr,
PAGES = "26--37",
BIBSOURCE = "http://www.visionbib.com/bibliography/people916.html#TT283095"}
@article{bb288460,
AUTHOR = "Tariquzzaman, M. and Kim, J. Y. and Na, S. Y. and Kim, H. G. and Har, D. S.",
TITLE = "A Visual Signal Reliability for Robust Audio-Visual Speaker
Identification",
JOURNAL = IEICE,
VOLUME = "E94-D",
YEAR = "2011",
NUMBER = "10",
MONTH = oct,
PAGES = "2052--2055",
BIBSOURCE = "http://www.visionbib.com/bibliography/people916.html#TT283096"}
@article{bb288461,
AUTHOR = "Tiawongsombat, P. and Jeong, M. H. and Yun, J. S. and You, B. J. and Oh, S. R.",
TITLE = "Robust visual speakingness detection using bi-level {HMM}",
JOURNAL = PR,
VOLUME = "45",
YEAR = "2012",
NUMBER = "2",
MONTH = feb,
PAGES = "783--793",
BIBSOURCE = "http://www.visionbib.com/bibliography/people916.html#TT283097"}
@article{bb288462,
AUTHOR = "Noulas, A. and Englebienne, G. and Krose, B. J. A.",
TITLE = "Multimodal Speaker Diarization",
JOURNAL = PAMI,
VOLUME = "34",
YEAR = "2012",
NUMBER = "1",
MONTH = jan,
PAGES = "79--93",
BIBSOURCE = "http://www.visionbib.com/bibliography/people916.html#TT283098"}
@article{bb288463,
AUTHOR = "Minotto, V. P. and Jung, C. R. and Lee, B.",
TITLE = "Multimodal Multi-Channel On-Line Speaker Diarization Using Sensor
Fusion Through {SVM}",
JOURNAL = MultMed,
VOLUME = "17",
YEAR = "2015",
NUMBER = "10",
MONTH = oct,
PAGES = "1694--1705",
BIBSOURCE = "http://www.visionbib.com/bibliography/people916.html#TT283099"}
@article{bb288464,
AUTHOR = "Nicolaou, M. A. and Gunes, H. and Pantic, M.",
TITLE = "Output-associative {RVM} regression for dimensional and continuous
emotion prediction",
JOURNAL = IVC,
VOLUME = "30",
YEAR = "2012",
NUMBER = "3",
MONTH = mar,
PAGES = "186--196",
BIBSOURCE = "http://www.visionbib.com/bibliography/people916.html#TT283100"}
% NOTE(review): BIBSOURCE anchor is the same one used by bb288464 (same title, journal version);
% presumably intentional for an earlier conference version -- confirm.
@inproceedings{bb288465,
AUTHOR = "Pantic, M. and Gunes, H. and Nicolaou, M. A.",
TITLE = "Output-associative {RVM} regression for dimensional and continuous
emotion prediction",
BOOKTITLE = FG11,
YEAR = "2011",
PAGES = "16--23",
BIBSOURCE = "http://www.visionbib.com/bibliography/people916.html#TT283100"}
@inproceedings{bb288466,
AUTHOR = "Nicolaou, M. A. and Gunes, H. and Pantic, M.",
TITLE = "Designing frameworks for automatic affect prediction and classification
in dimensional space",
BOOKTITLE = Gesture11,
YEAR = "2011",
PAGES = "20--26",
BIBSOURCE = "http://www.visionbib.com/bibliography/people916.html#TT283101"}
@article{bb288467,
AUTHOR = "Nicolaou, M. A. and Gunes, H. and Pantic, M.",
TITLE = "Continuous Prediction of Spontaneous Affect from Multiple Cues and
Modalities in Valence-Arousal Space",
JOURNAL = AffCom,
VOLUME = "2",
YEAR = "2011",
NUMBER = "2",
PAGES = "92--105",
BIBSOURCE = "http://www.visionbib.com/bibliography/people916.html#TT283102"}
@inproceedings{bb288468,
AUTHOR = "Nicolaou, M. A. and Gunes, H. and Pantic, M.",
TITLE = "Audio-Visual Classification and Fusion of Spontaneous Affective Data in
Likelihood Space",
BOOKTITLE = ICPR10,
YEAR = "2010",
PAGES = "3695--3699",
BIBSOURCE = "http://www.visionbib.com/bibliography/people916.html#TT283103"}
@article{bb288469,
AUTHOR = "Nicolaou, M. A. and Pavlovic, V. and Pantic, M.",
TITLE = "Dynamic Probabilistic {CCA} for Analysis of Affective Behavior and
Fusion of Continuous Annotations",
JOURNAL = PAMI,
VOLUME = "36",
YEAR = "2014",
NUMBER = "7",
MONTH = jul,
PAGES = "1299--1311",
BIBSOURCE = "http://www.visionbib.com/bibliography/people916.html#TT283104"}
@inproceedings{bb288470,
AUTHOR = "Nicolaou, M. A. and Pavlovic, V. and Pantic, M.",
TITLE = "Dynamic Probabilistic {CCA} for Analysis of Affective Behaviour",
BOOKTITLE = ECCV12,
YEAR = "2012",
PAGES = "VII: 98--111",
BIBSOURCE = "http://www.visionbib.com/bibliography/people916.html#TT283105"}
@article{bb288471,
AUTHOR = "Wang, L. J. and Qian, Y. and Scott, M. R. and Chen, G. and Soong, F. K.",
TITLE = "Computer-Assisted Audiovisual Language Learning",
JOURNAL = Computer,
VOLUME = "45",
YEAR = "2012",
NUMBER = "6",
MONTH = jun,
PAGES = "38--47",
BIBSOURCE = "http://www.visionbib.com/bibliography/people916.html#TT283106"}
@article{bb288472,
AUTHOR = "Wu, Q. X. and Wang, Z. Y. and Deng, F. Q. and Chi, Z. and Feng, D. D.",
TITLE = "Realistic Human Action Recognition with
Multimodal Feature Selection and Fusion",
JOURNAL = SMCS,
VOLUME = "43",
YEAR = "2013",
NUMBER = "4",
PAGES = "875--885",
BIBSOURCE = "http://www.visionbib.com/bibliography/people916.html#TT283107"}
@article{bb288473,
AUTHOR = "Wu, Q. X. and Wang, Z. Y. and Deng, F. Q. and Xia, Y. and Kang, W. X. and Feng, D. D.",
TITLE = "Discriminative two-level feature selection for realistic human action
recognition",
JOURNAL = JVCIR,
VOLUME = "24",
YEAR = "2013",
NUMBER = "7",
PAGES = "1064--1074",
BIBSOURCE = "http://www.visionbib.com/bibliography/people916.html#TT283108"}
@inproceedings{bb288474,
AUTHOR = "Wu, Q. X. and Wang, Z. Y. and Deng, F. Q. and Feng, D. D.",
TITLE = "Realistic Human Action Recognition with Audio Context",
BOOKTITLE = DICTA10,
YEAR = "2010",
PAGES = "288--293",
BIBSOURCE = "http://www.visionbib.com/bibliography/people916.html#TT283109"}
@inproceedings{bb288475,
AUTHOR = "Wu, Q. X. and Lu, S. Y. and Wang, Z. Y. and Deng, F. Q. and Kang, W. X. and Feng, D. D.",
TITLE = "Structure Context of Local Features in Realistic Human Action
Recognition",
BOOKTITLE = VECTaR11,
YEAR = "2011",
PAGES = "1496--1501",
BIBSOURCE = "http://www.visionbib.com/bibliography/people916.html#TT283110"}
@article{bb288476,
AUTHOR = "Mirzaei, M. R. and Ghorshi, S. and Mortazavi, M.",
TITLE = "Audio-visual speech recognition techniques in augmented reality
environments",
JOURNAL = VC,
VOLUME = "30",
YEAR = "2014",
NUMBER = "3",
MONTH = mar,
PAGES = "245--257",
BIBSOURCE = "http://www.visionbib.com/bibliography/people916.html#TT283111"}
@article{bb288477,
AUTHOR = "Bredin, H. and Roy, A. and Le, V. B. and Barras, C.",
TITLE = "Person instance graphs for mono-, cross- and multi-modal person
recognition in multimedia data: application to speaker identification
in {TV} broadcast",
JOURNAL = MultInfoRetr,
VOLUME = "3",
YEAR = "2014",
NUMBER = "3",
MONTH = sep,
PAGES = "161--175",
BIBSOURCE = "http://www.visionbib.com/bibliography/people916.html#TT283112"}
@article{bb288478,
AUTHOR = "Ozasa, Y. and Nakano, M. and Ariki, Y. and Iwahashi, N.",
TITLE = "Discriminating Unknown Objects from Known Objects Using Image and
Speech Information",
JOURNAL = IEICE,
VOLUME = "E98-D",
YEAR = "2015",
NUMBER = "3",
MONTH = mar,
PAGES = "704--711",
BIBSOURCE = "http://www.visionbib.com/bibliography/people916.html#TT283113"}
@inproceedings{bb288479,
AUTHOR = "Ozasa, Y. and Ariki, Y. and Nakano, M. and Iwahashi, N.",
TITLE = "Disambiguation in Unknown Object Detection by Integrating Image and
Speech Recognition Confidences",
BOOKTITLE = ACCV12,
YEAR = "2012",
PAGES = "I: 85--96",
BIBSOURCE = "http://www.visionbib.com/bibliography/people916.html#TT283114"}
@inproceedings{bb288480,
AUTHOR = "Nishimura, H. and Ozasa, Y. and Ariki, Y. and Nakano, M.",
TITLE = "Selection of Unknown Objects Specified by Speech Using Models
Constructed from Web Images",
BOOKTITLE = ICPR14,
YEAR = "2014",
PAGES = "477--482",
BIBSOURCE = "http://www.visionbib.com/bibliography/people916.html#TT283115"}
@inproceedings{bb288481,
AUTHOR = "Nishimura, H. and Ozasa, Y. and Ariki, Y. and Nakano, M.",
TITLE = "Object Recognition by Integrated Information Using Web Images",
BOOKTITLE = ACPR13,
YEAR = "2013",
PAGES = "657--661",
BIBSOURCE = "http://www.visionbib.com/bibliography/people916.html#TT283116"}
@inproceedings{bb288482,
AUTHOR = "Ozasa, Y. and Enami, N. and Ariki, Y.",
TITLE = "Color saliency for object identification",
BOOKTITLE = FCV15,
YEAR = "2015",
PAGES = "1--5",
BIBSOURCE = "http://www.visionbib.com/bibliography/people916.html#TT283117"}
@article{bb288483,
AUTHOR = "Harte, N. and Gillen, E.",
TITLE = "{TCD-TIMIT}: An Audio-Visual Corpus of Continuous Speech",
JOURNAL = MultMed,
VOLUME = "17",
YEAR = "2015",
NUMBER = "5",
MONTH = may,
PAGES = "603--615",
BIBSOURCE = "http://www.visionbib.com/bibliography/people916.html#TT283118"}
@article{bb288484,
AUTHOR = "Katsaggelos, A. K. and Bahaadini, S. and Molina, R.",
TITLE = "Audiovisual Fusion: Challenges and New Approaches",
JOURNAL = PIEEE,
VOLUME = "103",
YEAR = "2015",
NUMBER = "9",
MONTH = sep,
PAGES = "1635--1653",
BIBSOURCE = "http://www.visionbib.com/bibliography/people916.html#TT283119"}
@article{bb288485,
AUTHOR = "Mezai, L. and Hachouf, F.",
TITLE = "Score-Level Fusion of Face and Voice Using Particle Swarm
Optimization and Belief Functions",
JOURNAL = HMS,
VOLUME = "45",
YEAR = "2015",
NUMBER = "6",
MONTH = dec,
PAGES = "761--772",
BIBSOURCE = "http://www.visionbib.com/bibliography/people916.html#TT283120"}
@article{bb288486,
AUTHOR = "Wu, P. and Liu, H. and Li, X. and Fan, T. and Zhang, X.",
TITLE = "A Novel Lip Descriptor for Audio-Visual Keyword Spotting Based on
Adaptive Decision Fusion",
JOURNAL = MultMed,
VOLUME = "18",
YEAR = "2016",
NUMBER = "3",
MONTH = mar,
PAGES = "326--338",
BIBSOURCE = "http://www.visionbib.com/bibliography/people916.html#TT283121"}
@article{bb288487,
AUTHOR = "Dilpazir, H. and Muhammad, Z. and Minhas, Q. and Ahmed, F. and Malik, H. and Mahmood, H.",
TITLE = "Multivariate mutual information for audio video fusion",
JOURNAL = SIViP,
VOLUME = "10",
YEAR = "2016",
NUMBER = "7",
MONTH = oct,
PAGES = "1265--1272",
BIBSOURCE = "http://www.visionbib.com/bibliography/people916.html#TT283122"}
@article{bb288488,
AUTHOR = "Beyan, C. and Capozzi, F. and Becchio, C. and Murino, V.",
TITLE = "Prediction of the Leadership Style of an Emergent Leader Using Audio
and Visual Nonverbal Features",
JOURNAL = MultMed,
VOLUME = "20",
YEAR = "2018",
NUMBER = "2",
MONTH = feb,
PAGES = "441--456",
BIBSOURCE = "http://www.visionbib.com/bibliography/people916.html#TT283123"}
@article{bb288489,
AUTHOR = "Fernandez Lopez, A. and Sukno, F. M.",
TITLE = "Survey on automatic lip-reading in the era of deep learning",
JOURNAL = IVC,
VOLUME = "78",
YEAR = "2018",
PAGES = "53--72",
BIBSOURCE = "http://www.visionbib.com/bibliography/people916.html#TT283124"}
@article{bb288490,
AUTHOR = "Stafylakis, T. and Khan, M. H. and Tzimiropoulos, G.",
TITLE = "Pushing the boundaries of audiovisual word recognition using Residual
Networks and {LSTMs}",
JOURNAL = CVIU,
VOLUME = "176-177",
YEAR = "2018",
PAGES = "22--32",
BIBSOURCE = "http://www.visionbib.com/bibliography/people916.html#TT283125"}
@inproceedings{bb288491,
AUTHOR = "Stafylakis, T. and Tzimiropoulos, G.",
TITLE = "Zero-Shot Keyword Spotting for Visual Speech Recognition In-the-wild",
BOOKTITLE = ECCV18,
YEAR = "2018",
PAGES = "II: 536--552",
BIBSOURCE = "http://www.visionbib.com/bibliography/people916.html#TT283126"}
@article{bb288492,
AUTHOR = "Liu, X. and Geng, J. J. and Ling, H. B. and Cheung, Y. M.",
TITLE = "Attention guided deep audio-face fusion for efficient speaker naming",
JOURNAL = PR,
VOLUME = "88",
YEAR = "2019",
PAGES = "557--568",
BIBSOURCE = "http://www.visionbib.com/bibliography/people916.html#TT283127"}
@article{bb288493,
AUTHOR = "Tsiami, A. and Koutras, P. and Katsamanis, A. and Vatakis, A. and Maragos, P.",
TITLE = "A behaviorally inspired fusion approach for computational audiovisual
saliency modeling",
JOURNAL = SP:IC,
VOLUME = "76",
YEAR = "2019",
PAGES = "186--200",
BIBSOURCE = "http://www.visionbib.com/bibliography/people916.html#TT283128"}
@article{bb288494,
AUTHOR = "Hsiao, S. and Sun, H. and Hsieh, M. and Tsai, M. and Tsao, Y. and Lee, C.",
TITLE = "Toward Automating Oral Presentation Scoring During Principal
Certification Program Using Audio-Video Low-Level Behavior Profiles",
JOURNAL = AffCom,
VOLUME = "10",
YEAR = "2019",
NUMBER = "4",
MONTH = oct,
PAGES = "552--567",
BIBSOURCE = "http://www.visionbib.com/bibliography/people916.html#TT283129"}
% Page numbers were an xx-yy placeholder in the source data; the field is omitted until the real range is known.
@article{bb288495,
AUTHOR = "Ma, Y. and Hong, H. and Li, H. and Zhao, H. and Li, Y. S. and Sun, L. and Gu, C. and Zhu, X. H.",
TITLE = "Non-Contact Speech Recovery Technology Using a 24 {GHz} Portable
Auditory Radar and Webcam",
JOURNAL = RS,
VOLUME = "12",
YEAR = "2020",
NUMBER = "4",
BIBSOURCE = "http://www.visionbib.com/bibliography/people916.html#TT283130"}
@inproceedings{bb288496,
AUTHOR = "Xu, B. and Wang, J. and Lu, C. and Guo, Y.",
TITLE = "Watch to Listen Clearly: Visual Speech Enhancement Driven
Multi-modality Speech Recognition",
BOOKTITLE = WACV20,
YEAR = "2020",
PAGES = "1626--1635",
BIBSOURCE = "http://www.visionbib.com/bibliography/people916.html#TT283131"}
@article{bb288497,
AUTHOR = "Tao, F. and Busso, C.",
TITLE = "End-to-End Audiovisual Speech Recognition System With Multitask
Learning",
JOURNAL = MultMed,
VOLUME = "23",
YEAR = "2021",
PAGES = "1--11",
BIBSOURCE = "http://www.visionbib.com/bibliography/people916.html#TT283132"}
@article{bb288498,
AUTHOR = "Xu, J. H. and Zhang, B. and Wang, Z. Y. and Wang, Y. and Chen, F. and Gao, J. B. and Feng, D. D.",
TITLE = "Affective Audio Annotation of Public Speeches with Convolutional
Clustering Neural Network",
JOURNAL = AffCom,
VOLUME = "13",
YEAR = "2022",
NUMBER = "1",
MONTH = jan,
PAGES = "238--249",
BIBSOURCE = "http://www.visionbib.com/bibliography/people916.html#TT283133"}
@article{bb288499,
AUTHOR = "Afouras, T. and Chung, J. S. and Senior, A. and Vinyals, O. and Zisserman, A.",
TITLE = "Deep Audio-Visual Speech Recognition",
JOURNAL = PAMI,
VOLUME = "44",
YEAR = "2022",
NUMBER = "12",
MONTH = dec,
PAGES = "8717--8727",
BIBSOURCE = "http://www.visionbib.com/bibliography/people916.html#TT283134"}
Last update: Feb 26, 2026 at 10:58:24