@inproceedings{bb198200,
        AUTHOR = "Wang, X. and Huang, Q. and Celikyilmaz, A. and Gao, J.F. and Shen, D. and Wang, Y.F. and Wang, W.Y. and Zhang, L.",
        TITLE = "Reinforced Cross-Modal Matching and Self-Supervised Imitation Learning for Vision-Language Navigation",
        BOOKTITLE = "CVPR19",
        YEAR = "2019",
        PAGES = "6622--6631",
        BIBSOURCE = "http://www.visionbib.com/bibliography/people916.html#TT193403"}

@inproceedings{bb198201,
        AUTHOR = "Niu, Y.L. and Zhang, H.W. and Zhang, M.L. and Zhang, J.H. and Lu, Z.W. and Wen, J.R.",
        TITLE = "Recursive Visual Attention in Visual Dialog",
        BOOKTITLE = "CVPR19",
        YEAR = "2019",
        PAGES = "6672--6681",
        BIBSOURCE = "http://www.visionbib.com/bibliography/people916.html#TT193404"}

@inproceedings{bb198202,
        AUTHOR = "Schwartz, I. and Schwing, A.G. and Hazan, T.",
        TITLE = "A Simple Baseline for Audio-Visual Scene-Aware Dialog",
        BOOKTITLE = "CVPR19",
        YEAR = "2019",
        PAGES = "12540--12550",
        BIBSOURCE = "http://www.visionbib.com/bibliography/people916.html#TT193405"}

@inproceedings{bb198203,
        AUTHOR = "Lu, Y. and Lee, H. and Tseng, H. and Yang, M.",
        TITLE = "Self-Supervised Audio Spatialization with Correspondence Classifier",
        BOOKTITLE = ICIP19,
        YEAR = "2019",
        PAGES = "3347--3351",
        BIBSOURCE = "http://www.visionbib.com/bibliography/people916.html#TT193406"}

@inproceedings{bb198204,
        AUTHOR = "Liu, H. and Li, Y. and Yang, B.",
        TITLE = "{3D} Audio-Visual Speaker Tracking with A Two-Layer Particle Filter",
        BOOKTITLE = ICIP19,
        YEAR = "2019",
        PAGES = "1955--1959",
        BIBSOURCE = "http://www.visionbib.com/bibliography/people916.html#TT193407"}

@inproceedings{bb198205,
        AUTHOR = "Saidi, I. and Zhang, L. and Barriac, V. and Deforges, O.",
        TITLE = "Laboratory and Crowdsourcing Studies of Lip Sync Effect on the Audio-Video Quality Assessment for Videoconferencing Application",
        BOOKTITLE = ICIP19,
        YEAR = "2019",
        PAGES = "3207--3211",
        BIBSOURCE = "http://www.visionbib.com/bibliography/people916.html#TT193408"}

@inproceedings{bb198206,
        AUTHOR = "Meng, D. and Peng, X. and Wang, K. and Qiao, Y.",
        TITLE = "Frame Attention Networks for Facial Expression Recognition in Videos",
        BOOKTITLE = ICIP19,
        YEAR = "2019",
        PAGES = "3866--3870",
        BIBSOURCE = "http://www.visionbib.com/bibliography/people916.html#TT193409"}

@inproceedings{bb198207,
        AUTHOR = "Shahid, M. and Beyan, C. and Murino, V.",
        TITLE = "Comparisons of Visual Activity Primitives for Voice Activity Detection",
        BOOKTITLE = CIAP19,
        YEAR = "2019",
        PAGES = "I:48--59",
        BIBSOURCE = "http://www.visionbib.com/bibliography/people916.html#TT193410"}

@inproceedings{bb198208,
        AUTHOR = "Kim, C.I. and Shin, H.J.V. and Oh, T.H. and Kaspar, A. and Elgharib, M. and Matusik, W.",
        TITLE = "On Learning Associations of Faces and Voices",
        BOOKTITLE = ACCV18,
        YEAR = "2018",
        PAGES = "V:276--292",
        BIBSOURCE = "http://www.visionbib.com/bibliography/people916.html#TT193411"}

@inproceedings{bb198209,
        AUTHOR = "Schindler, A. and Boyer, M. and Lindley, A. and Schreiber, D. and Philipp, T.",
        TITLE = "Large Scale Audio-Visual Video Analytics Platform for Forensic Investigations of Terroristic Attacks",
        BOOKTITLE = "MMMod19",
        YEAR = "2019",
        PAGES = "II:106--119",
        BIBSOURCE = "http://www.visionbib.com/bibliography/people916.html#TT193412"}

% NOTE(review): the end page of bb198210 (22297) has five digits against a four-digit start page; it looks malformed -- verify against the proceedings.
@inproceedings{bb198210,
        AUTHOR = "Oliveira, D.A.B. and Mattos, A.B. and da Silva Morais, E.",
        TITLE = "Improving Viseme Recognition Using {GAN}-Based Frontal View Mapping",
        BOOKTITLE = AMFG18,
        YEAR = "2018",
        PAGES = "2229--22297",
        BIBSOURCE = "http://www.visionbib.com/bibliography/people916.html#TT193413"}

@inproceedings{bb198211,
        AUTHOR = "Yang, X. and Molchanov, P. and Kautz, J.",
        TITLE = "Making Convolutional Networks Recurrent for Visual Sequence Learning",
        BOOKTITLE = CVPR18,
        YEAR = "2018",
        PAGES = "6469--6478",
        BIBSOURCE = "http://www.visionbib.com/bibliography/people916.html#TT193414"}

@inproceedings{bb198212,
        AUTHOR = "Zhang, J. and Richmond, K. and Fisher, R.B.",
        TITLE = "Dual-modality Talking-metrics: {3D} Visual-Audio Integrated Behaviometric Cues from Speakers",
        BOOKTITLE = ICPR18,
        YEAR = "2018",
        PAGES = "3144--3149",
        BIBSOURCE = "http://www.visionbib.com/bibliography/people916.html#TT193415"}

@inproceedings{bb198213,
        AUTHOR = "Chowdhury, A. and Atoum, Y. and Tran, L. and Liu, X. and Ross, A.",
        TITLE = "{MSU-AVIS} dataset: Fusing Face and Voice Modalities for Biometric Recognition in Indoor Surveillance Videos",
        BOOKTITLE = ICPR18,
        YEAR = "2018",
        PAGES = "3567--3573",
        BIBSOURCE = "http://www.visionbib.com/bibliography/people916.html#TT193416"}

@inproceedings{bb198214,
        AUTHOR = "Nagrani, A. and Albanie, S. and Zisserman, A.",
        TITLE = "Seeing Voices and Hearing Faces: Cross-Modal Biometric Matching",
        BOOKTITLE = CVPR18,
        YEAR = "2018",
        PAGES = "8427--8436",
        BIBSOURCE = "http://www.visionbib.com/bibliography/people916.html#TT193417"}

@inproceedings{bb198215,
        AUTHOR = "Saitoh, T. and Kubokawa, M.",
        TITLE = "{SSSD}: Speech Scene database by Smart Device for Visual Speech Recognition",
        BOOKTITLE = ICPR18,
        YEAR = "2018",
        PAGES = "3228--3232",
        BIBSOURCE = "http://www.visionbib.com/bibliography/people916.html#TT193418"}

@inproceedings{bb198216,
        AUTHOR = "Owens, A. and Efros, A.A.",
        TITLE = "Audio-Visual Scene Analysis with Self-Supervised Multisensory Features",
        BOOKTITLE = ECCV18,
        YEAR = "2018",
        PAGES = "VI: 639--658",
        BIBSOURCE = "http://www.visionbib.com/bibliography/people916.html#TT193419"}

@inproceedings{bb198217,
        AUTHOR = "Berlin, A.A. and Surati, R.",
        TITLE = "Video Deconfounding: Hearing-Aid Inspired Video Enhancement",
        BOOKTITLE = IVMSP18,
        YEAR = "2018",
        PAGES = "1--5",
        BIBSOURCE = "http://www.visionbib.com/bibliography/people916.html#TT193420"}

@inproceedings{bb198218,
        AUTHOR = "Ding, R. and Pang, C. and Liu, H.",
        TITLE = "Audio-Visual Keyword Spotting Based on Multidimensional Convolutional Neural Network",
        BOOKTITLE = ICIP18,
        YEAR = "2018",
        PAGES = "4138--4142",
        BIBSOURCE = "http://www.visionbib.com/bibliography/people916.html#TT193421"}

@inproceedings{bb198219,
        AUTHOR = "Liao, J. and Wang, S. and Zhang, X. and Liu, G.",
        TITLE = "{3D} Convolutional Neural Networks Based Speaker Identification and Authentication",
        BOOKTITLE = ICIP18,
        YEAR = "2018",
        PAGES = "2042--2046",
        BIBSOURCE = "http://www.visionbib.com/bibliography/people916.html#TT193422"}

@inproceedings{bb198220,
        AUTHOR = "Savran, A. and Tavarone, R. and Higy, B. and Badino, L. and Bartolozzi, C.",
        TITLE = "Energy and Computation Efficient Audio-Visual Voice Activity Detection Driven by Event-Cameras",
        BOOKTITLE = FG18,
        YEAR = "2018",
        PAGES = "333--340",
        BIBSOURCE = "http://www.visionbib.com/bibliography/people916.html#TT193423"}

@inproceedings{bb198221,
        AUTHOR = "Ephrat, A. and Halperin, T. and Peleg, S.",
        TITLE = "Improved Speech Reconstruction from Silent Video",
        BOOKTITLE = CVAVM17,
        YEAR = "2017",
        PAGES = "455--462",
        BIBSOURCE = "http://www.visionbib.com/bibliography/people916.html#TT193424"}

@inproceedings{bb198222,
        AUTHOR = "Ban, Y. and Girin, L. and Alameda Pineda, X. and Horaud, R.",
        TITLE = "Exploiting the Complementarity of Audio and Visual Data in Multi-speaker Tracking",
        BOOKTITLE = CVAVM17,
        YEAR = "2017",
        PAGES = "446--454",
        BIBSOURCE = "http://www.visionbib.com/bibliography/people916.html#TT193425"}

@inproceedings{bb198223,
        AUTHOR = "Le, N. and Heili, A. and Wu, D. and Odobez, J.M.",
        TITLE = "Temporally subsampled detection for accurate and efficient face tracking and diarization",
        BOOKTITLE = ICPR16,
        YEAR = "2016",
        PAGES = "1792--1797",
        BIBSOURCE = "http://www.visionbib.com/bibliography/people916.html#TT193426"}

@inproceedings{bb198224,
        AUTHOR = "Ahn, J. and Kim, Y.J. and Kim, D.J.",
        TITLE = "Patch-based visual microphone for improving quality of sound",
        BOOKTITLE = ICPR16,
        YEAR = "2016",
        PAGES = "3927--3932",
        BIBSOURCE = "http://www.visionbib.com/bibliography/people916.html#TT193427"}

@inproceedings{bb198225,
        AUTHOR = "Chung, J.S. and Zisserman, A.",
        TITLE = "Out of Time: Automated Lip Sync in the Wild",
        BOOKTITLE = LipRead16,
        YEAR = "2016",
        PAGES = "II: 251--263",
        BIBSOURCE = "http://www.visionbib.com/bibliography/people916.html#TT193428"}

@inproceedings{bb198226,
        AUTHOR = "Miao, C.L. and Feng, J.W. and Ding, Y. and Yang, Y. and Chen, X.G. and Ji, X.Y.",
        TITLE = "Unsupervised person clustering in videos with cross-modal communication",
        BOOKTITLE = VCIP16,
        YEAR = "2016",
        PAGES = "1--4",
        BIBSOURCE = "http://www.visionbib.com/bibliography/people916.html#TT193429"}

@inproceedings{bb198227,
        AUTHOR = "Hu, D. and Li, X.L. and Lu, X.Q.",
        TITLE = "Temporal Multimodal Learning in Audiovisual Speech Recognition",
        BOOKTITLE = CVPR16,
        YEAR = "2016",
        PAGES = "3574--3582",
        BIBSOURCE = "http://www.visionbib.com/bibliography/people916.html#TT193430"}

@inproceedings{bb198228,
        AUTHOR = "Liu, H. and Fan, T. and Wu, P.P.",
        TITLE = "Audio-visual Keyword Spotting for {Mandarin} Based on Discriminative Local Spatial-Temporal Descriptors",
        BOOKTITLE = ICPR14,
        YEAR = "2014",
        PAGES = "785--790",
        BIBSOURCE = "http://www.visionbib.com/bibliography/people916.html#TT193431"}

@inproceedings{bb198229,
        AUTHOR = "Ringeval, F. and Sonderegger, A. and Sauer, J. and Lalanne, D.",
        TITLE = "Introducing the {RECOLA} multimodal corpus of remote collaborative and affective interactions",
        BOOKTITLE = FG13,
        YEAR = "2013",
        PAGES = "1--8",
        BIBSOURCE = "http://www.visionbib.com/bibliography/people916.html#TT193432"}

@inproceedings{bb198230,
        AUTHOR = "Aubrey, A.J. and Cunningham, D.W. and Marshall, D. and Rosin, P.L. and Shin, A.",
        TITLE = "The Face Speaks: Contextual and Temporal Sensitivity to Backchannel Responses",
        BOOKTITLE = FaceCVHum12,
        YEAR = "2012",
        PAGES = "II:248--259",
        BIBSOURCE = "http://www.visionbib.com/bibliography/people916.html#TT193433"}

@inproceedings{bb198231,
        AUTHOR = "Tawari, A. and Trivedi, M.",
        TITLE = "Audio-visual data association for face expression analysis",
        BOOKTITLE = ICPR12,
        YEAR = "2012",
        PAGES = "1120--1123",
        BIBSOURCE = "http://www.visionbib.com/bibliography/people916.html#TT193434"}

@inproceedings{bb198232,
        AUTHOR = "Taj, M. and Cavallaro, A.",
        TITLE = "Interaction recognition in wide areas using audiovisual sensors",
        BOOKTITLE = ICIP12,
        YEAR = "2012",
        PAGES = "1113--1116",
        BIBSOURCE = "http://www.visionbib.com/bibliography/people916.html#TT193435"}

@inproceedings{bb198233,
        AUTHOR = "Giorgolo, G.",
        TITLE = "Integration of Gesture and Verbal Language: A Formal Semantics Approach",
        BOOKTITLE = GW11,
        YEAR = "2011",
        PAGES = "216--227",
        BIBSOURCE = "http://www.visionbib.com/bibliography/people916.html#TT193436"}

@inproceedings{bb198234,
        AUTHOR = "Le, Q.A. and Pelachaud, C.",
        TITLE = "Generating Co-speech Gestures for the Humanoid Robot {NAO} through {BML}",
        BOOKTITLE = GW11,
        YEAR = "2011",
        PAGES = "228--237",
        BIBSOURCE = "http://www.visionbib.com/bibliography/people916.html#TT193437"}

@inproceedings{bb198235,
        AUTHOR = "Saeed, A. and Al Hamadi, A. and Heuer, M.",
        TITLE = "Speaker Tracking Using Multi-modal Fusion Framework",
        BOOKTITLE = ICISP12,
        YEAR = "2012",
        PAGES = "539--546",
        BIBSOURCE = "http://www.visionbib.com/bibliography/people916.html#TT193438"}

@inproceedings{bb198236,
        AUTHOR = "Navarathna, R. and Dean, D. and Sridharan, S. and Fookes, C. and Lucey, P.",
        TITLE = "Visual Voice Activity Detection Using Frontal versus Profile Views",
        BOOKTITLE = DICTA11,
        YEAR = "2011",
        PAGES = "134--139",
        BIBSOURCE = "http://www.visionbib.com/bibliography/people916.html#TT193439"}

@inproceedings{bb198237,
        AUTHOR = "Komai, Y. and Ariki, Y. and Takiguchi, T.",
        TITLE = "Audio-Visual Speech Recognition Based on {AAM} Parameter and Phoneme Analysis of Visual Feature",
        BOOKTITLE = PSIVT11,
        YEAR = "2011",
        PAGES = "I: 97--108",
        BIBSOURCE = "http://www.visionbib.com/bibliography/people916.html#TT193440"}

@inproceedings{bb198238,
        AUTHOR = "Zheng, H.M. and Wang, M. and Li, Z.",
        TITLE = "Audio-visual speaker identification with multi-view distance metric learning",
        BOOKTITLE = ICIP10,
        YEAR = "2010",
        PAGES = "4561--4564",
        BIBSOURCE = "http://www.visionbib.com/bibliography/people916.html#TT193441"}

@inproceedings{bb198239,
        AUTHOR = "Krishnan, R.K. and Sarkar, S.",
        TITLE = "Similarity Measure between Two Gestures Using Triplets",
        BOOKTITLE = HAU3D13,
        YEAR = "2013",
        PAGES = "506--513",
        BIBSOURCE = "http://www.visionbib.com/bibliography/people916.html#TT193442"}

@inproceedings{bb198240,
        AUTHOR = "Krishnan, R.K. and Sarkar, S.",
        TITLE = "Detecting Group Turn Patterns in Conversations Using Audio-Video Change Scale-Space",
        BOOKTITLE = ICPR10,
        YEAR = "2010",
        PAGES = "137--140",
        BIBSOURCE = "http://www.visionbib.com/bibliography/people916.html#TT193443"}

@inproceedings{bb198241,
        AUTHOR = "Aran, O. and Gatica Perez, D.",
        TITLE = "Fusing Audio-Visual Nonverbal Cues to Detect Dominant People in Group Conversations",
        BOOKTITLE = ICPR10,
        YEAR = "2010",
        PAGES = "3687--3690",
        BIBSOURCE = "http://www.visionbib.com/bibliography/people916.html#TT193444"}

@inproceedings{bb198242,
        AUTHOR = "Niese, R. and Al Hamadi, A. and Michaelis, B.",
        TITLE = "A New Multi-camera Based Facial Expression Analysis Concept",
        BOOKTITLE = ICIAR12,
        YEAR = "2012",
        PAGES = "II: 64--71",
        BIBSOURCE = "http://www.visionbib.com/bibliography/people916.html#TT193445"}

@inproceedings{bb198243,
        AUTHOR = "Steer, M.A. and Al Hamadi, A. and Michaelis, B.",
        TITLE = "Audio-Visual Data Fusion Using a Particle Filter in the Application of Face Recognition",
        BOOKTITLE = ICPR10,
        YEAR = "2010",
        PAGES = "4392--4395",
        BIBSOURCE = "http://www.visionbib.com/bibliography/people916.html#TT193446"}

@inproceedings{bb198244,
        AUTHOR = "Roy, A. and Marcel, S.",
        TITLE = "Crossmodal Matching of Speakers Using Lip and Voice Features in Temporally Non-overlapping Audio and Video Streams",
        BOOKTITLE = ICPR10,
        YEAR = "2010",
        PAGES = "4504--4507",
        BIBSOURCE = "http://www.visionbib.com/bibliography/people916.html#TT193447"}

@inproceedings{bb198245,
        AUTHOR = "Cour, T. and Sapp, B. and Nagle, A. and Taskar, B.",
        TITLE = "Talking pictures: Temporal grouping and dialog-supervised person recognition",
        BOOKTITLE = CVPR10,
        YEAR = "2010",
        PAGES = "1014--1021",
        BIBSOURCE = "http://www.visionbib.com/bibliography/people916.html#TT193448"}

@inproceedings{bb198246,
        AUTHOR = "Wu, G.Y. and Zhu, J. and Xu, H.H.",
        TITLE = "A hybrid visual feature extraction method for audio-visual speech recognition",
        BOOKTITLE = ICIP09,
        YEAR = "2009",
        PAGES = "1829--1832",
        BIBSOURCE = "http://www.visionbib.com/bibliography/people916.html#TT193449"}

@inproceedings{bb198247,
        AUTHOR = "Ceballos, A. and Gomez, J. and Prieto, F. and Redarce, T.",
        TITLE = "Robot Command Interface Using an Audio-Visual Speech Recognition System",
        BOOKTITLE = CIARP09,
        YEAR = "2009",
        PAGES = "869--876",
        BIBSOURCE = "http://www.visionbib.com/bibliography/people916.html#TT193450"}

@inproceedings{bb198248,
        AUTHOR = "Cifani, S. and Abel, A. and Hussain, A. and Squartini, S. and Piazza, F.",
        TITLE = "An Investigation into Audiovisual Speech Correlation in Reverberant Noisy Environments",
        BOOKTITLE = COST08,
        YEAR = "2008",
        PAGES = "331--343",
        BIBSOURCE = "http://www.visionbib.com/bibliography/people916.html#TT193451"}

@inproceedings{bb198249,
        AUTHOR = "Fanelli, G. and Gall, J. and Van Gool, L.J.",
        TITLE = "{Hough} transform-based mouth localization for audio-visual speech recognition",
        BOOKTITLE = BMVC09,
        YEAR = "2009",
        BIBSOURCE = "http://www.visionbib.com/bibliography/people916.html#TT193452"}

@inproceedings{bb198250,
        AUTHOR = "Cadavid, S. and Abdel Mottaleb, M. and Messinger, D.S. and Mahoor, M.H. and Bahrick, L.E.",
        TITLE = "Detecting local audio-visual synchrony in monologues utilizing vocal pitch and facial landmark trajectories",
        BOOKTITLE = BMVC09,
        YEAR = "2009",
        BIBSOURCE = "http://www.visionbib.com/bibliography/people916.html#TT193453"}

@inproceedings{bb198251,
        AUTHOR = "Lee, J.S. and Ebrahimi, T.",
        TITLE = "Two-Level Bimodal Association for Audio-Visual Speech Recognition",
        BOOKTITLE = ACIVS09,
        YEAR = "2009",
        PAGES = "133--144",
        BIBSOURCE = "http://www.visionbib.com/bibliography/people916.html#TT193454"}

@inproceedings{bb198252,
        AUTHOR = "Marchegiani, M.L. and Pirri, F. and Pizzoli, M.",
        TITLE = "Multimodal Speaker Recognition in a Conversation Scenario",
        BOOKTITLE = CVS09,
        YEAR = "2009",
        PAGES = "11--20",
        BIBSOURCE = "http://www.visionbib.com/bibliography/people916.html#TT193455"}

@inproceedings{bb198253,
        AUTHOR = "Kumar, K. and Navratil, J. and Marcheret, E. and Libal, V. and Ramaswamy, G. and Potamianos, G.",
        TITLE = "Audio-visual speech synchronization detection using a bimodal linear prediction model",
        BOOKTITLE = Biometrics09,
        YEAR = "2009",
        PAGES = "53--59",
        BIBSOURCE = "http://www.visionbib.com/bibliography/people916.html#TT193456"}

@inproceedings{bb198254,
        AUTHOR = "Karam, W. and Mokbel, C. and Greige, H. and Chollet, G.",
        TITLE = "Audio-Visual Identity Verification and Robustness to Imposture",
        BOOKTITLE = ICB09,
        YEAR = "2009",
        PAGES = "796--805",
        BIBSOURCE = "http://www.visionbib.com/bibliography/people916.html#TT193457"}

@inproceedings{bb198255,
        AUTHOR = "Rebillat, M. and Katz, B.F.G. and Corteel, E.",
        TITLE = "{SMART-I2}: Spatial Multi-user Audio-visual Real-time interactive interface, A broadcast application context",
        BOOKTITLE = "3DTV09",
        YEAR = "2009",
        PAGES = "1--4",
        BIBSOURCE = "http://www.visionbib.com/bibliography/people916.html#TT193458"}

@inproceedings{bb198256,
  author    = {Eisenstein, J.},
  title     = {Gesture in Automatic Discourse Processing},
  booktitle = CSAIL,
  year      = {2008},
  bibsource = {http://www.visionbib.com/bibliography/people916.html#TT193459}
}

% bb198257 is the Ph.D. thesis record; bb198256 cites the same work (same BIBSOURCE anchor) with CSAIL as venue.
% NOTE(review): SCHOOL is assumed to be MIT (CSAIL is an MIT laboratory) -- confirm against the thesis.
@phdthesis{bb198257,
        AUTHOR = "Eisenstein, J.",
        TITLE = "Gesture in Automatic Discourse Processing",
        SCHOOL = "Massachusetts Institute of Technology",
        YEAR = "2008",
        BIBSOURCE = "http://www.visionbib.com/bibliography/people916.html#TT193459"}

@inproceedings{bb198258,
        AUTHOR = "Das, A. and Manyam, O.K. and Tapaswi, M.",
        TITLE = "Audio-Visual Person Authentication with Multiple Visualized-Speech Features and Multiple Face Profiles",
        BOOKTITLE = ICCVGIP08,
        YEAR = "2008",
        PAGES = "39--46",
        BIBSOURCE = "http://www.visionbib.com/bibliography/people916.html#TT193460"}

@inproceedings{bb198259,
        AUTHOR = "Cao, Y. and Baang, S. and Liu, S.H. and Li, M. and Hu, S.Q.",
        TITLE = "Audio-visual event classification via spatial-temporal-audio words",
        BOOKTITLE = ICPR08,
        YEAR = "2008",
        PAGES = "1--5",
        BIBSOURCE = "http://www.visionbib.com/bibliography/people916.html#TT193461"}

@inproceedings{bb198260,
        AUTHOR = "Terry, L.H. and Shiell, D.J. and Katsaggelos, A.K.",
        TITLE = "Feature space video stream consistency estimation for dynamic stream weighting in audio-visual speech recognition",
        BOOKTITLE = ICIP08,
        YEAR = "2008",
        PAGES = "1316--1319",
        BIBSOURCE = "http://www.visionbib.com/bibliography/people916.html#TT193462"}

@inproceedings{bb198261,
        AUTHOR = "Naseem, I. and Mian, A.S.",
        TITLE = "User Verification by Combining Speech and Face Biometrics in Video",
        BOOKTITLE = ISVC08,
        YEAR = "2008",
        PAGES = "II: 482--492",
        BIBSOURCE = "http://www.visionbib.com/bibliography/people916.html#TT193463"}

@inproceedings{bb198262,
        AUTHOR = "Ettinger, E. and Freund, Y.",
        TITLE = "Coordinate-free calibration of an acoustically driven camera pointing system",
        BOOKTITLE = ICDSC08,
        YEAR = "2008",
        PAGES = "1--9",
        BIBSOURCE = "http://www.visionbib.com/bibliography/people916.html#TT193464"}

@inproceedings{bb198263,
        AUTHOR = "Hung, H. and Friedland, G.",
        TITLE = "Towards Audio-Visual On-line Diarization Of Participants In Group Meetings",
        BOOKTITLE = M2SFA208,
        YEAR = "2008",
        BIBSOURCE = "http://www.visionbib.com/bibliography/people916.html#TT193465"}

@inproceedings{bb198264,
        AUTHOR = "Liu, Y. and Sato, Y.",
        TITLE = "Finding Speaker Face Region by Audiovisual Correlation",
        BOOKTITLE = M2SFA208,
        YEAR = "2008",
        BIBSOURCE = "http://www.visionbib.com/bibliography/people916.html#TT193466"}

@inproceedings{bb198265,
        AUTHOR = "Kelly, D. and Pitie, F. and Kokaram, A. and Boland, F.",
        TITLE = "A Comparative Error Analysis of Audio-Visual Source Localization",
        BOOKTITLE = M2SFA208,
        YEAR = "2008",
        BIBSOURCE = "http://www.visionbib.com/bibliography/people916.html#TT193467"}

@inproceedings{bb198266,
        AUTHOR = "Katsarakis, N. and Talantzis, F. and Pnevmatikakis, A. and Polymenakos, L.",
        TITLE = "The {AIT} {3D} Audio / Visual Person Tracker for {CLEAR} 2007",
        BOOKTITLE = MTPH07,
        YEAR = "2007",
        BIBSOURCE = "http://www.visionbib.com/bibliography/people916.html#TT193468"}

@inproceedings{bb198267,
        AUTHOR = "Pachoud, S. and Gong, S. and Cavallaro, A.",
        TITLE = "Video Augmentation for Improving Audio Speech Recognition under Noise",
        BOOKTITLE = BMVC08,
        YEAR = "2008",
        BIBSOURCE = "http://www.visionbib.com/bibliography/people916.html#TT193469"}

@inproceedings{bb198268,
        AUTHOR = "Horii, Y. and Kawashima, H. and Matsuyama, T.",
        TITLE = "Speaker detection using the timing structure of lip motion and sound",
        BOOKTITLE = CVPR4HB08,
        YEAR = "2008",
        PAGES = "1--8",
        BIBSOURCE = "http://www.visionbib.com/bibliography/people916.html#TT193470"}

@inproceedings{bb198269,
        AUTHOR = "Rua, E.A. and Castro, J.L.A. and Mateo, C.G.",
        TITLE = "Quality-Based Score Normalization for Audiovisual Person Authentication",
        BOOKTITLE = ICIAR08,
        YEAR = "2008",
        BIBSOURCE = "http://www.visionbib.com/bibliography/people916.html#TT193471"}

@inproceedings{bb198270,
        AUTHOR = "Wang, L. and Tjondrongoro, D. and Liu, Y.",
        TITLE = "Clustering and Visualizing Audio-Visual Dataset on Mobile Devices in a Topic-Oriented Manner",
        BOOKTITLE = Visual07,
        YEAR = "2007",
        PAGES = "310--321",
        BIBSOURCE = "http://www.visionbib.com/bibliography/people916.html#TT193472"}

@inproceedings{bb198271,
        AUTHOR = "Zajdel, W. and Krijnders, J.D. and Andringa, T. and Gavrila, D.M.",
        TITLE = "{CASSANDRA}: audio-video sensor fusion for aggression detection",
        BOOKTITLE = AVSBS07,
        YEAR = "2007",
        PAGES = "200--205",
        BIBSOURCE = "http://www.visionbib.com/bibliography/people916.html#TT193473"}

@inproceedings{bb198272,
        AUTHOR = "Stodle, D. and Bjorndalen, J.M. and Anshus, O.J.",
        TITLE = "A System for Hybrid Vision- and Sound-Based Interaction with Distal and Proximal Targets on Wall-Sized, High-Resolution Tiled Displays",
        BOOKTITLE = CVHCI07,
        YEAR = "2007",
        PAGES = "59--68",
        BIBSOURCE = "http://www.visionbib.com/bibliography/people916.html#TT193474"}

@inproceedings{bb198273,
        AUTHOR = "van Hengel, P.W.J. and Andringa, T.C.",
        TITLE = "Verbal aggression detection in complex social environments",
        BOOKTITLE = AVSBS07,
        YEAR = "2007",
        PAGES = "15--20",
        BIBSOURCE = "http://www.visionbib.com/bibliography/people916.html#TT193475"}

@inproceedings{bb198274,
        AUTHOR = "Ikeda, O.",
        TITLE = "Detection of a Speaker in Video by Combined Analysis of Speech Sound and Mouth Movement",
        BOOKTITLE = ISVC07,
        YEAR = "2007",
        PAGES = "II: 602--610",
        BIBSOURCE = "http://www.visionbib.com/bibliography/people916.html#TT193476"}

@inproceedings{bb198275,
        AUTHOR = "Das, A.",
        TITLE = "Audio Visual Person Authentication by Multiple Nearest Neighbor Classifiers",
        BOOKTITLE = ICB07,
        YEAR = "2007",
        PAGES = "1114--1123",
        BIBSOURCE = "http://www.visionbib.com/bibliography/people916.html#TT193477"}

@inproceedings{bb198276,
        AUTHOR = "Xin, L. and Tao, J.H. and Tan, T.N.",
        TITLE = "Dynamic Audio-Visual Mapping using Fused Hidden {Markov} Model Inversion Method",
        BOOKTITLE = ICIP07,
        YEAR = "2007",
        PAGES = "III: 293--296",
        BIBSOURCE = "http://www.visionbib.com/bibliography/people916.html#TT193478"}

@inproceedings{bb198277,
        AUTHOR = "Barzelay, Z. and Schechner, Y.Y.",
        TITLE = "Harmony in Motion",
        BOOKTITLE = CVPR07,
        YEAR = "2007",
        PAGES = "1--8",
        BIBSOURCE = "http://www.visionbib.com/bibliography/people916.html#TT193479"}

@inproceedings{bb198278,
        AUTHOR = "O'Donovan, A. and Duraiswami, R. and Neumann, J.",
        TITLE = "Microphone Arrays as Generalized Cameras for Integrated Audio Visual Processing",
        BOOKTITLE = CVPR07,
        YEAR = "2007",
        PAGES = "1--8",
        BIBSOURCE = "http://www.visionbib.com/bibliography/people916.html#TT193480"}

@inproceedings{bb198279,
        AUTHOR = "Abbas, J. and Dagli, C.K. and Huang, T.S.",
        TITLE = "A Multimodality Framework for Creating Speaker/Non-Speaker Profile Databases for Real-World Video",
        BOOKTITLE = SLAM07,
        YEAR = "2007",
        PAGES = "1--8",
        BIBSOURCE = "http://www.visionbib.com/bibliography/people916.html#TT193481"}

@inproceedings{bb198280,
        AUTHOR = "Kushal, A. and Rahurkar, M. and Fei Fei, L. and Ponce, J. and Huang, T.",
        TITLE = "Audio-Visual Speaker Localization Using Graphical Models",
        BOOKTITLE = ICPR06,
        YEAR = "2006",
        PAGES = "I: 291--294",
        BIBSOURCE = "http://www.visionbib.com/bibliography/people916.html#TT193482"}

@inproceedings{bb198281,
        AUTHOR = "Tsuji, T. and Yamamoto, K. and Ishii, I.",
        TITLE = "Real-time Sound Source Localization Based on Audiovisual Frequency Integration",
        BOOKTITLE = ICPR06,
        YEAR = "2006",
        PAGES = "IV: 322--325",
        BIBSOURCE = "http://www.visionbib.com/bibliography/people916.html#TT193483"}

@inproceedings{bb198282,
  author    = {Monaci, G. and Vandergheynst, P.},
  title     = {Audiovisual Gestalts},
  booktitle = PercOrg06,
  year      = {2006},
  pages     = {200},
  bibsource = {http://www.visionbib.com/bibliography/people916.html#TT193484}
}

@inproceedings{bb198283,
        AUTHOR = "Zhu, Z.G. and Li, W.H. and Molina, E. and Wolberg, G.",
        TITLE = "{LDV} Sensing and Processing for Remote Hearing in a Multimodal Surveillance System",
        BOOKTITLE = MSCSAS07,
        YEAR = "2007",
        PAGES = "1--2",
        BIBSOURCE = "http://www.visionbib.com/bibliography/people916.html#TT193485"}

@inproceedings{bb198284,
        AUTHOR = "Zhu, Z.G. and Li, W.H. and Wolberg, G.",
        TITLE = "Integrating {LDV} Audio and {IR} Video for Remote Multimodal Surveillance",
        BOOKTITLE = OTCBVS05,
        YEAR = "2005",
        PAGES = "III: 10",
        BIBSOURCE = "http://www.visionbib.com/bibliography/people916.html#TT193486"}

@inproceedings{bb198285,
        AUTHOR = "Wu, Z.Y. and Cai, L.H. and Meng, H.",
        TITLE = "Multi-level Fusion of Audio and Visual Features for Speaker Identification",
        BOOKTITLE = ICB06,
        YEAR = "2006",
        PAGES = "493--499",
        BIBSOURCE = "http://www.visionbib.com/bibliography/people916.html#TT193487"}

@inproceedings{bb198286,
        AUTHOR = "Yang, P. and Yang, Y.C. and Wu, Z.H.",
        TITLE = "Exploiting Glottal Information in Speaker Recognition Using Parallel {GMMs}",
        BOOKTITLE = AVBPA05,
        YEAR = "2005",
        PAGES = "804",
        BIBSOURCE = "http://www.visionbib.com/bibliography/people916.html#TT193488"}

@inproceedings{bb198287,
        AUTHOR = "Lei, Z.C.",
        TITLE = "Combining the Likelihood and the {Kullback-Leibler} Distance in Estimating the Universal Background Model for Speaker Verification Using {SVM}",
        BOOKTITLE = ICPR10,
        YEAR = "2010",
        PAGES = "4553--4556",
        BIBSOURCE = "http://www.visionbib.com/bibliography/people916.html#TT193489"}

@inproceedings{bb198288,
        AUTHOR = "Lei, Z.C. and Yang, Y.C. and Wu, Z.H.",
        TITLE = "An {UBM}-Based Reference Space for Speaker Recognition",
        BOOKTITLE = ICPR06,
        YEAR = "2006",
        PAGES = "IV: 318--321",
        BIBSOURCE = "http://www.visionbib.com/bibliography/people916.html#TT193490"}

@inproceedings{bb198289,
        AUTHOR = "Lei, Z.C. and Yang, Y.C. and Wu, Z.H.",
        TITLE = "Constructing the Discriminative Kernels Using {GMM} for Text-Independent Speaker Identification",
        BOOKTITLE = IWBRS05,
        YEAR = "2005",
        PAGES = "165",
        BIBSOURCE = "http://www.visionbib.com/bibliography/people916.html#TT193491"}

@inproceedings{bb198290,
        AUTHOR = "Lei, Z.C. and Yang, Y.C. and Wu, Z.H.",
        TITLE = "Speaker Identification Using the {VQ}-Based Discriminative Kernels",
        BOOKTITLE = AVBPA05,
        YEAR = "2005",
        PAGES = "797",
        BIBSOURCE = "http://www.visionbib.com/bibliography/people916.html#TT193492"}

@inproceedings{bb198291,
        AUTHOR = "Li, D.D. and Yang, Y.C. and Wu, Z.H.",
        TITLE = "Dynamic {Bayesian} Networks for Audio-Visual Speaker Recognition",
        BOOKTITLE = ICB06,
        YEAR = "2006",
        PAGES = "539--545",
        BIBSOURCE = "http://www.visionbib.com/bibliography/people916.html#TT193493"}

@inproceedings{bb198292,
        AUTHOR = "Megherbi, N. and Ambellouis, S. and Colot, O. and Cabestaing, F.",
        TITLE = "Data Association in Multi-Target Tracking Using Belief Theory: Handling Target Emergence and Disappearance Issue",
        BOOKTITLE = AVSBS05,
        YEAR = "2005",
        PAGES = "517--521",
        BIBSOURCE = "http://www.visionbib.com/bibliography/people916.html#TT193494"}

@inproceedings{bb198293,
        AUTHOR = "Megherbi, N. and Ambellouis, S. and Colot, O. and Cabestaing, F.",
        TITLE = "Joint audio-video people tracking using belief theory",
        BOOKTITLE = AVSBS05,
        YEAR = "2005",
        PAGES = "135--140",
        BIBSOURCE = "http://www.visionbib.com/bibliography/people916.html#TT193495"}

@inproceedings{bb198294,
        AUTHOR = "Fox, N.A. and O'Mullane, B.A. and Reilly, R.B.",
        TITLE = "{VALID}: A New Practical Audio-Visual Database, and Comparative Results",
        BOOKTITLE = AVBPA05,
        YEAR = "2005",
        PAGES = "777",
        BIBSOURCE = "http://www.visionbib.com/bibliography/people916.html#TT193496"}

@misc{bb198295,
        AUTHOR = "Sharma, P. and Reilly, R.B.",
        TITLE = "The {UCD} Colour Face Image Database for Face Detection",
        HOWPUBLISHED = "Online",
        YEAR = "1998",
        BIBSOURCE = "http://www.visionbib.com/bibliography/people916.html#TT193497"}

@inproceedings{bb198296,
  author    = {Fox, N.A. and O'Mullane, B.A. and Reilly, R.B.},
  title     = {Audio-Visual Speaker Identification via Adaptive Fusion Using Reliability Estimates of Both Modalities},
  booktitle = AVBPA05,
  year      = {2005},
  pages     = {787},
  bibsource = {http://www.visionbib.com/bibliography/people916.html#TT193498}
}

@inproceedings{bb198297,
        AUTHOR = "Li, X. and Sun, L. and Tao, L.M. and Xu, G.Y. and Jia, Y.",
        TITLE = "A Speaker Tracking Algorithm Based on Audio and Visual Information Fusion Using Particle Filter",
        BOOKTITLE = ICIAR04,
        YEAR = "2004",
        PAGES = "II: 572--580",
        BIBSOURCE = "http://www.visionbib.com/bibliography/people916.html#TT193499"}

@inproceedings{bb198298,
        AUTHOR = "Zhang, D. and Ghobakhlou, A. and Kasabov, N.",
        TITLE = "An adaptive model of person identification combining speech and image information",
        BOOKTITLE = ICARCV04,
        YEAR = "2004",
        PAGES = "I: 413--418",
        BIBSOURCE = "http://www.visionbib.com/bibliography/people916.html#TT193500"}

@inproceedings{bb198299,
        AUTHOR = "Kratt, J. and Metze, F. and Stiefelhagen, R. and Waibel, A.",
        TITLE = "Large Vocabulary Audio-Visual Speech Recognition Using the {Janus} Speech Recognition Toolkit",
        BOOKTITLE = DAGM04,
        YEAR = "2004",
        PAGES = "488--495",
        BIBSOURCE = "http://www.visionbib.com/bibliography/people916.html#TT193501"}

Last update: Aug 4, 2020 at 13:31:31