% Visual question answering references, keys bb198600 through bb198699,
% one inproceedings record per paper.
% BOOKTITLE values (CVPR22, ICCV21, ...) are unquoted, i.e. string-macro
% references; their definitions are not part of these lines.
% NOTE(review): confirm the macro definitions are loaded ahead of these entries.
% BIBSOURCE is presumably the page anchor each record was exported from.
% Page ranges keep their volume prefix (e.g. "II:") exactly as exported.

@inproceedings{bb198600,
  AUTHOR    = "Walmer, M. and Sikka, K. and Sur, I. and Shrivastava, A. and Jha, S.",
  TITLE     = "Dual-Key Multimodal Backdoors for Visual Question Answering",
  BOOKTITLE = CVPR22,
  YEAR      = "2022",
  PAGES     = "15354--15364",
  BIBSOURCE = "http://www.visionbib.com/bibliography/applicat803vqa1.html#TT193801"
}

@inproceedings{bb198601,
  AUTHOR    = "Jing, C. C. and Jia, Y. D. and Wu, Y. W. and Liu, X. Y. and Wu, Q.",
  TITLE     = "Maintaining Reasoning Consistency in Compositional Visual Question Answering",
  BOOKTITLE = CVPR22,
  YEAR      = "2022",
  PAGES     = "5089--5098",
  BIBSOURCE = "http://www.visionbib.com/bibliography/applicat803vqa1.html#TT193802"
}

@inproceedings{bb198602,
  AUTHOR    = "Ding, Y. and Yu, J. and Liu, B. and Hu, Y. and Cui, M. X. and Wu, Q.",
  TITLE     = "{MuKEA}: Multimodal Knowledge Extraction and Accumulation for Knowledge-based Visual Question Answering",
  BOOKTITLE = CVPR22,
  YEAR      = "2022",
  PAGES     = "5079--5088",
  BIBSOURCE = "http://www.visionbib.com/bibliography/applicat803vqa1.html#TT193803"
}

@inproceedings{bb198603,
  AUTHOR    = "Cascante Bonilla, P. and Wu, H. and Wang, L. and Feris, R. and Ordonez, V.",
  TITLE     = "{Sim VQA}: Exploring Simulated Environments for Visual Question Answering",
  BOOKTITLE = CVPR22,
  YEAR      = "2022",
  PAGES     = "5046--5056",
  BIBSOURCE = "http://www.visionbib.com/bibliography/applicat803vqa1.html#TT193804"
}

@inproceedings{bb198604,
  AUTHOR    = "Gao, F. and Ping, Q. and Thattai, G. and Reganti, A. and Wu, Y. N. and Natarajan, P.",
  TITLE     = "Transform-Retrieve-Generate: Natural Language-Centric Outside-Knowledge Visual Question Answering",
  BOOKTITLE = CVPR22,
  YEAR      = "2022",
  PAGES     = "5057--5067",
  BIBSOURCE = "http://www.visionbib.com/bibliography/applicat803vqa1.html#TT193805"
}

@inproceedings{bb198605,
  AUTHOR    = "Gupta, V. and Li, Z. and Kortylewski, A. and Zhang, C. and Li, Y. and Yuille, A. L.",
  TITLE     = "{SwapMix}: Diagnosing and Regularizing the Over-Reliance on Visual Context in Visual Question Answering",
  BOOKTITLE = CVPR22,
  YEAR      = "2022",
  PAGES     = "5068--5078",
  BIBSOURCE = "http://www.visionbib.com/bibliography/applicat803vqa1.html#TT193806"
}

@inproceedings{bb198606,
  AUTHOR    = "Aflalo, E. and Du, M. and Tseng, S. Y. and Liu, Y. F. and Wu, C. and Duan, N. and Lal, V.",
  TITLE     = "{VL-InterpreT}: An Interactive Visualization Tool for Interpreting Vision-Language Transformers",
  BOOKTITLE = CVPR22,
  YEAR      = "2022",
  PAGES     = "21374--21383",
  BIBSOURCE = "http://www.visionbib.com/bibliography/applicat803vqa1.html#TT193807"
}

@inproceedings{bb198607,
  AUTHOR    = "Burghouts, G. J. and Huizinga, W.",
  TITLE     = "Coarse-to-Fine Visual Question Answering by Iterative, Conditional Refinement",
  BOOKTITLE = CIAP22,
  YEAR      = "2022",
  PAGES     = "II:418--428",
  BIBSOURCE = "http://www.visionbib.com/bibliography/applicat803vqa1.html#TT193808"
}

@inproceedings{bb198608,
  AUTHOR    = "Li, Z. W. and Stengel Eskin, E. and Zhang, Y. X. and Xie, C. and Tran, Q. and van Durme, B. and Yuille, A. L.",
  TITLE     = "Calibrating Concepts and Operations: Towards Symbolic Reasoning on Real Images",
  BOOKTITLE = ICCV21,
  YEAR      = "2021",
  PAGES     = "14890--14899",
  BIBSOURCE = "http://www.visionbib.com/bibliography/applicat803vqa1.html#TT193809"
}

@inproceedings{bb198609,
  AUTHOR    = "Kant, Y. and Moudgil, A. and Batra, D. and Parikh, D. and Agrawal, H.",
  TITLE     = "Contrast and Classify: Training Robust {VQA} Models",
  BOOKTITLE = ICCV21,
  YEAR      = "2021",
  PAGES     = "1584--1593",
  BIBSOURCE = "http://www.visionbib.com/bibliography/applicat803vqa1.html#TT193810"
}

@inproceedings{bb198610,
  AUTHOR    = "Han, X. Z. and Wang, S. H. and Su, C. and Huang, Q. M. and Tian, Q.",
  TITLE     = "Greedy Gradient Ensemble for Robust Visual Question Answering",
  BOOKTITLE = ICCV21,
  YEAR      = "2021",
  PAGES     = "1564--1573",
  BIBSOURCE = "http://www.visionbib.com/bibliography/applicat803vqa1.html#TT193811"
}

@inproceedings{bb198611,
  AUTHOR    = "Dancette, C. and Cadene, R. and Teney, D. and Cord, M.",
  TITLE     = "Beyond Question-Based Biases: Assessing Multimodal Shortcut Learning in Visual Question Answering",
  BOOKTITLE = ICCV21,
  YEAR      = "2021",
  PAGES     = "1554--1563",
  BIBSOURCE = "http://www.visionbib.com/bibliography/applicat803vqa1.html#TT193812"
}

@inproceedings{bb198612,
  AUTHOR    = "Zhou, Y. and Ren, T. and Zhu, C. Y. and Sun, X. S. and Liu, J. Z. and Ding, X. H. and Xu, M. L. and Ji, R. R.",
  TITLE     = "{TRAR}: Routing the Attention Spans in Transformer for Visual Question Answering",
  BOOKTITLE = ICCV21,
  YEAR      = "2021",
  PAGES     = "2054--2064",
  BIBSOURCE = "http://www.visionbib.com/bibliography/applicat803vqa1.html#TT193813"
}

@inproceedings{bb198613,
  AUTHOR    = "Yang, X. and Gao, C. Y. and Zhang, H. W. and Cai, J. F.",
  TITLE     = "Auto-Parsing Network for Image Captioning and Visual Question Answering",
  BOOKTITLE = ICCV21,
  YEAR      = "2021",
  PAGES     = "2177--2187",
  BIBSOURCE = "http://www.visionbib.com/bibliography/applicat803vqa1.html#TT193814"
}

@inproceedings{bb198614,
  AUTHOR    = "Banerjee, P. and Gokhale, T. and Yang, Y. Z. and Baral, C.",
  TITLE     = "Weakly Supervised Relative Spatial Reasoning for Visual Question Answering",
  BOOKTITLE = ICCV21,
  YEAR      = "2021",
  PAGES     = "1888--1898",
  BIBSOURCE = "http://www.visionbib.com/bibliography/applicat803vqa1.html#TT193815"
}

@inproceedings{bb198615,
  AUTHOR    = "Cao, Q. X. and Wan, W. T. and Wang, K. and Liang, X. D. and Lin, L.",
  TITLE     = "Linguistically Routing Capsule Network for Out-of-distribution Visual Question Answering",
  BOOKTITLE = ICCV21,
  YEAR      = "2021",
  PAGES     = "1594--1603",
  BIBSOURCE = "http://www.visionbib.com/bibliography/applicat803vqa1.html#TT193816"
}

@inproceedings{bb198616,
  AUTHOR    = "Li, L. J. and Lei, J. and Gan, Z. and Liu, J. J.",
  TITLE     = "Adversarial {VQA}: A New Benchmark for Evaluating the Robustness of {VQA} Models",
  BOOKTITLE = ICCV21,
  YEAR      = "2021",
  PAGES     = "2022--2031",
  BIBSOURCE = "http://www.visionbib.com/bibliography/applicat803vqa1.html#TT193817"
}

@inproceedings{bb198617,
  AUTHOR    = "Askarian, N. and Abbasnejad, E. and Zukerman, I. and Buntine, W. and Haffari, G.",
  TITLE     = "Inductive Biases for Low Data {VQA}: A Data Augmentation Approach",
  BOOKTITLE = Novelty22,
  YEAR      = "2022",
  PAGES     = "231--240",
  BIBSOURCE = "http://www.visionbib.com/bibliography/applicat803vqa1.html#TT193818"
}

@inproceedings{bb198618,
  AUTHOR    = "Mathew, M. and Bagal, V. and Tito, R. and Karatzas, D. and Valveny, E. and Jawahar, C. V.",
  TITLE     = "{InfographicVQA}",
  BOOKTITLE = WACV22,
  YEAR      = "2022",
  PAGES     = "2582--2591",
  BIBSOURCE = "http://www.visionbib.com/bibliography/applicat803vqa1.html#TT193819"
}

@inproceedings{bb198619,
  AUTHOR    = "Kumar, S. and Patro, B. N. and Namboodiri, V. P.",
  TITLE     = "{Auto QA}: The Question Is Not Only What, but Also Where",
  BOOKTITLE = Novelty22,
  YEAR      = "2022",
  PAGES     = "272--281",
  BIBSOURCE = "http://www.visionbib.com/bibliography/applicat803vqa1.html#TT193820"
}

@inproceedings{bb198620,
  AUTHOR    = "Kolling, C. and More, M. and Gavenski, N. and Pooch, E. and Parraga, O. and Barros, R. C.",
  TITLE     = "Efficient Counterfactual Debiasing for Visual Question Answering",
  BOOKTITLE = WACV22,
  YEAR      = "2022",
  PAGES     = "2572--2581",
  BIBSOURCE = "http://www.visionbib.com/bibliography/applicat803vqa1.html#TT193821"
}

@inproceedings{bb198621,
  AUTHOR    = "Jung, S. J. and Byun, J. and Shim, K. and Hwang, S. Y. and Kim, C.",
  TITLE     = "Understanding {VQA} for Negative Answers Through Visual and Linguistic Inference",
  BOOKTITLE = ICIP21,
  YEAR      = "2021",
  PAGES     = "2873--2877",
  BIBSOURCE = "http://www.visionbib.com/bibliography/applicat803vqa1.html#TT193822"
}

@inproceedings{bb198622,
  AUTHOR    = "Felix, R. and Repasky, B. and Hodge, S. and Zolfaghari, R. and Abbasnejad, E. and Sherrah, J.",
  TITLE     = "Cross-Modal Visual Question Answering for Remote Sensing Data",
  BOOKTITLE = DICTA21,
  YEAR      = "2021",
  PAGES     = "1--9",
  BIBSOURCE = "http://www.visionbib.com/bibliography/applicat803vqa1.html#TT193823"
}

@inproceedings{bb198623,
  AUTHOR    = "Le, T. and Nguyen, H. T. and Nguyen, M. L.",
  TITLE     = "Vision and Text Transformer for Predicting Answerability on Visual Question Answering",
  BOOKTITLE = ICIP21,
  YEAR      = "2021",
  PAGES     = "934--938",
  BIBSOURCE = "http://www.visionbib.com/bibliography/applicat803vqa1.html#TT193824"
}

@inproceedings{bb198624,
  AUTHOR    = "Huang, Z. Q. and Zhu, H. Y. and Sun, Y. and Choi, D. and Tan, C. and Lim, J. H.",
  TITLE     = "A Diagnostic Study of Visual Question Answering With Analogical Reasoning",
  BOOKTITLE = ICIP21,
  YEAR      = "2021",
  PAGES     = "2463--2467",
  BIBSOURCE = "http://www.visionbib.com/bibliography/applicat803vqa1.html#TT193825"
}

@inproceedings{bb198625,
  AUTHOR    = "Chen, H. Y. and Liu, R. F. and Peng, B.",
  TITLE     = "Cross-modal Relational Reasoning Network for Visual Question Answering",
  BOOKTITLE = MAIR2-21,
  YEAR      = "2021",
  PAGES     = "3939--3948",
  BIBSOURCE = "http://www.visionbib.com/bibliography/applicat803vqa1.html#TT193826"
}

@inproceedings{bb198626,
  AUTHOR    = "Wang, Z. X. and Miao, Y. and Specia, L.",
  TITLE     = "Latent Variable Models for Visual Question Answering",
  BOOKTITLE = CLVL21,
  YEAR      = "2021",
  PAGES     = "3137--3141",
  BIBSOURCE = "http://www.visionbib.com/bibliography/applicat803vqa1.html#TT193827"
}

@inproceedings{bb198627,
  AUTHOR    = "Hirota, Y. and Garcia, N. and Otani, M. and Chu, C. and Nakashima, Y. and Taniguchi, I. and Onoye, T.",
  TITLE     = "Visual Question Answering with Textual Representations for Images",
  BOOKTITLE = CLVL21,
  YEAR      = "2021",
  PAGES     = "3147--3150",
  BIBSOURCE = "http://www.visionbib.com/bibliography/applicat803vqa1.html#TT193828"
}

@inproceedings{bb198628,
  AUTHOR    = "Ye, K. and Kovashka, A.",
  TITLE     = "Linguistic Structures as Weak Supervision for Visual Scene Graph Generation",
  BOOKTITLE = CVPR21,
  YEAR      = "2021",
  PAGES     = "8285--8295",
  BIBSOURCE = "http://www.visionbib.com/bibliography/applicat803vqa1.html#TT193829"
}

@inproceedings{bb198629,
  AUTHOR    = "Yang, X. and Zhang, H. and Qi, G. J. and Cai, J. F.",
  TITLE     = "Causal Attention for Vision-Language Tasks",
  BOOKTITLE = CVPR21,
  YEAR      = "2021",
  PAGES     = "9842--9852",
  BIBSOURCE = "http://www.visionbib.com/bibliography/applicat803vqa1.html#TT193830"
}

@inproceedings{bb198630,
  AUTHOR    = "Xiao, J. B. and Shang, X. and Yao, A. and Chua, T. S.",
  TITLE     = "{NExT-QA}: Next Phase of Question-Answering to Explaining Temporal Actions",
  BOOKTITLE = CVPR21,
  YEAR      = "2021",
  PAGES     = "9772--9781",
  BIBSOURCE = "http://www.visionbib.com/bibliography/applicat803vqa1.html#TT193831"
}

@inproceedings{bb198631,
  AUTHOR    = "Chen, X. Y. and Jiang, M. and Zhao, Q.",
  TITLE     = "Predicting Human Scanpaths in Visual Question Answering",
  BOOKTITLE = CVPR21,
  YEAR      = "2021",
  PAGES     = "10871--10880",
  BIBSOURCE = "http://www.visionbib.com/bibliography/applicat803vqa1.html#TT193832"
}

@inproceedings{bb198632,
  AUTHOR    = "Qi, Y. G. and Zhang, K. and Sain, A. and Song, Y. Z.",
  TITLE     = "{PQA}: Perceptual Question Answering",
  BOOKTITLE = CVPR21,
  YEAR      = "2021",
  PAGES     = "12051--12059",
  BIBSOURCE = "http://www.visionbib.com/bibliography/applicat803vqa1.html#TT193833"
}

@inproceedings{bb198633,
  AUTHOR    = "Yuan, Y. Y. and Wang, S. and Jiang, M. Y. and Chen, T. Y.",
  TITLE     = "Perception Matters: Detecting Perception Failures of {VQA} Models Using Metamorphic Testing",
  BOOKTITLE = CVPR21,
  YEAR      = "2021",
  PAGES     = "16903--16912",
  BIBSOURCE = "http://www.visionbib.com/bibliography/applicat803vqa1.html#TT193834"
}

@inproceedings{bb198634,
  AUTHOR    = "Marino, K. and Chen, X. L. and Parikh, D. and Gupta, A. and Rohrbach, M.",
  TITLE     = "{KRISP}: Integrating Implicit and Symbolic Knowledge for Open-Domain Knowledge-Based {VQA}",
  BOOKTITLE = CVPR21,
  YEAR      = "2021",
  PAGES     = "14106--14116",
  BIBSOURCE = "http://www.visionbib.com/bibliography/applicat803vqa1.html#TT193835"
}

@inproceedings{bb198635,
  AUTHOR    = "Niu, Y. and Tang, K. and Zhang, H. and Lu, Z. W. and Hua, X. S. and Wen, J. R.",
  TITLE     = "Counterfactual {VQA}: A Cause-Effect Look at Language Bias",
  BOOKTITLE = CVPR21,
  YEAR      = "2021",
  PAGES     = "12695--12705",
  BIBSOURCE = "http://www.visionbib.com/bibliography/applicat803vqa1.html#TT193836"
}

@inproceedings{bb198636,
  AUTHOR    = "Yang, Z. Y. and Lu, Y. J. and Wang, J. F. and Yin, X. and Florencio, D. and Wang, L. J. and Zhang, C. and Zhang, L. and Luo, J. B.",
  TITLE     = "{TAP}: Text-Aware Pre-training for {Text-VQA} and Text-Caption",
  BOOKTITLE = CVPR21,
  YEAR      = "2021",
  PAGES     = "8747--8757",
  BIBSOURCE = "http://www.visionbib.com/bibliography/applicat803vqa1.html#TT193837"
}

@inproceedings{bb198637,
  AUTHOR    = "Kervadec, C. and Jaunet, T. and Antipov, G. and Baccouche, M. and Vuillemot, R. and Wolf, C.",
  TITLE     = "How Transferable are Reasoning Patterns in {VQA}?",
  BOOKTITLE = CVPR21,
  YEAR      = "2021",
  PAGES     = "4205--4214",
  BIBSOURCE = "http://www.visionbib.com/bibliography/applicat803vqa1.html#TT193838"
}

@inproceedings{bb198638,
  AUTHOR    = "Kervadec, C. and Antipov, G. and Baccouche, M. and Wolf, C.",
  TITLE     = "Roses are Red, Violets are Blue{\ldots} But Should {VQA} expect Them To?",
  BOOKTITLE = CVPR21,
  YEAR      = "2021",
  PAGES     = "2775--2784",
  BIBSOURCE = "http://www.visionbib.com/bibliography/applicat803vqa1.html#TT193839"
}

@inproceedings{bb198639,
  AUTHOR    = "Cho, J. W. and Kim, D. J. and Choi, J. and Jung, Y. and Kweon, I. S.",
  TITLE     = "Dealing with Missing Modalities in the Visual Question Answer-Difference Prediction Task through Knowledge Distillation",
  BOOKTITLE = MULA21,
  YEAR      = "2021",
  PAGES     = "1592--1601",
  BIBSOURCE = "http://www.visionbib.com/bibliography/applicat803vqa1.html#TT193840"
}

@inproceedings{bb198640,
  AUTHOR    = "Dua, R. and Kancheti, S. S. and Balasubramanian, V. N.",
  TITLE     = "Beyond {VQA}: Generating Multi-word Answers and Rationales to Visual Questions",
  BOOKTITLE = MULA21,
  YEAR      = "2021",
  PAGES     = "1623--1632",
  BIBSOURCE = "http://www.visionbib.com/bibliography/applicat803vqa1.html#TT193841"
}

@inproceedings{bb198641,
  AUTHOR    = "Rahman, T. and Chou, S. H. and Sigal, L. and Carenini, G.",
  TITLE     = "An Improved Attention for Visual Question Answering",
  BOOKTITLE = MULA21,
  YEAR      = "2021",
  PAGES     = "1653--1662",
  BIBSOURCE = "http://www.visionbib.com/bibliography/applicat803vqa1.html#TT193842"
}

@inproceedings{bb198642,
  AUTHOR    = "Stefanini, M. and Cornia, M. and Baraldi, L. and Cucchiara, R.",
  TITLE     = "A Novel Attention-based Aggregation Function to Combine Vision and Language",
  BOOKTITLE = ICPR21,
  YEAR      = "2021",
  PAGES     = "1212--1219",
  BIBSOURCE = "http://www.visionbib.com/bibliography/applicat803vqa1.html#TT193843"
}

@inproceedings{bb198643,
  AUTHOR    = "Jolly, S. and Palacio, S. and Folz, J. and Raue, F. and Hees, J. and Dengel, A.",
  TITLE     = "P {$\approx$} {NP}, at least in Visual Question Answering",
  BOOKTITLE = ICPR21,
  YEAR      = "2021",
  PAGES     = "2748--2754",
  BIBSOURCE = "http://www.visionbib.com/bibliography/applicat803vqa1.html#TT193844"
}

@inproceedings{bb198644,
  AUTHOR    = "Liang, Y. Y. and Wang, X. and Duan, X. G. and Zhu, W. W.",
  TITLE     = "Multi-modal Contextual Graph Neural Network for Text Visual Question Answering",
  BOOKTITLE = ICPR21,
  YEAR      = "2021",
  PAGES     = "3491--3498",
  BIBSOURCE = "http://www.visionbib.com/bibliography/applicat803vqa1.html#TT193845"
}

@inproceedings{bb198645,
  AUTHOR    = "Farazi, M. and Khan, S. and Barnes, N.",
  TITLE     = "Question-Agnostic Attention for Visual Question Answering",
  BOOKTITLE = ICPR21,
  YEAR      = "2021",
  PAGES     = "3542--3549",
  BIBSOURCE = "http://www.visionbib.com/bibliography/applicat803vqa1.html#TT193846"
}

@inproceedings{bb198646,
  AUTHOR    = "Li, Y. and Lin, Y. and Zhao, H. H. and Wang, D. H.",
  TITLE     = "Dual Path Multi-Modal High-Order Features for Textual Content based Visual Question Answering",
  BOOKTITLE = ICPR21,
  YEAR      = "2021",
  PAGES     = "4324--4331",
  BIBSOURCE = "http://www.visionbib.com/bibliography/applicat803vqa1.html#TT193847"
}

@inproceedings{bb198647,
  AUTHOR    = "Mishra, A. and Anand, A. and Guha, P.",
  TITLE     = "Multi-stage Attention based Visual Question Answering",
  BOOKTITLE = ICPR21,
  YEAR      = "2021",
  PAGES     = "9407--9414",
  BIBSOURCE = "http://www.visionbib.com/bibliography/applicat803vqa1.html#TT193848"
}

@inproceedings{bb198648,
  AUTHOR    = "Bozinis, T. and Passalis, N. and Tefas, A.",
  TITLE     = "Improving Visual Question Answering using Active Perception on Static Images",
  BOOKTITLE = ICPR21,
  YEAR      = "2021",
  PAGES     = "879--884",
  BIBSOURCE = "http://www.visionbib.com/bibliography/applicat803vqa1.html#TT193849"
}

@inproceedings{bb198649,
  AUTHOR    = "Huang, H. T. and Han, T. and Han, W. and Yap, D. and Chiang, C. M.",
  TITLE     = "Answer-checking in Context: A Multi-modal Fully Attention Network for Visual Question Answering",
  BOOKTITLE = ICPR21,
  YEAR      = "2021",
  PAGES     = "1173--1180",
  BIBSOURCE = "http://www.visionbib.com/bibliography/applicat803vqa1.html#TT193850"
}

@inproceedings{bb198650,
  AUTHOR    = "Sun, Q. and Xie, B. H. and Fu, Y. W.",
  TITLE     = "Second Order Enhanced Multi-Glimpse Attention in Visual Question Answering",
  BOOKTITLE = ACCV20,
  YEAR      = "2020",
  PAGES     = "IV:87--103",
  BIBSOURCE = "http://www.visionbib.com/bibliography/applicat803vqa1.html#TT193851"
}

@inproceedings{bb198651,
  AUTHOR    = "Goel, V. and Chandak, M. and Anand, A. and Guha, P.",
  TITLE     = "{IQ-VQA}: Intelligent Visual Question Answering",
  BOOKTITLE = VTIUR20,
  YEAR      = "2020",
  PAGES     = "357--370",
  BIBSOURCE = "http://www.visionbib.com/bibliography/applicat803vqa1.html#TT193852"
}

@inproceedings{bb198652,
  AUTHOR    = "Tan, S. and Xiang, W. and Liu, H. P. and Guo, D. and Sun, F. C.",
  TITLE     = "Multi-agent Embodied Question Answering in Interactive Environments",
  BOOKTITLE = ECCV20,
  YEAR      = "2020",
  PAGES     = "XIII:663--678",
  BIBSOURCE = "http://www.visionbib.com/bibliography/applicat803vqa1.html#TT193853"
}

@inproceedings{bb198653,
  AUTHOR    = "Qiao, Y. and Yu, Z. and Liu, J.",
  TITLE     = "{VC-VQA}: Visual Calibration Mechanism For Visual Question Answering",
  BOOKTITLE = ICIP20,
  YEAR      = "2020",
  PAGES     = "1481--1485",
  BIBSOURCE = "http://www.visionbib.com/bibliography/applicat803vqa1.html#TT193854"
}

@inproceedings{bb198654,
  AUTHOR    = "Jain, V. and Lodhavia, J.",
  TITLE     = "Automatic Question Tagging using k-Nearest Neighbors and Random Forest",
  BOOKTITLE = ISCV20,
  YEAR      = "2020",
  PAGES     = "1--4",
  BIBSOURCE = "http://www.visionbib.com/bibliography/applicat803vqa1.html#TT193855"
}

@inproceedings{bb198655,
  AUTHOR    = "Tang, R. X. and Ma, C. and Zhang, W. E. and Wu, Q. and Yang, X. K.",
  TITLE     = "Semantic Equivalent Adversarial Data Augmentation for Visual Question Answering",
  BOOKTITLE = ECCV20,
  YEAR      = "2020",
  PAGES     = "XIX:437--453",
  BIBSOURCE = "http://www.visionbib.com/bibliography/applicat803vqa1.html#TT193856"
}

@inproceedings{bb198656,
  AUTHOR    = "Gokhale, T. and Banerjee, P. and Baral, C. and Yang, Y. Z.",
  TITLE     = "{VQA-LOL}: Visual Question Answering Under the Lens of Logic",
  BOOKTITLE = ECCV20,
  YEAR      = "2020",
  PAGES     = "XXI:379--396",
  BIBSOURCE = "http://www.visionbib.com/bibliography/applicat803vqa1.html#TT193857"
}

@inproceedings{bb198657,
  AUTHOR    = "Yang, X. F. and Lin, G. S. and Lv, F. M. and Liu, F. Y.",
  TITLE     = "{TRRNET}: Tiered Relation Reasoning for Compositional Visual Question Answering",
  BOOKTITLE = ECCV20,
  YEAR      = "2020",
  PAGES     = "XXI:414--430",
  BIBSOURCE = "http://www.visionbib.com/bibliography/applicat803vqa1.html#TT193858"
}

@inproceedings{bb198658,
  AUTHOR    = "Bansal, A. and Zhang, Y. and Chellappa, R.",
  TITLE     = "Visual Question Answering on Image Sets",
  BOOKTITLE = ECCV20,
  YEAR      = "2020",
  PAGES     = "XXI:51--67",
  BIBSOURCE = "http://www.visionbib.com/bibliography/applicat803vqa1.html#TT193859"
}

@inproceedings{bb198659,
  AUTHOR    = "Han, X. Z. and Wang, S. H. and Su, C. and Zhang, W. G. and Huang, Q. M. and Tian, Q.",
  TITLE     = "Interpretable Visual Reasoning via Probabilistic Formulation Under Natural Supervision",
  BOOKTITLE = ECCV20,
  YEAR      = "2020",
  PAGES     = "IX:553--570",
  BIBSOURCE = "http://www.visionbib.com/bibliography/applicat803vqa1.html#TT193860"
}

@inproceedings{bb198660,
  AUTHOR    = "Kant, Y. and Batra, D. and Anderson, P. and Schwing, A. and Parikh, D. and Lu, J. and Agrawal, H.",
  TITLE     = "Spatially Aware Multimodal Transformers for {TextVQA}",
  BOOKTITLE = ECCV20,
  YEAR      = "2020",
  PAGES     = "IX:715--732",
  BIBSOURCE = "http://www.visionbib.com/bibliography/applicat803vqa1.html#TT193861"
}

@inproceedings{bb198661,
  AUTHOR    = "Li, Q. and Huang, S. Y. and Hong, Y. and Zhu, S. C.",
  TITLE     = "A Competence-aware Curriculum for Visual Concepts Learning via Question Answering",
  BOOKTITLE = ECCV20,
  YEAR      = "2020",
  PAGES     = "II:141--157",
  BIBSOURCE = "http://www.visionbib.com/bibliography/applicat803vqa1.html#TT193862"
}

@inproceedings{bb198662,
  AUTHOR    = "Zheng, W. B. and Yan, L. and Gou, C. and Wang, F. Y.",
  TITLE     = "Webly Supervised Knowledge Embedding Model for Visual Reasoning",
  BOOKTITLE = CVPR20,
  YEAR      = "2020",
  PAGES     = "12442--12451",
  BIBSOURCE = "http://www.visionbib.com/bibliography/applicat803vqa1.html#TT193863"
}

@inproceedings{bb198663,
  AUTHOR    = "Wang, P. and Wu, Q. and Cao, J. W. and Shen, C. H. and Gao, L. L. and van den Hengel, A. J.",
  TITLE     = "Neighbourhood Watch: Referring Expression Comprehension via Language-Guided Graph Attention Networks",
  BOOKTITLE = CVPR19,
  YEAR      = "2019",
  PAGES     = "1960--1968",
  BIBSOURCE = "http://www.visionbib.com/bibliography/applicat803vqa1.html#TT193864"
}

@inproceedings{bb198664,
  AUTHOR    = "Bajaj, G. and Bandyopadhyay, B. and Schmidt, D. and Maneriker, P. and Myers, C. and Parthasarathy, S.",
  TITLE     = "Understanding Knowledge Gaps in Visual Question Answering: Implications for Gap Identification and Testing",
  BOOKTITLE = MVM20,
  YEAR      = "2020",
  PAGES     = "1563--1566",
  BIBSOURCE = "http://www.visionbib.com/bibliography/applicat803vqa1.html#TT193865"
}

@inproceedings{bb198665,
  AUTHOR    = "Chen, L. and Yan, X. and Xiao, J. and Zhang, H. and Pu, S. and Zhuang, Y.",
  TITLE     = "Counterfactual Samples Synthesizing for Robust Visual Question Answering",
  BOOKTITLE = CVPR20,
  YEAR      = "2020",
  PAGES     = "10797--10806",
  BIBSOURCE = "http://www.visionbib.com/bibliography/applicat803vqa1.html#TT193866"
}

@inproceedings{bb198666,
  AUTHOR    = "Vatashsky, B. and Ullman, S.",
  TITLE     = "{VQA} With No Questions-Answers Training",
  BOOKTITLE = CVPR20,
  YEAR      = "2020",
  PAGES     = "10373--10383",
  BIBSOURCE = "http://www.visionbib.com/bibliography/applicat803vqa1.html#TT193867"
}

@inproceedings{bb198667,
  AUTHOR    = "Jiang, H. and Misra, I. and Rohrbach, M. and Learned Miller, E. G. and Chen, X.",
  TITLE     = "In Defense of Grid Features for Visual Question Answering",
  BOOKTITLE = CVPR20,
  YEAR      = "2020",
  PAGES     = "10264--10273",
  BIBSOURCE = "http://www.visionbib.com/bibliography/applicat803vqa1.html#TT193868"
}

@inproceedings{bb198668,
  AUTHOR    = "Wang, X. and Liu, Y. and Shen, C. and Ng, C. C. and Luo, C. and Jin, L. and Chan, C. S. and van den Hengel, A. and Wang, L.",
  TITLE     = "On the General Value of Evidence, and Bilingual Scene-Text Visual Question Answering",
  BOOKTITLE = CVPR20,
  YEAR      = "2020",
  PAGES     = "10123--10132",
  BIBSOURCE = "http://www.visionbib.com/bibliography/applicat803vqa1.html#TT193869"
}

@inproceedings{bb198669,
  AUTHOR    = "Xiong, P. and Wu, Y.",
  TITLE     = "{TA-Student VQA}: Multi-Agents Training by Self-Questioning",
  BOOKTITLE = CVPR20,
  YEAR      = "2020",
  PAGES     = "10062--10072",
  BIBSOURCE = "http://www.visionbib.com/bibliography/applicat803vqa1.html#TT193870"
}

@inproceedings{bb198670,
  AUTHOR    = "Agarwal, V. and Shetty, R. and Fritz, M.",
  TITLE     = "Towards Causal {VQA}: Revealing and Reducing Spurious Correlations by Invariant and Covariant Semantic Editing",
  BOOKTITLE = CVPR20,
  YEAR      = "2020",
  PAGES     = "9687--9695",
  BIBSOURCE = "http://www.visionbib.com/bibliography/applicat803vqa1.html#TT193871"
}

@inproceedings{bb198671,
  AUTHOR    = "Hu, R. and Singh, A. and Darrell, T. J. and Rohrbach, M.",
  TITLE     = "Iterative Answer Prediction With Pointer-Augmented Multimodal Transformers for {TextVQA}",
  BOOKTITLE = CVPR20,
  YEAR      = "2020",
  PAGES     = "9989--9999",
  BIBSOURCE = "http://www.visionbib.com/bibliography/applicat803vqa1.html#TT193872"
}

@inproceedings{bb198672,
  AUTHOR    = "Kafle, K. and Shrestha, R. and Price, B. and Cohen, S. and Kanan, C.",
  TITLE     = "Answering Questions about Data Visualizations using Efficient Bimodal Fusion",
  BOOKTITLE = WACV20,
  YEAR      = "2020",
  PAGES     = "1487--1496",
  BIBSOURCE = "http://www.visionbib.com/bibliography/applicat803vqa1.html#TT193873"
}

@inproceedings{bb198673,
  AUTHOR    = "Patro, B. N. and Kurmi, V. K. and Kumar, S. and Namboodiri, V. P.",
  TITLE     = "Deep {Bayesian} Network for Visual Question Generation",
  BOOKTITLE = WACV20,
  YEAR      = "2020",
  PAGES     = "1555--1565",
  BIBSOURCE = "http://www.visionbib.com/bibliography/applicat803vqa1.html#TT193874"
}

@inproceedings{bb198674,
  AUTHOR    = "Patro, B. N. and Patel, S. and Namboodiri, V. P.",
  TITLE     = "Robust Explanations for Visual Question Answering",
  BOOKTITLE = WACV20,
  YEAR      = "2020",
  PAGES     = "1566--1575",
  BIBSOURCE = "http://www.visionbib.com/bibliography/applicat803vqa1.html#TT193875"
}

@inproceedings{bb198675,
  AUTHOR    = "Chou, S. and Chao, W. and Lai, W. and Sun, M. and Yang, M.",
  TITLE     = "Visual Question Answering on {$360^{\circ}$} Images",
  BOOKTITLE = WACV20,
  YEAR      = "2020",
  PAGES     = "1596--1605",
  BIBSOURCE = "http://www.visionbib.com/bibliography/applicat803vqa1.html#TT193876"
}

@inproceedings{bb198676,
  AUTHOR    = "Chaudhry, R. and Shekhar, S. and Gupta, U. and Maneriker, P. and Bansal, P. and Joshi, A.",
  TITLE     = "{LEAF-QA}: Locate, Encode Attend for Figure Question Answering",
  BOOKTITLE = WACV20,
  YEAR      = "2020",
  PAGES     = "3501--3510",
  BIBSOURCE = "http://www.visionbib.com/bibliography/applicat803vqa1.html#TT193877"
}

@inproceedings{bb198677,
  AUTHOR    = "Liang, Y. Z. and Bai, Y. L. and Zhang, W. and Qian, X. M. and Zhu, L. and Mei, T.",
  TITLE     = "{VrR-VG}: Refocusing Visually-Relevant Relationships",
  BOOKTITLE = ICCV19,
  YEAR      = "2019",
  PAGES     = "10402--10411",
  BIBSOURCE = "http://www.visionbib.com/bibliography/applicat803vqa1.html#TT193878"
}

@inproceedings{bb198678,
  AUTHOR    = "Singh, A. K. and Mishra, A. and Shekhar, S. and Chakraborty, A.",
  TITLE     = "From Strings to Things: Knowledge-Enabled {VQA} Model That Can Read and Reason",
  BOOKTITLE = ICCV19,
  YEAR      = "2019",
  PAGES     = "4601--4611",
  BIBSOURCE = "http://www.visionbib.com/bibliography/applicat803vqa1.html#TT193879"
}

@inproceedings{bb198679,
  AUTHOR    = "Bhattacharya, N. and Li, Q. and Gurari, D.",
  TITLE     = "Why Does a Visual Question Have Different Answers?",
  BOOKTITLE = ICCV19,
  YEAR      = "2019",
  PAGES     = "4270--4279",
  BIBSOURCE = "http://www.visionbib.com/bibliography/applicat803vqa1.html#TT193880"
}

@inproceedings{bb198680,
  AUTHOR    = "Li, L. and Gan, Z. and Cheng, Y. and Liu, J.",
  TITLE     = "Relation-Aware Graph Attention Network for Visual Question Answering",
  BOOKTITLE = ICCV19,
  YEAR      = "2019",
  PAGES     = "10312--10321",
  BIBSOURCE = "http://www.visionbib.com/bibliography/applicat803vqa1.html#TT193881"
}

@inproceedings{bb198681,
  AUTHOR    = "Peng, G. and You, H. X. and Zhang, Z. P. and Wang, X. G. and Li, H. S.",
  TITLE     = "Multi-Modality Latent Interaction Network for Visual Question Answering",
  BOOKTITLE = ICCV19,
  YEAR      = "2019",
  PAGES     = "5824--5834",
  BIBSOURCE = "http://www.visionbib.com/bibliography/applicat803vqa1.html#TT193882"
}

@inproceedings{bb198682,
  AUTHOR    = "Do, T. and Tran, H. and Do, T. and Tjiputra, E. and Tran, Q.",
  TITLE     = "Compact Trilinear Interaction for Visual Question Answering",
  BOOKTITLE = ICCV19,
  YEAR      = "2019",
  PAGES     = "392--401",
  BIBSOURCE = "http://www.visionbib.com/bibliography/applicat803vqa1.html#TT193883"
}

@inproceedings{bb198683,
  AUTHOR    = "Nguyen, D. K. and Okatani, T.",
  TITLE     = "Multi-Task Learning of Hierarchical Vision-Language Representation",
  BOOKTITLE = CVPR19,
  YEAR      = "2019",
  PAGES     = "10484--10493",
  BIBSOURCE = "http://www.visionbib.com/bibliography/applicat803vqa1.html#TT193884"
}

@inproceedings{bb198684,
  AUTHOR    = "Schwartz, I. and Yu, S. and Hazan, T. and Schwing, A. G.",
  TITLE     = "Factor Graph Attention",
  BOOKTITLE = CVPR19,
  YEAR      = "2019",
  PAGES     = "2039--2048",
  BIBSOURCE = "http://www.visionbib.com/bibliography/applicat803vqa1.html#TT193885"
}

@inproceedings{bb198685,
  AUTHOR    = "Kolesnikov, A. and Beyer, L. and Zhai, X. H. and Puigcerver, J. and Yung, J. and Gelly, S. and Houlsby, N.",
  TITLE     = "Big Transfer ({BIT}): General Visual Representation Learning",
  BOOKTITLE = ECCV20,
  YEAR      = "2020",
  PAGES     = "V:491--507",
  BIBSOURCE = "http://www.visionbib.com/bibliography/applicat803vqa1.html#TT193886"
}

@inproceedings{bb198686,
  AUTHOR    = "Kolesnikov, A. and Zhai, X. H. and Beyer, L.",
  TITLE     = "Revisiting Self-Supervised Visual Representation Learning",
  BOOKTITLE = CVPR19,
  YEAR      = "2019",
  PAGES     = "1920--1929",
  BIBSOURCE = "http://www.visionbib.com/bibliography/applicat803vqa1.html#TT193887"
}

@inproceedings{bb198687,
  AUTHOR    = "Xiong, P. X. and Zhan, H. Y. and Wang, X. and Sinha, B. and Wu, Y.",
  TITLE     = "Visual Query Answering by Entity-Attribute Graph Matching and Reasoning",
  BOOKTITLE = CVPR19,
  YEAR      = "2019",
  PAGES     = "8349--8358",
  BIBSOURCE = "http://www.visionbib.com/bibliography/applicat803vqa1.html#TT193888"
}

@inproceedings{bb198688,
  AUTHOR    = "Singh, A. and Natarajan, V. and Shah, M. and Jiang, Y. and Chen, X. L. and Batra, D. and Parikh, D. and Rohrbach, M.",
  TITLE     = "Towards {VQA} Models That Can Read",
  BOOKTITLE = CVPR19,
  YEAR      = "2019",
  PAGES     = "8309--8318",
  BIBSOURCE = "http://www.visionbib.com/bibliography/applicat803vqa1.html#TT193889"
}

@inproceedings{bb198689,
  AUTHOR    = "Manjunatha, V. and Saini, N. and Davis, L. S.",
  TITLE     = "Explicit Bias Discovery in Visual Question Answering Models",
  BOOKTITLE = CVPR19,
  YEAR      = "2019",
  PAGES     = "9554--9563",
  BIBSOURCE = "http://www.visionbib.com/bibliography/applicat803vqa1.html#TT193890"
}

@inproceedings{bb198690,
  AUTHOR    = "Shrestha, R. and Kafle, K. and Kanan, C.",
  TITLE     = "Answer Them All! Toward Universal Visual Question Answering Models",
  BOOKTITLE = CVPR19,
  YEAR      = "2019",
  PAGES     = "10464--10473",
  BIBSOURCE = "http://www.visionbib.com/bibliography/applicat803vqa1.html#TT193891"
}

@inproceedings{bb198691,
  AUTHOR    = "Wilf, A. and Ma, M. Q. and Liang, P. P. and Zadeh, A. and Morency, L. P.",
  TITLE     = "Face-to-Face Contrastive Learning for Social Intelligence Question-Answering",
  BOOKTITLE = FG23,
  YEAR      = "2023",
  PAGES     = "1--7",
  BIBSOURCE = "http://www.visionbib.com/bibliography/applicat803vqa1.html#TT193892"
}

@inproceedings{bb198692,
  AUTHOR    = "Zadeh, A. and Chan, M. and Liang, P. P. and Tong, E. and Morency, L. P.",
  TITLE     = "{Social-IQ}: A Question Answering Benchmark for Artificial Social Intelligence",
  BOOKTITLE = CVPR19,
  YEAR      = "2019",
  PAGES     = "8799--8809",
  BIBSOURCE = "http://www.visionbib.com/bibliography/applicat803vqa1.html#TT193893"
}

@inproceedings{bb198693,
  AUTHOR    = "Noh, H. and Kim, T. and Mun, J. and Han, B. H.",
  TITLE     = "Transfer Learning via Unsupervised Task Discovery for Visual Question Answering",
  BOOKTITLE = CVPR19,
  YEAR      = "2019",
  PAGES     = "8377--8386",
  BIBSOURCE = "http://www.visionbib.com/bibliography/applicat803vqa1.html#TT193894"
}

@inproceedings{bb198694,
  AUTHOR    = "Wijmans, E. and Datta, S. and Maksymets, O. and Das, A. and Gkioxari, G. and Lee, S. and Essa, I. and Parikh, D. and Batra, D.",
  TITLE     = "Embodied Question Answering in Photorealistic Environments With Point Cloud Perception",
  BOOKTITLE = CVPR19,
  YEAR      = "2019",
  PAGES     = "6652--6661",
  BIBSOURCE = "http://www.visionbib.com/bibliography/applicat803vqa1.html#TT193895"
}

@inproceedings{bb198695,
  AUTHOR    = "Shah, M. and Chen, X. L. and Rohrbach, M. and Parikh, D.",
  TITLE     = "Cycle-Consistency for Robust Visual Question Answering",
  BOOKTITLE = CVPR19,
  YEAR      = "2019",
  PAGES     = "6642--6651",
  BIBSOURCE = "http://www.visionbib.com/bibliography/applicat803vqa1.html#TT193896"
}

@inproceedings{bb198696,
  AUTHOR    = "Li, H. and Wang, P. and Shen, C. H. and van den Hengel, A.",
  TITLE     = "Visual Question Answering as Reading Comprehension",
  BOOKTITLE = CVPR19,
  YEAR      = "2019",
  PAGES     = "6312--6321",
  BIBSOURCE = "http://www.visionbib.com/bibliography/applicat803vqa1.html#TT193897"
}

@inproceedings{bb198697,
  AUTHOR    = "Yu, L. C. and Chen, X. L. and Gkioxari, G. and Bansal, M. and Berg, T. L. and Batra, D.",
  TITLE     = "Multi-Target Embodied Question Answering",
  BOOKTITLE = CVPR19,
  YEAR      = "2019",
  PAGES     = "6302--6311",
  BIBSOURCE = "http://www.visionbib.com/bibliography/applicat803vqa1.html#TT193898"
}

@inproceedings{bb198698,
  AUTHOR    = "Yu, Z. and Yu, J. and Cui, Y. and Tao, D. C. and Tian, Q.",
  TITLE     = "Deep Modular Co-Attention Networks for Visual Question Answering",
  BOOKTITLE = CVPR19,
  YEAR      = "2019",
  PAGES     = "6274--6283",
  BIBSOURCE = "http://www.visionbib.com/bibliography/applicat803vqa1.html#TT193899"
}

@inproceedings{bb198699,
  AUTHOR    = "Abbasnejad, E. and Wu, Q. and Shi, Q. F. and van den Hengel, A.",
  TITLE     = "What's to Know? Uncertainty as a Guide to Asking Goal-Oriented Questions",
  BOOKTITLE = CVPR19,
  YEAR      = "2019",
  PAGES     = "4150--4159",
  BIBSOURCE = "http://www.visionbib.com/bibliography/applicat803vqa1.html#TT193900"
}