@comment{
  Entries bb198500 through bb198599. Every BIBSOURCE field points at
  www.visionbib.com/bibliography/applicat803vqa1.html, presumably the
  visual question answering section of that bibliography.
  Conventions used below:
    - JOURNAL and BOOKTITLE values without quotes are string macros that must
      be defined elsewhere; their definitions are not part of this chunk.
    - MONTH uses the standard three-letter macros, page ranges use a double
      hyphen, and acronyms or model names inside titles are brace-protected
      so that sentence-casing styles keep their capitalisation.
    - BIBSOURCE is a non-standard provenance field; it is kept verbatim.
  NOTE(review): BOOKTITLE for ICPR22 is a quoted literal while other venues
  (ICCV15, CVPR22, ICPR21, ...) are macros. Left unchanged because it cannot
  be seen from here whether an ICPR22 macro exists - TODO confirm.
}

@inproceedings{bb198500,
  AUTHOR    = "Malinowski, M. and Rohrbach, M. and Fritz, M.",
  TITLE     = "Ask Your Neurons: A Neural-Based Approach to Answering Questions about Images",
  BOOKTITLE = ICCV15,
  YEAR      = "2015",
  PAGES     = "1--9",
  BIBSOURCE = "http://www.visionbib.com/bibliography/applicat803vqa1.html#TT193702"
}

@article{bb198501,
  AUTHOR    = "Tamaazousti, Y. and Le Borgne, H. and Popescu, A. and Gadeski, E. and Ginsca, A. and Hudelot, C.",
  TITLE     = "Vision-language integration using constrained local semantic features",
  JOURNAL   = CVIU,
  VOLUME    = "163",
  YEAR      = "2017",
  NUMBER    = "1",
  PAGES     = "41--57",
  BIBSOURCE = "http://www.visionbib.com/bibliography/applicat803vqa1.html#TT193703"
}

@article{bb198502,
  AUTHOR    = "Das, A. and Agrawal, H. and Zitnick, L. and Parikh, D. and Batra, D.",
  TITLE     = "Human Attention in Visual Question Answering: Do Humans and Deep Networks Look at the Same Regions?",
  JOURNAL   = CVIU,
  VOLUME    = "163",
  YEAR      = "2017",
  NUMBER    = "1",
  PAGES     = "90--100",
  BIBSOURCE = "http://www.visionbib.com/bibliography/applicat803vqa1.html#TT193704"
}

@article{bb198503,
  AUTHOR    = "Lioutas, V. and Passalis, N. and Tefas, A.",
  TITLE     = "Explicit ensemble attention learning for improving visual question answering",
  JOURNAL   = PRL,
  VOLUME    = "111",
  YEAR      = "2018",
  PAGES     = "51--57",
  BIBSOURCE = "http://www.visionbib.com/bibliography/applicat803vqa1.html#TT193705"
}

@article{bb198504,
  AUTHOR    = "Huang, Y.Z. and Zhong, T.",
  TITLE     = "Multitask learning for neural generative question answering",
  JOURNAL   = RealTimeIP,
  VOLUME    = "14",
  YEAR      = "2018",
  NUMBER    = "1",
  MONTH     = jan,
  PAGES     = "1009--1017",
  BIBSOURCE = "http://www.visionbib.com/bibliography/applicat803vqa1.html#TT193706"
}

@article{bb198505,
  AUTHOR    = "Zhang, Q.S. and Wu, Y.N. and Zhang, H. and Zhu, S.C.",
  TITLE     = "Mining deep {And-Or} object structures via cost-sensitive question-answer-based active annotations",
  JOURNAL   = CVIU,
  VOLUME    = "176-177",
  YEAR      = "2018",
  PAGES     = "33--44",
  BIBSOURCE = "http://www.visionbib.com/bibliography/applicat803vqa1.html#TT193707"
}

@article{bb198506,
  AUTHOR    = "Zhang, Q.S. and Ren, J. and Huang, G. and Cao, R.M. and Wu, Y.N. and Zhu, S.C.",
  TITLE     = "Mining Interpretable {AOG} Representations From Convolutional Networks via Active Question Answering",
  JOURNAL   = PAMI,
  VOLUME    = "43",
  YEAR      = "2021",
  NUMBER    = "11",
  MONTH     = nov,
  PAGES     = "3949--3963",
  BIBSOURCE = "http://www.visionbib.com/bibliography/applicat803vqa1.html#TT193708"
}

@inproceedings{bb198507,
  AUTHOR    = "Zhang, Q.S. and Cao, R.M. and Wu, Y.N. and Zhu, S.C.",
  TITLE     = "Mining Object Parts from {CNNs} via Active Question-Answering",
  BOOKTITLE = CVPR17,
  YEAR      = "2017",
  PAGES     = "3890--3899",
  BIBSOURCE = "http://www.visionbib.com/bibliography/applicat803vqa1.html#TT193709"
}

@inproceedings{bb198508,
  AUTHOR    = "Zhang, Q.S. and Wu, Y.N. and Zhu, S.C.",
  TITLE     = "Mining {And-Or} Graphs for Graph Matching and Object Discovery",
  BOOKTITLE = ICCV15,
  YEAR      = "2015",
  PAGES     = "55--63",
  BIBSOURCE = "http://www.visionbib.com/bibliography/applicat803vqa1.html#TT193710"
}

@article{bb198509,
  AUTHOR    = "Garg, S. and Srivastava, R.",
  TITLE     = "Object sequences: encoding categorical and spatial information for a yes/no visual question answering task",
  JOURNAL   = IET-CV,
  VOLUME    = "12",
  YEAR      = "2018",
  NUMBER    = "8",
  MONTH     = dec,
  PAGES     = "1141--1150",
  BIBSOURCE = "http://www.visionbib.com/bibliography/applicat803vqa1.html#TT193711"
}

@article{bb198510,
  AUTHOR    = "Goyal, Y. and Khot, T. and Agrawal, A. and Summers Stay, D. and Batra, D. and Parikh, D.",
  TITLE     = "Making the {V} in {VQA} Matter: Elevating the Role of Image Understanding in Visual Question Answering",
  JOURNAL   = IJCV,
  VOLUME    = "127",
  YEAR      = "2019",
  NUMBER    = "4",
  MONTH     = apr,
  PAGES     = "398--414",
  BIBSOURCE = "http://www.visionbib.com/bibliography/applicat803vqa1.html#TT193712"
}

@inproceedings{bb198511,
  AUTHOR    = "Goyal, Y. and Khot, T. and Summers Stay, D. and Batra, D. and Parikh, D.",
  TITLE     = "Making the {V} in {VQA} Matter: Elevating the Role of Image Understanding in Visual Question Answering",
  BOOKTITLE = CVPR17,
  YEAR      = "2017",
  PAGES     = "6325--6334",
  BIBSOURCE = "http://www.visionbib.com/bibliography/applicat803vqa1.html#TT193712"
}

@article{bb198512,
  AUTHOR    = "Fang, Z.W. and Liu, J. and Li, Y. and Qiao, Y.Y. and Lu, H.Q.",
  TITLE     = "Improving visual question answering using dropout and enhanced question encoder",
  JOURNAL   = PR,
  VOLUME    = "90",
  YEAR      = "2019",
  PAGES     = "404--414",
  BIBSOURCE = "http://www.visionbib.com/bibliography/applicat803vqa1.html#TT193713"
}

@article{bb198513,
  AUTHOR    = "Osman, A. and Samek, W.",
  TITLE     = "{DRAU}: Dual Recurrent Attention Units for Visual Question Answering",
  JOURNAL   = CVIU,
  VOLUME    = "185",
  YEAR      = "2019",
  PAGES     = "24--30",
  BIBSOURCE = "http://www.visionbib.com/bibliography/applicat803vqa1.html#TT193714"
}

@article{bb198514,
  AUTHOR    = "Toor, A.S. and Wechsler, H. and Nappi, M.",
  TITLE     = "Biometric surveillance using visual question answering",
  JOURNAL   = PRL,
  VOLUME    = "126",
  YEAR      = "2019",
  PAGES     = "111--118",
  BIBSOURCE = "http://www.visionbib.com/bibliography/applicat803vqa1.html#TT193715"
}

@article{bb198515,
  AUTHOR    = "Ruwa, N. and Mao, Q. and Song, H.P. and Jia, H.J. and Dong, M.",
  TITLE     = "Triple attention network for sentimental visual question answering",
  JOURNAL   = CVIU,
  VOLUME    = "189",
  YEAR      = "2019",
  PAGES     = "102829",
  BIBSOURCE = "http://www.visionbib.com/bibliography/applicat803vqa1.html#TT193716"
}

@comment{
  NOTE(review): PAGES of bb198516 below holds the literal placeholder xx-yy.
  It is kept verbatim because the real page or article number is not
  available in this file - TODO look it up and replace.
}

@article{bb198516,
  AUTHOR    = "Li, W.W. and Song, M.M. and Tian, Y.Y.",
  TITLE     = "An Ontology-Driven Cyberinfrastructure for Intelligent Spatiotemporal Question Answering and Open Knowledge Discovery",
  JOURNAL   = IJGI,
  VOLUME    = "8",
  YEAR      = "2019",
  NUMBER    = "11",
  PAGES     = "xx-yy",
  BIBSOURCE = "http://www.visionbib.com/bibliography/applicat803vqa1.html#TT193717"
}

@article{bb198517,
  AUTHOR    = "Xi, Y.L. and Zhang, Y.N. and Ding, S.T. and Wan, S.H.",
  TITLE     = "Visual Question Answering Model Based on Visual Relationship Detection",
  JOURNAL   = SP:IC,
  VOLUME    = "80",
  YEAR      = "2020",
  PAGES     = "115648",
  BIBSOURCE = "http://www.visionbib.com/bibliography/applicat803vqa1.html#TT193718"
}

@article{bb198518,
  AUTHOR    = "Wu, Y. and Jiang, L. and Yang, Y.",
  TITLE     = "Revisiting {EmbodiedQA}: A Simple Baseline and Beyond",
  JOURNAL   = IP,
  VOLUME    = "29",
  YEAR      = "2020",
  PAGES     = "3984--3992",
  BIBSOURCE = "http://www.visionbib.com/bibliography/applicat803vqa1.html#TT193719"
}

@article{bb198519,
  AUTHOR    = "Huang, C. and Yao, L. and Wang, X.Z. and Benatallah, B. and Zhang, X.",
  TITLE     = "Software expert discovery via knowledge domain embeddings in a collaborative network",
  JOURNAL   = PRL,
  VOLUME    = "130",
  YEAR      = "2020",
  PAGES     = "46--53",
  BIBSOURCE = "http://www.visionbib.com/bibliography/applicat803vqa1.html#TT193720"
}

@article{bb198520,
  AUTHOR    = "Li, W. and Sun, J.H. and Liu, G. and Zhao, L. and Fang, X.Z.",
  TITLE     = "Visual question answering with attention transfer and a cross-modal gating mechanism",
  JOURNAL   = PRL,
  VOLUME    = "133",
  YEAR      = "2020",
  PAGES     = "334--340",
  BIBSOURCE = "http://www.visionbib.com/bibliography/applicat803vqa1.html#TT193721"
}

@article{bb198521,
  AUTHOR    = "Messina, N. and Amato, G. and Carrara, F. and Falchi, F. and Gennaro, C.",
  TITLE     = "Learning visual features for relational {CBIR}",
  JOURNAL   = MultInfoRetr,
  VOLUME    = "9",
  YEAR      = "2020",
  NUMBER    = "2",
  MONTH     = jun,
  PAGES     = "113--124",
  BIBSOURCE = "http://www.visionbib.com/bibliography/applicat803vqa1.html#TT193722"
}

@inproceedings{bb198522,
  AUTHOR    = "Messina, N. and Amato, G. and Carrara, F. and Falchi, F. and Gennaro, C.",
  TITLE     = "Learning Relationship-Aware Visual Features",
  BOOKTITLE = CEFR-LCV18,
  YEAR      = "2018",
  PAGES     = "IV:486--501",
  BIBSOURCE = "http://www.visionbib.com/bibliography/applicat803vqa1.html#TT193723"
}

@inproceedings{bb198523,
  AUTHOR    = "Methani, N. and Ganguly, P. and Khapra, M.M. and Kumar, P.",
  TITLE     = "{PlotQA}: Reasoning over Scientific Plots",
  BOOKTITLE = WACV20,
  YEAR      = "2020",
  PAGES     = "1516--1525",
  BIBSOURCE = "http://www.visionbib.com/bibliography/applicat803vqa1.html#TT193724"
}

@article{bb198524,
  AUTHOR    = "Yu, J. and Zhu, Z.H. and Wang, Y.J. and Zhang, W.F. and Hu, Y. and Tan, J.L.",
  TITLE     = "Cross-modal knowledge reasoning for knowledge-based visual question answering",
  JOURNAL   = PR,
  VOLUME    = "108",
  YEAR      = "2020",
  PAGES     = "107563",
  BIBSOURCE = "http://www.visionbib.com/bibliography/applicat803vqa1.html#TT193725"
}

@inproceedings{bb198525,
  AUTHOR    = "Yang, Z.Q. and Qin, Z.C. and Yu, J. and Wan, T.",
  TITLE     = "Prior Visual Relationship Reasoning For Visual Question Answering",
  BOOKTITLE = ICIP20,
  YEAR      = "2020",
  PAGES     = "1411--1415",
  BIBSOURCE = "http://www.visionbib.com/bibliography/applicat803vqa1.html#TT193726"
}

@article{bb198526,
  AUTHOR    = "Bai, Z.W. and Li, Y. and Wozniak, M. and Zhou, M.L. and Li, D.",
  TITLE     = "{DecomVQANet}: Decomposing visual question answering deep network via tensor decomposition and regression",
  JOURNAL   = PR,
  VOLUME    = "110",
  YEAR      = "2021",
  PAGES     = "107538",
  BIBSOURCE = "http://www.visionbib.com/bibliography/applicat803vqa1.html#TT193727"
}

@article{bb198527,
  AUTHOR    = "Farazi, M.R. and Khan, S.H. and Barnes, N.",
  TITLE     = "From known to the unknown: Transferring knowledge to answer questions about novel visual and semantic concepts",
  JOURNAL   = IVC,
  VOLUME    = "103",
  YEAR      = "2020",
  PAGES     = "103985",
  BIBSOURCE = "http://www.visionbib.com/bibliography/applicat803vqa1.html#TT193728"
}

@article{bb198528,
  AUTHOR    = "Terao, K. and Tamaki, T. and Raytchev, B. and Kaneda, K. and Satoh, S.",
  TITLE     = "Rephrasing Visual Questions by Specifying the Entropy of the Answer Distribution",
  JOURNAL   = IEICE,
  VOLUME    = "E103-D",
  YEAR      = "2020",
  NUMBER    = "11",
  MONTH     = nov,
  PAGES     = "2362--2370",
  BIBSOURCE = "http://www.visionbib.com/bibliography/applicat803vqa1.html#TT193729"
}

@article{bb198529,
  AUTHOR    = "Yu, J. and Zhang, W.F. and Lu, Y.H. and Qin, Z.C. and Hu, Y. and Tan, J.L. and Wu, Q.",
  TITLE     = "Reasoning on the Relation: Enhancing Visual Representation for Visual Question Answering and Cross-Modal Retrieval",
  JOURNAL   = MultMed,
  VOLUME    = "22",
  YEAR      = "2020",
  NUMBER    = "12",
  MONTH     = dec,
  PAGES     = "3196--3209",
  BIBSOURCE = "http://www.visionbib.com/bibliography/applicat803vqa1.html#TT193730"
}

@article{bb198530,
  AUTHOR    = "Lobry, S. and Marcos, D. and Murray, J. and Tuia, D.",
  TITLE     = "{RSVQA}: Visual Question Answering for Remote Sensing Data",
  JOURNAL   = GeoRS,
  VOLUME    = "58",
  YEAR      = "2020",
  NUMBER    = "12",
  MONTH     = dec,
  PAGES     = "8555--8566",
  BIBSOURCE = "http://www.visionbib.com/bibliography/applicat803vqa1.html#TT193731"
}

@inproceedings{bb198531,
  AUTHOR    = "Faure, M. and Lobry, S. and Kurtz, C. and Wendling, L.",
  TITLE     = "Embedding Spatial Relations in Visual Question Answering for Remote Sensing",
  BOOKTITLE = "ICPR22",
  YEAR      = "2022",
  PAGES     = "310--316",
  BIBSOURCE = "http://www.visionbib.com/bibliography/applicat803vqa1.html#TT193732"
}

@inproceedings{bb198532,
  AUTHOR    = "Chappuis, C. and Zermatten, V. and Lobry, S. and Le Saux, B. and Tuia, D.",
  TITLE     = "{Prompt-RSVQA}: Prompting visual context to a language model for Remote Sensing Visual Question Answering",
  BOOKTITLE = EarthVision22,
  YEAR      = "2022",
  PAGES     = "1371--1380",
  BIBSOURCE = "http://www.visionbib.com/bibliography/applicat803vqa1.html#TT193733"
}

@article{bb198533,
  AUTHOR    = "Sun, B. and Yao, Z. and Zhang, Y.H. and Yu, L.J.",
  TITLE     = "Local relation network with multilevel attention for visual question answering",
  JOURNAL   = JVCIR,
  VOLUME    = "73",
  YEAR      = "2020",
  PAGES     = "102762",
  BIBSOURCE = "http://www.visionbib.com/bibliography/applicat803vqa1.html#TT193734"
}

@article{bb198534,
  AUTHOR    = "Wang, J.M. and Cui, E. and Liu, K.L. and Sun, Y.K. and Liang, J.Y. and Yuan, C.M. and Duan, X.J. and Jin, G.H. and Chung, T.S.",
  TITLE     = "Referring expression comprehension model with matching detection and linguistic feedback",
  JOURNAL   = IET-CV,
  VOLUME    = "14",
  YEAR      = "2020",
  NUMBER    = "8",
  MONTH     = dec,
  PAGES     = "625--633",
  BIBSOURCE = "http://www.visionbib.com/bibliography/applicat803vqa1.html#TT193735"
}

@article{bb198535,
  AUTHOR    = "Li, X. and Yuan, A. and Lu, X.",
  TITLE     = "Vision-to-Language Tasks Based on Attributes and Attention Mechanism",
  JOURNAL   = Cyber,
  VOLUME    = "51",
  YEAR      = "2021",
  NUMBER    = "2",
  MONTH     = feb,
  PAGES     = "913--926",
  BIBSOURCE = "http://www.visionbib.com/bibliography/applicat803vqa1.html#TT193736"
}

@article{bb198536,
  AUTHOR    = "Cao, Q.X. and Liang, X.D. and Li, B.L. and Lin, L.",
  TITLE     = "Interpretable Visual Question Answering by Reasoning on Dependency Trees",
  JOURNAL   = PAMI,
  VOLUME    = "43",
  YEAR      = "2021",
  NUMBER    = "3",
  MONTH     = mar,
  PAGES     = "887--901",
  BIBSOURCE = "http://www.visionbib.com/bibliography/applicat803vqa1.html#TT193737"
}

@inproceedings{bb198537,
  AUTHOR    = "Cao, Q.X. and Liang, X.D. and Li, B.L. and Li, G. and Lin, L.",
  TITLE     = "Visual Question Reasoning on General Dependency Tree",
  BOOKTITLE = CVPR18,
  YEAR      = "2018",
  PAGES     = "7249--7257",
  BIBSOURCE = "http://www.visionbib.com/bibliography/applicat803vqa1.html#TT193738"
}

@article{bb198538,
  AUTHOR    = "Shao, Y. and Lin, J.C.W. and Srivastava, G. and Jolfaei, A. and Guo, D.D. and Hu, Y.",
  TITLE     = "Self-attention-based conditional random fields latent variables model for sequence labeling",
  JOURNAL   = PRL,
  VOLUME    = "145",
  YEAR      = "2021",
  PAGES     = "157--164",
  BIBSOURCE = "http://www.visionbib.com/bibliography/applicat803vqa1.html#TT193739"
}

@article{bb198539,
  AUTHOR    = "Zhong, H.S. and Chen, J.Y. and Shen, C. and Zhang, H.W. and Huang, J.Q. and Hua, X.S.",
  TITLE     = "Self-Adaptive Neural Module Transformer for Visual Question Answering",
  JOURNAL   = MultMed,
  VOLUME    = "23",
  YEAR      = "2021",
  PAGES     = "1264--1273",
  BIBSOURCE = "http://www.visionbib.com/bibliography/applicat803vqa1.html#TT193740"
}

@article{bb198540,
  AUTHOR    = "Sharma, H. and Jalal, A.S.",
  TITLE     = "Visual question answering model based on graph neural network and contextual attention",
  JOURNAL   = IVC,
  VOLUME    = "110",
  YEAR      = "2021",
  PAGES     = "104165",
  BIBSOURCE = "http://www.visionbib.com/bibliography/applicat803vqa1.html#TT193741"
}

@article{bb198541,
  AUTHOR    = "Wu, Y. and Ma, Y.T. and Wan, S.H.",
  TITLE     = "Multi-scale relation reasoning for multi-modal Visual Question Answering",
  JOURNAL   = SP:IC,
  VOLUME    = "96",
  YEAR      = "2021",
  PAGES     = "116319",
  BIBSOURCE = "http://www.visionbib.com/bibliography/applicat803vqa1.html#TT193742"
}

@inproceedings{bb198542,
  AUTHOR    = "Ma, Y.T. and Lu, T. and Wu, Y.",
  TITLE     = "Multi-scale Relational Reasoning with Regional Attention for Visual Question Answering",
  BOOKTITLE = ICPR21,
  YEAR      = "2021",
  PAGES     = "5642--5649",
  BIBSOURCE = "http://www.visionbib.com/bibliography/applicat803vqa1.html#TT193743"
}

@article{bb198543,
  AUTHOR    = "dos S Silva, F.H. and Bezerra, G.M. and Holanda, G.B. and de Souza, J.W.M. and Rego, P.A.L. and Lira Neto, A.V. and de Albuquerque, V.H.C. and Reboucas Filho, P.P.",
  TITLE     = "A novel feature extractor for human action recognition in visual question answering",
  JOURNAL   = PRL,
  VOLUME    = "147",
  YEAR      = "2021",
  PAGES     = "41--47",
  BIBSOURCE = "http://www.visionbib.com/bibliography/applicat803vqa1.html#TT193744"
}

@article{bb198544,
  AUTHOR    = "Guo, W. and Zhang, Y. and Yang, J.F. and Yuan, X.J.",
  TITLE     = "Re-Attention for Visual Question Answering",
  JOURNAL   = IP,
  VOLUME    = "30",
  YEAR      = "2021",
  PAGES     = "6730--6743",
  BIBSOURCE = "http://www.visionbib.com/bibliography/applicat803vqa1.html#TT193745"
}

@article{bb198545,
  AUTHOR    = "Hu, J. and Qian, S. and Fang, Q. and Xu, C.S.",
  TITLE     = "Heterogeneous Community Question Answering via Social-Aware Multi-Modal Co-Attention Convolutional Matching",
  JOURNAL   = MultMed,
  VOLUME    = "23",
  YEAR      = "2021",
  PAGES     = "2321--2334",
  BIBSOURCE = "http://www.visionbib.com/bibliography/applicat803vqa1.html#TT193746"
}

@article{bb198546,
  AUTHOR    = "Farazi, M. and Khan, S. and Barnes, N.",
  TITLE     = "Accuracy vs. complexity: A trade-off in visual question answering models",
  JOURNAL   = PR,
  VOLUME    = "120",
  YEAR      = "2021",
  PAGES     = "108106",
  BIBSOURCE = "http://www.visionbib.com/bibliography/applicat803vqa1.html#TT193747"
}

@article{bb198547,
  AUTHOR    = "Zheng, W.F. and Yin, L.R. and Chen, X.B. and Ma, Z. and Liu, S. and Yang, B.",
  TITLE     = "Knowledge base graph embedding module design for Visual question answering model",
  JOURNAL   = PR,
  VOLUME    = "120",
  YEAR      = "2021",
  PAGES     = "108153",
  BIBSOURCE = "http://www.visionbib.com/bibliography/applicat803vqa1.html#TT193748"
}

@article{bb198548,
  AUTHOR    = "Barra, S. and Bisogni, C. and de Marsico, M. and Ricciardi, S.",
  TITLE     = "Visual question answering: Which investigated applications?",
  JOURNAL   = PRL,
  VOLUME    = "151",
  YEAR      = "2021",
  PAGES     = "325--331",
  BIBSOURCE = "http://www.visionbib.com/bibliography/applicat803vqa1.html#TT193749"
}

@article{bb198549,
  AUTHOR    = "Manmadhan, S. and Kovoor, B.C.",
  TITLE     = "Multi-Tier Attention Network using Term-weighted Question Features for Visual Question Answering",
  JOURNAL   = IVC,
  VOLUME    = "115",
  YEAR      = "2021",
  PAGES     = "104291",
  BIBSOURCE = "http://www.visionbib.com/bibliography/applicat803vqa1.html#TT193750"
}

@article{bb198550,
  AUTHOR    = "Liu, A.A. and Lu, Z. and Xu, N. and Nie, W.Z. and Li, W.H.",
  TITLE     = "Multi-type decision fusion network for visual {Q\&A}",
  JOURNAL   = IVC,
  VOLUME    = "115",
  YEAR      = "2021",
  PAGES     = "104281",
  BIBSOURCE = "http://www.visionbib.com/bibliography/applicat803vqa1.html#TT193751"
}

@article{bb198551,
  AUTHOR    = "Patro, B.N. and Kurmi, V.K. and Kumar, S. and Namboodiri, V.P.",
  TITLE     = "{MUMC}: Minimizing uncertainty of mixture of cues",
  JOURNAL   = IVC,
  VOLUME    = "115",
  YEAR      = "2021",
  PAGES     = "104280",
  BIBSOURCE = "http://www.visionbib.com/bibliography/applicat803vqa1.html#TT193752"
}

@article{bb198552,
  AUTHOR    = "Liu, F. and Liu, J. and Fang, Z.W. and Hong, R.C. and Lu, H.Q.",
  TITLE     = "Visual Question Answering With Dense Inter- and Intra-Modality Interactions",
  JOURNAL   = MultMed,
  VOLUME    = "23",
  YEAR      = "2021",
  PAGES     = "3518--3529",
  BIBSOURCE = "http://www.visionbib.com/bibliography/applicat803vqa1.html#TT193753"
}

@article{bb198553,
  AUTHOR    = "Wu, J.J. and Du, J. and Wang, F. and Yang, C. and Jiang, X.Z. and Hu, J. and Yin, B. and Zhang, J.S. and Dai, L.R.",
  TITLE     = "A multimodal attention fusion network with a dynamic vocabulary for {TextVQA}",
  JOURNAL   = PR,
  VOLUME    = "122",
  YEAR      = "2022",
  PAGES     = "108214",
  BIBSOURCE = "http://www.visionbib.com/bibliography/applicat803vqa1.html#TT193754"
}

@article{bb198554,
  AUTHOR    = "Narayanan, A. and Rao, A. and Prasad, A. and Natarajan, S.",
  TITLE     = "{VQA} as a factoid question answering problem: A novel approach for knowledge-aware and explainable visual question answering",
  JOURNAL   = IVC,
  VOLUME    = "116",
  YEAR      = "2021",
  PAGES     = "104328",
  BIBSOURCE = "http://www.visionbib.com/bibliography/applicat803vqa1.html#TT193755"
}

@article{bb198555,
  AUTHOR    = "Guo, Y.Y. and Nie, L.Q. and Cheng, Z.Y. and Tian, Q. and Zhang, M.",
  TITLE     = "Loss Re-Scaling {VQA}: Revisiting the Language Prior Problem From a Class-Imbalance View",
  JOURNAL   = IP,
  VOLUME    = "31",
  YEAR      = "2022",
  PAGES     = "227--238",
  BIBSOURCE = "http://www.visionbib.com/bibliography/applicat803vqa1.html#TT193756"
}

@article{bb198556,
  AUTHOR    = "Peng, L. and Yang, Y. and Wang, Z. and Huang, Z. and Shen, H.T.",
  TITLE     = "{MRA-Net}: Improving {VQA} Via Multi-Modal Relation Attention Network",
  JOURNAL   = PAMI,
  VOLUME    = "44",
  YEAR      = "2022",
  NUMBER    = "1",
  MONTH     = jan,
  PAGES     = "318--329",
  BIBSOURCE = "http://www.visionbib.com/bibliography/applicat803vqa1.html#TT193757"
}

@article{bb198557,
  AUTHOR    = "Manogaran, G. and Shakeel, P.M. and Burhanuddin, M.A. and Baskar, S. and Saravanan, V. and Crespo, R.G. and Martinez, O.S.",
  TITLE     = "{ADCCF}: Adaptive deep concatenation coder framework for visual question answering",
  JOURNAL   = PRL,
  VOLUME    = "152",
  YEAR      = "2021",
  PAGES     = "348--355",
  BIBSOURCE = "http://www.visionbib.com/bibliography/applicat803vqa1.html#TT193758"
}

@article{bb198558,
  AUTHOR    = "Zhou, Y. and Ji, R.R. and Sun, X.S. and Su, J.S. and Meng, D.Y. and Gao, Y. and Shen, C.H.",
  TITLE     = "Plenty is Plague: Fine-Grained Learning for Visual Question Answering",
  JOURNAL   = PAMI,
  VOLUME    = "44",
  YEAR      = "2022",
  NUMBER    = "2",
  MONTH     = feb,
  PAGES     = "697--709",
  BIBSOURCE = "http://www.visionbib.com/bibliography/applicat803vqa1.html#TT193759"
}

@article{bb198559,
  AUTHOR    = "E, W.N. and Zhou, Y.",
  TITLE     = "A Mathematical Model for Universal Semantics",
  JOURNAL   = PAMI,
  VOLUME    = "44",
  YEAR      = "2022",
  NUMBER    = "3",
  MONTH     = mar,
  PAGES     = "1124--1132",
  BIBSOURCE = "http://www.visionbib.com/bibliography/applicat803vqa1.html#TT193760"
}

@article{bb198560,
  AUTHOR    = "Li, X.P. and Wu, B. and Song, J.K. and Gao, L.L. and Zeng, P.P. and Gan, C.",
  TITLE     = "Text-instance graph: Exploring the relational semantics for text-based visual question answering",
  JOURNAL   = PR,
  VOLUME    = "124",
  YEAR      = "2022",
  PAGES     = "108455",
  BIBSOURCE = "http://www.visionbib.com/bibliography/applicat803vqa1.html#TT193761"
}

@article{bb198561,
  AUTHOR    = "Shao, X.J. and Xiang, Z.L. and Li, Y.X.",
  TITLE     = "Visual question answering with gated relation-aware auxiliary",
  JOURNAL   = IET-IPR,
  VOLUME    = "16",
  YEAR      = "2022",
  NUMBER    = "5",
  PAGES     = "1424--1432",
  BIBSOURCE = "http://www.visionbib.com/bibliography/applicat803vqa1.html#TT193762"
}

@article{bb198562,
  AUTHOR    = "Liu, Y. and Zhang, X.M. and Zhao, Z.Y. and Zhang, B. and Cheng, L. and Li, Z.J.",
  TITLE     = "{ALSA}: Adversarial Learning of Supervised Attentions for Visual Question Answering",
  JOURNAL   = Cyber,
  VOLUME    = "52",
  YEAR      = "2022",
  NUMBER    = "6",
  MONTH     = jun,
  PAGES     = "4520--4533",
  BIBSOURCE = "http://www.visionbib.com/bibliography/applicat803vqa1.html#TT193763"
}

@article{bb198563,
  AUTHOR    = "Ouyang, N.L. and Huang, Q.B. and Li, P.J. and Cai, Y. and Liu, B. and Leung, H.F. and Li, Q.",
  TITLE     = "Suppressing Biased Samples for Robust {VQA}",
  JOURNAL   = MultMed,
  VOLUME    = "24",
  YEAR      = "2022",
  PAGES     = "3405--3415",
  BIBSOURCE = "http://www.visionbib.com/bibliography/applicat803vqa1.html#TT193764"
}

@article{bb198564,
  AUTHOR    = "Shuang, K. and Guo, J. and Wang, Z.",
  TITLE     = "Comprehensive-perception dynamic reasoning for visual question answering",
  JOURNAL   = PR,
  VOLUME    = "131",
  YEAR      = "2022",
  PAGES     = "108878",
  BIBSOURCE = "http://www.visionbib.com/bibliography/applicat803vqa1.html#TT193765"
}

@article{bb198565,
  AUTHOR    = "Gouthaman, K.V. and Mittal, A.",
  TITLE     = "On the role of question encoder sequence model in robust visual question answering",
  JOURNAL   = PR,
  VOLUME    = "131",
  YEAR      = "2022",
  PAGES     = "108883",
  BIBSOURCE = "http://www.visionbib.com/bibliography/applicat803vqa1.html#TT193766"
}

@article{bb198566,
  AUTHOR    = "Zhou, K.Y. and Yang, J.K. and Loy, C.C. and Liu, Z.W.",
  TITLE     = "Learning to Prompt for Vision-Language Models",
  JOURNAL   = IJCV,
  VOLUME    = "130",
  YEAR      = "2022",
  NUMBER    = "9",
  MONTH     = sep,
  PAGES     = "2337--2348",
  BIBSOURCE = "http://www.visionbib.com/bibliography/applicat803vqa1.html#TT193767"
}

@inproceedings{bb198567,
  AUTHOR    = "Zhou, K.Y. and Yang, J.K. and Loy, C.C. and Liu, Z.",
  TITLE     = "Conditional Prompt Learning for Vision-Language Models",
  BOOKTITLE = CVPR22,
  YEAR      = "2022",
  PAGES     = "16795--16804",
  BIBSOURCE = "http://www.visionbib.com/bibliography/applicat803vqa1.html#TT193768"
}

@article{bb198568,
  AUTHOR    = "Chen, C.Q. and Han, D.Z. and Chang, C.C.",
  TITLE     = "{CAAN}: Context-Aware attention network for visual question answering",
  JOURNAL   = PR,
  VOLUME    = "132",
  YEAR      = "2022",
  PAGES     = "108980",
  BIBSOURCE = "http://www.visionbib.com/bibliography/applicat803vqa1.html#TT193769"
}

@article{bb198569,
  AUTHOR    = "Song, L.Y. and Li, J. and Liu, J. and Yang, Y. and Shang, X. and Sun, M.X.",
  TITLE     = "Answering knowledge-based visual questions via the exploration of Question Purpose",
  JOURNAL   = PR,
  VOLUME    = "133",
  YEAR      = "2023",
  PAGES     = "109015",
  BIBSOURCE = "http://www.visionbib.com/bibliography/applicat803vqa1.html#TT193770"
}

@article{bb198570,
  AUTHOR    = "Xie, J.Y. and Fang, W.H. and Cai, Y. and Huang, Q.B. and Li, Q.",
  TITLE     = "Knowledge-Based Visual Question Generation",
  JOURNAL   = CirSysVideo,
  VOLUME    = "32",
  YEAR      = "2022",
  NUMBER    = "11",
  MONTH     = nov,
  PAGES     = "7547--7558",
  BIBSOURCE = "http://www.visionbib.com/bibliography/applicat803vqa1.html#TT193771"
}

@article{bb198571,
  AUTHOR    = "Gao, C. and Zhu, Q. and Wang, P. and Li, H. and Liu, Y.L. and van den Hengel, A.J. and Wu, Q.",
  TITLE     = "Structured Multimodal Attentions for {TextVQA}",
  JOURNAL   = PAMI,
  VOLUME    = "44",
  YEAR      = "2022",
  NUMBER    = "12",
  MONTH     = dec,
  PAGES     = "9603--9614",
  BIBSOURCE = "http://www.visionbib.com/bibliography/applicat803vqa1.html#TT193772"
}

@article{bb198572,
  AUTHOR    = "Jin, Z.X. and Wu, H. and Yang, C. and Zhou, F. and Qin, J.Y. and Xiao, L. and Yin, X.C.",
  TITLE     = "{RUArt}: A Novel Text-Centered Solution for Text-Based Visual Question Answering",
  JOURNAL   = MultMed,
  VOLUME    = "25",
  YEAR      = "2023",
  PAGES     = "1--12",
  BIBSOURCE = "http://www.visionbib.com/bibliography/applicat803vqa1.html#TT193773"
}

@article{bb198573,
  AUTHOR    = "Beckham, C. and Weiss, M. and Golemo, F. and Honari, S. and Nowrouzezahrai, D. and Pal, C.",
  TITLE     = "Visual question answering from another perspective: {CLEVR} mental rotation tests",
  JOURNAL   = PR,
  VOLUME    = "136",
  YEAR      = "2023",
  PAGES     = "109209",
  BIBSOURCE = "http://www.visionbib.com/bibliography/applicat803vqa1.html#TT193774"
}

@article{bb198574,
  AUTHOR    = "Zhang, H. and Zeng, P.P. and Hu, Y.X. and Qian, J. and Song, J. and Gao, L.",
  TITLE     = "Learning visual question answering on controlled semantic noisy labels",
  JOURNAL   = PR,
  VOLUME    = "138",
  YEAR      = "2023",
  PAGES     = "109339",
  BIBSOURCE = "http://www.visionbib.com/bibliography/applicat803vqa1.html#TT193775"
}

@article{bb198575,
  AUTHOR    = "Zeng, G. and Zhang, Y. and Zhou, Y. and Yang, X.M. and Jiang, N. and Zhao, G.Q. and Wang, W.P. and Yin, X.C.",
  TITLE     = "Beyond {OCR} + {VQA}: Towards end-to-end reading and reasoning for robust and accurate textvqa",
  JOURNAL   = PR,
  VOLUME    = "138",
  YEAR      = "2023",
  PAGES     = "109337",
  BIBSOURCE = "http://www.visionbib.com/bibliography/applicat803vqa1.html#TT193776"
}

@inproceedings{bb198576,
  AUTHOR    = "Jha, A. and Patro, B. and Van Gool, L.J. and Tuytelaars, T.",
  TITLE     = "Barlow constrained optimization for Visual Question Answering",
  BOOKTITLE = WACV23,
  YEAR      = "2023",
  PAGES     = "1084--1093",
  BIBSOURCE = "http://www.visionbib.com/bibliography/applicat803vqa1.html#TT193777"
}

@inproceedings{bb198577,
  AUTHOR    = "Ravi, S. and Chinchure, A. and Sigal, L. and Liao, R.J. and Shwartz, V.",
  TITLE     = "{VLC-BERT}: Visual Question Answering with Contextualized Commonsense Knowledge",
  BOOKTITLE = WACV23,
  YEAR      = "2023",
  PAGES     = "1155--1165",
  BIBSOURCE = "http://www.visionbib.com/bibliography/applicat803vqa1.html#TT193778"
}

@inproceedings{bb198578,
  AUTHOR    = "Uehara, K. and Harada, T.",
  TITLE     = "{K-VQG}: Knowledge-aware Visual Question Generation for Common-sense Acquisition",
  BOOKTITLE = WACV23,
  YEAR      = "2023",
  PAGES     = "4390--4398",
  BIBSOURCE = "http://www.visionbib.com/bibliography/applicat803vqa1.html#TT193779"
}

@inproceedings{bb198579,
  AUTHOR    = "Etesam, Y. and Kochiev, L. and Chang, A.X.",
  TITLE     = "{3DVQA}: Visual Question Answering for {3D} Environments",
  BOOKTITLE = CRV22,
  YEAR      = "2022",
  PAGES     = "233--240",
  BIBSOURCE = "http://www.visionbib.com/bibliography/applicat803vqa1.html#TT193780"
}

@inproceedings{bb198580,
  AUTHOR    = "Haisa, G. and Altenbek, G.",
  TITLE     = "Question Classification Based on Weak Supervision and Interrogative Pronouns Attention Mechanism",
  BOOKTITLE = "ICPR22",
  YEAR      = "2022",
  PAGES     = "2273--2278",
  BIBSOURCE = "http://www.visionbib.com/bibliography/applicat803vqa1.html#TT193781"
}

@inproceedings{bb198581,
  AUTHOR    = "Ramamurthy, P. and Aakur, S.N.",
  TITLE     = "{ISD-QA}: Iterative Distillation of Commonsense Knowledge from General Language Models for Unsupervised Question Answering",
  BOOKTITLE = "ICPR22",
  YEAR      = "2022",
  PAGES     = "1229--1235",
  BIBSOURCE = "http://www.visionbib.com/bibliography/applicat803vqa1.html#TT193782"
}

@inproceedings{bb198582,
  AUTHOR    = "Zhang, H. and Wu, W.",
  TITLE     = "{CAT}: Re-Conv Attention in Transformer for Visual Question Answering",
  BOOKTITLE = "ICPR22",
  YEAR      = "2022",
  PAGES     = "1471--1477",
  BIBSOURCE = "http://www.visionbib.com/bibliography/applicat803vqa1.html#TT193783"
}

@inproceedings{bb198583,
  AUTHOR    = "Liu, L. and Su, X.D. and Guo, H. and Zhu, D.",
  TITLE     = "A Transformer-based Medical Visual Question Answering Model",
  BOOKTITLE = "ICPR22",
  YEAR      = "2022",
  PAGES     = "1712--1718",
  BIBSOURCE = "http://www.visionbib.com/bibliography/applicat803vqa1.html#TT193784"
}

@inproceedings{bb198584,
  AUTHOR    = "Boecking, B. and Usuyama, N. and Bannur, S. and Castro, D.C. and Schwaighofer, A. and Hyland, S. and Wetscherek, M. and Naumann, T. and Nori, A. and Alvarez Valle, J. and Poon, H. and Oktay, O.",
  TITLE     = "Making the Most of Text Semantics to Improve Biomedical Vision-Language Processing",
  BOOKTITLE = ECCV22,
  YEAR      = "2022",
  PAGES     = "XXXVI:1--21",
  BIBSOURCE = "http://www.visionbib.com/bibliography/applicat803vqa1.html#TT193785"
}

@inproceedings{bb198585,
  AUTHOR    = "Cui, Q. and Zhou, B. and Guo, Y. and Yin, W.D. and Wu, H. and Yoshie, O. and Chen, Y.",
  TITLE     = "Contrastive Vision-Language Pre-training with Limited Resources",
  BOOKTITLE = ECCV22,
  YEAR      = "2022",
  PAGES     = "XXXVI:236--253",
  BIBSOURCE = "http://www.visionbib.com/bibliography/applicat803vqa1.html#TT193786"
}

@inproceedings{bb198586,
  AUTHOR    = "Wu, X.Y. and Lu, J.F. and Li, Z.F. and Xiong, F.C.",
  TITLE     = "Ques-to-Visual Guided Visual Question Answering",
  BOOKTITLE = ICIP22,
  YEAR      = "2022",
  PAGES     = "4193--4197",
  BIBSOURCE = "http://www.visionbib.com/bibliography/applicat803vqa1.html#TT193787"
}

@inproceedings{bb198587,
  AUTHOR    = "Sarkar, A. and Rahnemoonfar, M.",
  TITLE     = "{Grad-Cam} Aware Supervised Attention for Visual Question Answering for Post-Disaster Damage Assessment",
  BOOKTITLE = ICIP22,
  YEAR      = "2022",
  PAGES     = "3783--3787",
  BIBSOURCE = "http://www.visionbib.com/bibliography/applicat803vqa1.html#TT193788"
}

@inproceedings{bb198588,
  AUTHOR    = "Whitehead, S. and Petryk, S. and Shakib, V. and Gonzalez, J. and Darrell, T.J. and Rohrbach, A. and Rohrbach, M.",
  TITLE     = "Reliable Visual Question Answering: Abstain Rather Than Answer Incorrectly",
  BOOKTITLE = ECCV22,
  YEAR      = "2022",
  PAGES     = "XXXVI:148--166",
  BIBSOURCE = "http://www.visionbib.com/bibliography/applicat803vqa1.html#TT193789"
}

@inproceedings{bb198589,
  AUTHOR    = "Chen, L. and Zheng, Y.H. and Xiao, J.",
  TITLE     = "Rethinking Data Augmentation for Robust Visual Question Answering",
  BOOKTITLE = ECCV22,
  YEAR      = "2022",
  PAGES     = "XXXVI:95--112",
  BIBSOURCE = "http://www.visionbib.com/bibliography/applicat803vqa1.html#TT193790"
}

@inproceedings{bb198590,
  AUTHOR    = "Zhang, H.T. and Wu, W.",
  TITLE     = "Context Relation Fusion Model for Visual Question Answering",
  BOOKTITLE = ICIP22,
  YEAR      = "2022",
  PAGES     = "2112--2116",
  BIBSOURCE = "http://www.visionbib.com/bibliography/applicat803vqa1.html#TT193791"
}

@inproceedings{bb198591,
  AUTHOR    = "Biten, A.F. and Litman, R. and Xie, Y.S. and Appalaraju, S. and Manmatha, R.",
  TITLE     = "{LaTr}: Layout-Aware Transformer for Scene-Text {VQA}",
  BOOKTITLE = CVPR22,
  YEAR      = "2022",
  PAGES     = "16527--16537",
  BIBSOURCE = "http://www.visionbib.com/bibliography/applicat803vqa1.html#TT193792"
}

@inproceedings{bb198592,
  AUTHOR    = "Lu, J.Y. and Ye, X. and Ren, Y. and Yang, Y.Z.",
  TITLE     = "Good, Better, Best: Textual Distractors Generation for Multiple-Choice Visual Question Answering via Reinforcement Learning",
  BOOKTITLE = ODRUM22,
  YEAR      = "2022",
  PAGES     = "4917--4926",
  BIBSOURCE = "http://www.visionbib.com/bibliography/applicat803vqa1.html#TT193793"
}

@inproceedings{bb198593,
  AUTHOR    = "Nguyen, B.X. and Do, T. and Tran, H. and Tjiputra, E. and Tran, Q.D. and Nguyen, A.",
  TITLE     = "Coarse-to-Fine Reasoning for Visual Question Answering",
  BOOKTITLE = MULA22,
  YEAR      = "2022",
  PAGES     = "4557--4565",
  BIBSOURCE = "http://www.visionbib.com/bibliography/applicat803vqa1.html#TT193794"
}

@inproceedings{bb198594,
  AUTHOR    = "Ding, Y.H. and Huang, Z. and Wang, R. and Zhang, Y.H. and Chen, X. and Ma, Y.Z. and Chung, H. and Han, S.C.",
  TITLE     = "{V-Doc}: Visual questions answers with Documents",
  BOOKTITLE = CVPR22,
  YEAR      = "2022",
  PAGES     = "21460--21466",
  BIBSOURCE = "http://www.visionbib.com/bibliography/applicat803vqa1.html#TT193795"
}

@inproceedings{bb198595,
  AUTHOR    = "Azuma, D. and Miyanishi, T. and Kurita, S.H. and Kawanabe, M.",
  TITLE     = "{ScanQA}: {3D} Question Answering for Spatial Scene Understanding",
  BOOKTITLE = CVPR22,
  YEAR      = "2022",
  PAGES     = "19107--19117",
  BIBSOURCE = "http://www.visionbib.com/bibliography/applicat803vqa1.html#TT193796"
}

@inproceedings{bb198596,
  AUTHOR    = "Li, G.Y. and Wei, Y. and Tian, Y. and Xu, C.L. and Wen, J.R. and Hu, D.",
  TITLE     = "Learning to Answer Questions in Dynamic Audio-Visual Scenarios",
  BOOKTITLE = CVPR22,
  YEAR      = "2022",
  PAGES     = "19086--19096",
  BIBSOURCE = "http://www.visionbib.com/bibliography/applicat803vqa1.html#TT193797"
}

@inproceedings{bb198597,
  AUTHOR    = "Chen, C. and Anjum, S. and Gurari, D.",
  TITLE     = "Grounding Answers for Visual Questions Asked by Visually Impaired People",
  BOOKTITLE = CVPR22,
  YEAR      = "2022",
  PAGES     = "19076--19085",
  BIBSOURCE = "http://www.visionbib.com/bibliography/applicat803vqa1.html#TT193798"
}

@inproceedings{bb198598,
  AUTHOR    = "Guo, X.Y. and Duan, J.L. and Kuo, C.C.J. and Gichoya, J.W. and Banerjee, I.",
  TITLE     = "Augmenting Vision Language Pretraining by Learning Codebook with Visual Semantics",
  BOOKTITLE = "ICPR22",
  YEAR      = "2022",
  PAGES     = "4779--4785",
  BIBSOURCE = "http://www.visionbib.com/bibliography/applicat803vqa1.html#TT193799"
}

@inproceedings{bb198599,
  AUTHOR    = "Yang, J. and Duan, J.L. and Tran, S. and Xu, Y. and Chanda, S. and Chen, L.Q. and Zeng, B. and Chilimbi, T. and Huang, J.Z.",
  TITLE     = "Vision-Language Pre-Training with Triple Contrastive Learning",
  BOOKTITLE = CVPR22,
  YEAR      = "2022",
  PAGES     = "15650--15659",
  BIBSOURCE = "http://www.visionbib.com/bibliography/applicat803vqa1.html#TT193800"
}