@inproceedings{bb110800,
  author    = {Wang, Z. and Feng, B. and Narasimhan, K. and Russakovsky, O.},
  title     = {Towards Unique and Informative Captioning of Images},
  booktitle = ECCV20,
  year      = {2020},
  pages     = {VII:629-644},
  bibsource = {http://www.visionbib.com/bibliography/match607ic1.html#TT107090},
}

@inproceedings{bb110801,
  author    = {Sidorov, O. and Hu, R.H. and Rohrbach, M. and Singh, A.},
  title     = {Textcaps: A Dataset for Image Captioning with Reading Comprehension},
  booktitle = ECCV20,
  year      = {2020},
  pages     = {II:742-758},
  bibsource = {http://www.visionbib.com/bibliography/match607ic1.html#TT107091},
}

@inproceedings{bb110802,
  author    = {Durand, T.},
  title     = {Learning User Representations for Open Vocabulary Image Hashtag Prediction},
  booktitle = CVPR20,
  year      = {2020},
  pages     = {9766-9775},
  bibsource = {http://www.visionbib.com/bibliography/match607ic1.html#TT107092},
}

@inproceedings{bb110803,
  author    = {Prabhudesai, M. and Tung, H.Y.F. and Javed, S.A. and Sieb, M. and Harley, A.W. and Fragkiadaki, K.},
  title     = {Embodied Language Grounding With {3D} Visual Feature Representations},
  booktitle = CVPR20,
  year      = {2020},
  pages     = {2217-2226},
  bibsource = {http://www.visionbib.com/bibliography/match607ic1.html#TT107093},
}

@inproceedings{bb110804,
  author    = {Li, Z. and Tran, Q. and Mai, L. and Lin, Z. and Yuille, A.L.},
  title     = {Context-Aware Group Captioning via Self-Attention and Contrastive Features},
  booktitle = CVPR20,
  year      = {2020},
  pages     = {3437-3447},
  bibsource = {http://www.visionbib.com/bibliography/match607ic1.html#TT107094},
}

@inproceedings{bb110805,
  author    = {Zhou, Y. and Wang, M. and Liu, D. and Hu, Z. and Zhang, H.},
  title     = {More Grounded Image Captioning by Distilling Image-Text Matching Model},
  booktitle = CVPR20,
  year      = {2020},
  pages     = {4776-4785},
  bibsource = {http://www.visionbib.com/bibliography/match607ic1.html#TT107095},
}

@inproceedings{bb110806,
  author    = {Sammani, F. and Melas Kyriazi, L.},
  title     = {Show, Edit and Tell: A Framework for Editing Image Captions},
  booktitle = CVPR20,
  year      = {2020},
  pages     = {4807-4815},
  bibsource = {http://www.visionbib.com/bibliography/match607ic1.html#TT107096},
}

@inproceedings{bb110807,
  author    = {Chen, S. and Jin, Q. and Wang, P. and Wu, Q.},
  title     = {Say As You Wish: Fine-Grained Control of Image Caption Generation With Abstract Scene Graphs},
  booktitle = CVPR20,
  year      = {2020},
  pages     = {9959-9968},
  bibsource = {http://www.visionbib.com/bibliography/match607ic1.html#TT107097},
}

@inproceedings{bb110808,
  author    = {Guo, L. and Liu, J. and Zhu, X. and Yao, P. and Lu, S. and Lu, H.},
  title     = {Normalized and Geometry-Aware Self-Attention Network for Image Captioning},
  booktitle = CVPR20,
  year      = {2020},
  pages     = {10324-10333},
  bibsource = {http://www.visionbib.com/bibliography/match607ic1.html#TT107098},
}

@inproceedings{bb110809,
  author    = {Cornia, M. and Stefanini, M. and Baraldi, L. and Cucchiara, R.},
  title     = {Meshed-Memory Transformer for Image Captioning},
  booktitle = CVPR20,
  year      = {2020},
  pages     = {10575-10584},
  bibsource = {http://www.visionbib.com/bibliography/match607ic1.html#TT107099},
}

@inproceedings{bb110810,
  author    = {Chen, J. and Jin, Q.},
  title     = {Better Captioning With Sequence-Level Exploration},
  booktitle = CVPR20,
  year      = {2020},
  pages     = {10887-10896},
  bibsource = {http://www.visionbib.com/bibliography/match607ic1.html#TT107100},
}

@inproceedings{bb110811,
  author    = {Pan, Y. and Yao, T. and Li, Y. and Mei, T.},
  title     = {X-Linear Attention Networks for Image Captioning},
  booktitle = CVPR20,
  year      = {2020},
  pages     = {10968-10977},
  bibsource = {http://www.visionbib.com/bibliography/match607ic1.html#TT107101},
}

@inproceedings{bb110812,
  author    = {Tran, A. and Mathews, A. and Xie, L.},
  title     = {Transform and Tell: Entity-Aware News Image Captioning},
  booktitle = CVPR20,
  year      = {2020},
  pages     = {13032-13042},
  bibsource = {http://www.visionbib.com/bibliography/match607ic1.html#TT107102},
}

@inproceedings{bb110813,
  author    = {Park, G. and Han, C. and Kim, D. and Yoon, W.J.},
  title     = {{MHSAN}: Multi-Head Self-Attention Network for Visual Semantic Embedding},
  booktitle = WACV20,
  year      = {2020},
  pages     = {1507-1515},
  bibsource = {http://www.visionbib.com/bibliography/match607ic1.html#TT107103},
}

@inproceedings{bb110814,
  author    = {Chen, C. and Zhang, R. and Koh, E. and Kim, S. and Cohen, S. and Rossi, R.},
  title     = {Figure Captioning with Relation Maps for Reasoning},
  booktitle = WACV20,
  year      = {2020},
  pages     = {1526-1534},
  bibsource = {http://www.visionbib.com/bibliography/match607ic1.html#TT107104},
}

@inproceedings{bb110815,
  author    = {He, S. and Tavakoli, H.R. and Borji, A. and Pugeault, N.},
  title     = {Human Attention in Image Captioning: Dataset and Analysis},
  booktitle = ICCV19,
  year      = {2019},
  pages     = {8528-8537},
  bibsource = {http://www.visionbib.com/bibliography/match607ic1.html#TT107105},
}

@inproceedings{bb110816,
  author    = {Laina, I. and Rupprecht, C. and Navab, N.},
  title     = {Towards Unsupervised Image Captioning With Shared Multimodal Embeddings},
  booktitle = ICCV19,
  year      = {2019},
  pages     = {7413-7423},
  bibsource = {http://www.visionbib.com/bibliography/match607ic1.html#TT107106},
}

@inproceedings{bb110817,
  author    = {Huang, L. and Wang, W. and Chen, J. and Wei, X.},
  title     = {Attention on Attention for Image Captioning},
  booktitle = ICCV19,
  year      = {2019},
  pages     = {4633-4642},
  bibsource = {http://www.visionbib.com/bibliography/match607ic1.html#TT107107},
}

@inproceedings{bb110818,
  author    = {Yang, X. and Zhang, H. and Cai, J.},
  title     = {Learning to Collocate Neural Modules for Image Captioning},
  booktitle = ICCV19,
  year      = {2019},
  pages     = {4249-4259},
  bibsource = {http://www.visionbib.com/bibliography/match607ic1.html#TT107108},
}

@inproceedings{bb110819,
  author    = {Yao, T. and Pan, Y. and Li, Y. and Mei, T.},
  title     = {Hierarchy Parsing for Image Captioning},
  booktitle = ICCV19,
  year      = {2019},
  pages     = {2621-2629},
  bibsource = {http://www.visionbib.com/bibliography/match607ic1.html#TT107109},
}

@inproceedings{bb110820,
  author    = {Liu, L. and Tang, J. and Wan, X. and Guo, Z.},
  title     = {Generating Diverse and Descriptive Image Captions Using Visual Paraphrases},
  booktitle = ICCV19,
  year      = {2019},
  pages     = {4239-4248},
  bibsource = {http://www.visionbib.com/bibliography/match607ic1.html#TT107110},
}

@inproceedings{bb110821,
  author    = {Ke, L. and Pei, W. and Li, R. and Shen, X. and Tai, Y.},
  title     = {Reflective Decoding Network for Image Captioning},
  booktitle = ICCV19,
  year      = {2019},
  pages     = {8887-8896},
  bibsource = {http://www.visionbib.com/bibliography/match607ic1.html#TT107111},
}

@inproceedings{bb110822,
  author    = {Vered, G. and Oren, G. and Atzmon, Y. and Chechik, G.},
  title     = {Joint Optimization for Cooperative Image Captioning},
  booktitle = ICCV19,
  year      = {2019},
  pages     = {8897-8906},
  bibsource = {http://www.visionbib.com/bibliography/match607ic1.html#TT107112},
}

@inproceedings{bb110823,
  author    = {Ge, H. and Yan, Z. and Zhang, K. and Zhao, M. and Sun, L.},
  title     = {Exploring Overall Contextual Information for Image Captioning in Human-Like Cognitive Style},
  booktitle = ICCV19,
  year      = {2019},
  pages     = {1754-1763},
  bibsource = {http://www.visionbib.com/bibliography/match607ic1.html#TT107113},
}

@inproceedings{bb110824,
  author    = {Agrawal, H. and Desai, K. and Wang, Y. and Chen, X. and Jain, R. and Johnson, M. and Batra, D. and Parikh, D. and Lee, S. and Anderson, P.},
  title     = {nocaps: novel object captioning at scale},
  booktitle = ICCV19,
  year      = {2019},
  pages     = {8947-8956},
  bibsource = {http://www.visionbib.com/bibliography/match607ic1.html#TT107114},
}

@inproceedings{bb110825,
  author    = {Li, G. and Zhu, L. and Liu, P. and Yang, Y.},
  title     = {Entangled Transformer for Image Captioning},
  booktitle = ICCV19,
  year      = {2019},
  pages     = {8927-8936},
  bibsource = {http://www.visionbib.com/bibliography/match607ic1.html#TT107115},
}

@inproceedings{bb110826,
  author    = {Hu, H. and Misra, I. and van der Maaten, L.},
  title     = {Evaluating Text-to-Image Matching using Binary Image Selection ({BISON})},
  booktitle = CLVL19,
  year      = {2019},
  pages     = {1887-1890},
  bibsource = {http://www.visionbib.com/bibliography/match607ic1.html#TT107116},
}

@inproceedings{bb110827,
  author    = {Nguyen, A. and Tran, Q.D. and Do, T. and Reid, I. and Caldwell, D.G. and Tsagarakis, N.G.},
  title     = {Object Captioning and Retrieval with Natural Language},
  booktitle = ACVR19,
  year      = {2019},
  pages     = {2584-2592},
  bibsource = {http://www.visionbib.com/bibliography/match607ic1.html#TT107117},
}

@inproceedings{bb110828,
  author    = {Gu, J. and Joty, S. and Cai, J. and Zhao, H. and Yang, X. and Wang, G.},
  title     = {Unpaired Image Captioning via Scene Graph Alignments},
  booktitle = ICCV19,
  year      = {2019},
  pages     = {10322-10331},
  bibsource = {http://www.visionbib.com/bibliography/match607ic1.html#TT107118},
}

@inproceedings{bb110829,
  author    = {Shen, T. and Kar, A. and Fidler, S.},
  title     = {Learning to Caption Images Through a Lifetime by Asking Questions},
  booktitle = ICCV19,
  year      = {2019},
  pages     = {10392-10401},
  bibsource = {http://www.visionbib.com/bibliography/match607ic1.html#TT107119},
}

@inproceedings{bb110830,
  author    = {Tanaka, M. and Itamochi, T. and Narioka, K. and Sato, I. and Ushiku, Y. and Harada, T.},
  title     = {Generating Easy-to-Understand Referring Expressions for Target Identifications},
  booktitle = ICCV19,
  year      = {2019},
  pages     = {5793-5802},
  bibsource = {http://www.visionbib.com/bibliography/match607ic1.html#TT107120},
}

@inproceedings{bb110831,
  author    = {Aneja, J. and Agrawal, H. and Batra, D. and Schwing, A.G.},
  title     = {Sequential Latent Spaces for Modeling the Intention During Diverse Image Captioning},
  booktitle = ICCV19,
  year      = {2019},
  pages     = {4260-4269},
  bibsource = {http://www.visionbib.com/bibliography/match607ic1.html#TT107121},
}

@inproceedings{bb110832,
  author    = {Gupta, T. and Schwing, A.G. and Hoiem, D.},
  title     = {{ViCo}: Word Embeddings From Visual Co-Occurrences},
  booktitle = ICCV19,
  year      = {2019},
  pages     = {7424-7433},
  bibsource = {http://www.visionbib.com/bibliography/match607ic1.html#TT107122},
}

@inproceedings{bb110833,
  author    = {Deshpande, A. and Aneja, J. and Wang, L. and Schwing, A.G. and Forsyth, D.},
  title     = {Fast, Diverse and Accurate Image Captioning Guided by Part-Of-Speech},
  booktitle = CVPR19,
  year      = {2019},
  pages     = {10687-10696},
  bibsource = {http://www.visionbib.com/bibliography/match607ic1.html#TT107123},
}

@inproceedings{bb110834,
  author    = {Wei, H.Y. and Li, Z.X. and Zhang, C.L.},
  title     = {Image Captioning Based on Visual and Semantic Attention},
  booktitle = MMMod20,
  year      = {2020},
  pages     = {I:151-162},
  bibsource = {http://www.visionbib.com/bibliography/match607ic1.html#TT107124},
}

@inproceedings{bb110835,
  author    = {Dognin, P. and Melnyk, I. and Mroueh, Y. and Ross, J. and Sercu, T.},
  title     = {Adversarial Semantic Alignment for Improved Image Captions},
  booktitle = CVPR19,
  year      = {2019},
  pages     = {10455-10463},
  bibsource = {http://www.visionbib.com/bibliography/match607ic1.html#TT107125},
}

@inproceedings{bb110836,
  author    = {Fukui, H. and Hirakawa, T. and Yamashita, T. and Fujiyoshi, H.},
  title     = {Attention Branch Network: Learning of Attention Mechanism for Visual Explanation},
  booktitle = CVPR19,
  year      = {2019},
  pages     = {10697-10706},
  bibsource = {http://www.visionbib.com/bibliography/match607ic1.html#TT107126},
}

@inproceedings{bb110837,
  author    = {Biten, A.F. and Gomez, L. and Rusinol, M. and Karatzas, D.},
  title     = {Good News, Everyone! Context Driven Entity-Aware Captioning for News Images},
  booktitle = CVPR19,
  year      = {2019},
  pages     = {12458-12467},
  bibsource = {http://www.visionbib.com/bibliography/match607ic1.html#TT107127},
}

@inproceedings{bb110838,
  author    = {Suris, D. and Epstein, D. and Ji, H. and Chang, S.F. and Vondrick, C.},
  title     = {Learning to Learn Words from Visual Scenes},
  booktitle = ECCV20,
  year      = {2020},
  pages     = {XXIX:434-452},
  bibsource = {http://www.visionbib.com/bibliography/match607ic1.html#TT107128},
}

@inproceedings{bb110839,
  author    = {Akbari, H. and Karaman, S. and Bhargava, S. and Chen, B. and Vondrick, C. and Chang, S.F.},
  title     = {Multi-Level Multimodal Common Semantic Space for Image-Phrase Grounding},
  booktitle = CVPR19,
  year      = {2019},
  pages     = {12468-12478},
  bibsource = {http://www.visionbib.com/bibliography/match607ic1.html#TT107129},
}

@inproceedings{bb110840,
  author    = {Bracha, L. and Chechik, G.},
  title     = {Informative Object Annotations: Tell Me Something I Don't Know},
  booktitle = CVPR19,
  year      = {2019},
  pages     = {12499-12507},
  bibsource = {http://www.visionbib.com/bibliography/match607ic1.html#TT107130},
}

@inproceedings{bb110841,
  author    = {Shuster, K. and Humeau, S. and Hu, H. and Bordes, A. and Weston, J.},
  title     = {Engaging Image Captioning via Personality},
  booktitle = CVPR19,
  year      = {2019},
  pages     = {12508-12518},
  bibsource = {http://www.visionbib.com/bibliography/match607ic1.html#TT107131},
}

@inproceedings{bb110842,
  author    = {Feng, Y. and Ma, L. and Liu, W. and Luo, J.B.},
  title     = {Unsupervised Image Captioning},
  booktitle = CVPR19,
  year      = {2019},
  pages     = {4120-4129},
  bibsource = {http://www.visionbib.com/bibliography/match607ic1.html#TT107132},
}

@inproceedings{bb110843,
  author    = {Xu, Y. and Wu, B.Y. and Shen, F.M. and Fan, Y.B. and Zhang, Y. and Shen, H.T. and Liu, W.},
  title     = {Exact Adversarial Attack to Image Captioning via Structured Output Learning With Latent Variables},
  booktitle = CVPR19,
  year      = {2019},
  pages     = {4130-4139},
  bibsource = {http://www.visionbib.com/bibliography/match607ic1.html#TT107133},
}

@inproceedings{bb110844,
  author    = {Wang, Q.Z. and Chan, A.B.},
  title     = {Describing Like Humans: On Diversity in Image Captioning},
  booktitle = CVPR19,
  year      = {2019},
  pages     = {4190-4198},
  bibsource = {http://www.visionbib.com/bibliography/match607ic1.html#TT107134},
}

@inproceedings{bb110845,
  author    = {Guo, L.T. and Liu, J. and Yao, P. and Li, J.W. and Lu, H.Q.},
  title     = {{MSCap}: Multi-Style Image Captioning With Unpaired Stylized Text},
  booktitle = CVPR19,
  year      = {2019},
  pages     = {4199-4208},
  bibsource = {http://www.visionbib.com/bibliography/match607ic1.html#TT107135},
}

@inproceedings{bb110846,
  author    = {Zhang, L. and Zhang, J.M. and Lin, Z. and Lu, H.C. and He, Y.},
  title     = {{CapSal}: Leveraging Captioning to Boost Semantics for Salient Object Detection},
  booktitle = CVPR19,
  year      = {2019},
  pages     = {6017-6026},
  bibsource = {http://www.visionbib.com/bibliography/match607ic1.html#TT107136},
}

@inproceedings{bb110847,
  author    = {Yin, G.J. and Sheng, L. and Liu, B. and Yu, N.H. and Wang, X.G. and Shao, J.},
  title     = {Context and Attribute Grounded Dense Captioning},
  booktitle = CVPR19,
  year      = {2019},
  pages     = {6234-6243},
  bibsource = {http://www.visionbib.com/bibliography/match607ic1.html#TT107137},
}

@inproceedings{bb110848,
  author    = {Kim, D.J. and Choi, J. and Oh, T.H. and Kweon, I.S.},
  title     = {Dense Relational Captioning: Triple-Stream Networks for Relationship-Based Captioning},
  booktitle = CVPR19,
  year      = {2019},
  pages     = {6264-6273},
  bibsource = {http://www.visionbib.com/bibliography/match607ic1.html#TT107138},
}

@inproceedings{bb110849,
  author    = {Gao, J.L. and Wang, S. and Wang, S.S. and Ma, S.W. and Gao, W.},
  title     = {Self-Critical N-Step Training for Image Captioning},
  booktitle = CVPR19,
  year      = {2019},
  pages     = {6293-6301},
  bibsource = {http://www.visionbib.com/bibliography/match607ic1.html#TT107139},
}

@inproceedings{bb110850,
  author    = {Cornia, M. and Baraldi, L. and Cucchiara, R.},
  title     = {Show, Control and Tell: A Framework for Generating Controllable and Grounded Captions},
  booktitle = CVPR19,
  year      = {2019},
  pages     = {8299-8308},
  bibsource = {http://www.visionbib.com/bibliography/match607ic1.html#TT107140},
}

@inproceedings{bb110851,
  author    = {Qin, Y. and Du, J.J. and Zhang, Y. and Lu, H.T.},
  title     = {Look Back and Predict Forward in Image Captioning},
  booktitle = CVPR19,
  year      = {2019},
  pages     = {8359-8367},
  bibsource = {http://www.visionbib.com/bibliography/match607ic1.html#TT107141},
}

@inproceedings{bb110852,
  author    = {Zheng, Y. and Li, Y. and Wang, S.J.},
  title     = {Intention Oriented Image Captions With Guiding Objects},
  booktitle = CVPR19,
  year      = {2019},
  pages     = {8387-8396},
  bibsource = {http://www.visionbib.com/bibliography/match607ic1.html#TT107142},
}

@inproceedings{bb110853,
  author    = {Huang, Y. and Li, C. and Li, T. and Wan, W. and Chen, J.},
  title     = {Image Captioning with Attribute Refinement},
  booktitle = ICIP19,
  year      = {2019},
  pages     = {1820-1824},
  bibsource = {http://www.visionbib.com/bibliography/match607ic1.html#TT107143},
}

@inproceedings{bb110854,
  author    = {Lee, J. and Lee, Y. and Seong, S. and Kim, K. and Kim, S. and Kim, J.},
  title     = {Capturing Long-Range Dependencies in Video Captioning},
  booktitle = ICIP19,
  year      = {2019},
  pages     = {1880-1884},
  bibsource = {http://www.visionbib.com/bibliography/match607ic1.html#TT107144},
}

@inproceedings{bb110855,
  author    = {Shi, J. and Li, Y. and Wang, S.},
  title     = {Cascade Attention: Multiple Feature Based Learning for Image Captioning},
  booktitle = ICIP19,
  year      = {2019},
  pages     = {1970-1974},
  bibsource = {http://www.visionbib.com/bibliography/match607ic1.html#TT107145},
}

@inproceedings{bb110856,
  author    = {Wang, Y. and Shen, Y. and Xiong, H. and Lin, W.},
  title     = {Adaptive Hard Example Mining for Image Captioning},
  booktitle = ICIP19,
  year      = {2019},
  pages     = {3342-3346},
  bibsource = {http://www.visionbib.com/bibliography/match607ic1.html#TT107146},
}

@inproceedings{bb110857,
  author    = {Xiao, H. and Shi, J.},
  title     = {A Novel Attribute Selection Mechanism for Video Captioning},
  booktitle = ICIP19,
  year      = {2019},
  pages     = {619-623},
  bibsource = {http://www.visionbib.com/bibliography/match607ic1.html#TT107147},
}

@inproceedings{bb110858,
  author    = {Lim, J.H. and Chan, C.S.},
  title     = {Mask Captioning Network},
  booktitle = ICIP19,
  year      = {2019},
  pages     = {1-5},
  bibsource = {http://www.visionbib.com/bibliography/match607ic1.html#TT107148},
}

@inproceedings{bb110859,
  author    = {Wang, Q.Z. and Chan, A.B.},
  title     = {Gated Hierarchical Attention for Image Captioning},
  booktitle = ACCV18,
  year      = {2018},
  pages     = {IV:21-37},
  bibsource = {http://www.visionbib.com/bibliography/match607ic1.html#TT107149},
}

@inproceedings{bb110860,
  author    = {Wang, W. and Chen, Z.H. and Hu, H.F.},
  title     = {Multivariate Attention Network for Image Captioning},
  booktitle = ACCV18,
  year      = {2018},
  pages     = {VI:587-602},
  bibsource = {http://www.visionbib.com/bibliography/match607ic1.html#TT107150},
}

@inproceedings{bb110861,
  author    = {Ghanimifard, M. and Dobnik, S.},
  title     = {Knowing When to Look for What and Where: Evaluating Generation of Spatial Descriptions with Adaptive Attention},
  booktitle = VL18,
  year      = {2018},
  pages     = {IV:153-161},
  bibsource = {http://www.visionbib.com/bibliography/match607ic1.html#TT107151},
}

@inproceedings{bb110862,
  author    = {Kim, B. and Lee, Y.H. and Jung, H. and Cho, C.},
  title     = {Distinctive-Attribute Extraction for Image Captioning},
  booktitle = VL18,
  year      = {2018},
  pages     = {IV:133-144},
  bibsource = {http://www.visionbib.com/bibliography/match607ic1.html#TT107152},
}

@inproceedings{bb110863,
  author    = {Tanti, M. and Gatt, A. and Muscat, A.},
  title     = {Pre-gen Metrics: Predicting Caption Quality Metrics Without Generating Captions},
  booktitle = VL18,
  year      = {2018},
  pages     = {IV:114-123},
  bibsource = {http://www.visionbib.com/bibliography/match607ic1.html#TT107153},
}

@inproceedings{bb110864,
  author    = {Tanti, M. and Gatt, A. and Camilleri, K.P.},
  title     = {Quantifying the Amount of Visual Information Used by Neural Caption Generators},
  booktitle = VL18,
  year      = {2018},
  pages     = {IV:124-132},
  bibsource = {http://www.visionbib.com/bibliography/match607ic1.html#TT107154},
}

@inproceedings{bb110865,
  author    = {Ren, L. and Qi, G. and Hua, K.},
  title     = {Improving Diversity of Image Captioning Through Variational Autoencoders and Adversarial Learning},
  booktitle = WACV19,
  year      = {2019},
  pages     = {263-272},
  bibsource = {http://www.visionbib.com/bibliography/match607ic1.html#TT107155},
}

@inproceedings{bb110866,
  author    = {Zhou, Y. and Sun, Y. and Honavar, V.},
  title     = {Improving Image Captioning by Leveraging Knowledge Graphs},
  booktitle = WACV19,
  year      = {2019},
  pages     = {283-293},
  bibsource = {http://www.visionbib.com/bibliography/match607ic1.html#TT107156},
}

@inproceedings{bb110867,
  author    = {Rapson, C.J. and Seet, B. and Naeem, M.A. and Lee, J.E. and Al Sarayreh, M. and Klette, R.},
  title     = {Reducing the Pain: A Novel Tool for Efficient Ground-Truth Labelling in Images},
  booktitle = IVCNZ18,
  year      = {2018},
  pages     = {1-9},
  bibsource = {http://www.visionbib.com/bibliography/match607ic1.html#TT107157},
}

@inproceedings{bb110868,
  author    = {Lu, J.S. and Yang, J.W. and Batra, D. and Parikh, D.},
  title     = {Neural Baby Talk},
  booktitle = CVPR18,
  year      = {2018},
  pages     = {7219-7228},
  bibsource = {http://www.visionbib.com/bibliography/match607ic1.html#TT107158},
}

@inproceedings{bb110869,
  author    = {Wu, B.Y. and Chen, W.D. and Sun, P. and Liu, W. and Ghanem, B. and Lyu, S.W.},
  title     = {Tagging Like Humans: Diverse and Distinct Image Annotation},
  booktitle = CVPR18,
  year      = {2018},
  pages     = {7967-7975},
  bibsource = {http://www.visionbib.com/bibliography/match607ic1.html#TT107159},
}

@inproceedings{bb110870,
  author    = {Wu, X.J. and Zhang, L. and Li, F.Z. and Wang, B.J.},
  title     = {A Novel Model for Multi-label Image Annotation},
  booktitle = ICPR18,
  year      = {2018},
  pages     = {1953-1958},
  bibsource = {http://www.visionbib.com/bibliography/match607ic1.html#TT107160},
}

@inproceedings{bb110871,
  author    = {Jiu, M. and Sahbi, H. and Qi, L.},
  title     = {Deep Context Networks for Image Annotation},
  booktitle = ICPR18,
  year      = {2018},
  pages     = {2422-2427},
  bibsource = {http://www.visionbib.com/bibliography/match607ic1.html#TT107161},
}

@comment{NOTE(review): the PAGES end value 20248 in the entry below looks malformed (five digits, implying a range of roughly 18,000 pages). Presumably a typo carried over from the upstream record; verify against the proceedings before citing.}
@inproceedings{bb110872,
        AUTHOR = "Khademi, M. and Schulte, O.",
        TITLE = "Image Caption Generation with Hierarchical Contextual Visual Spatial
Attention",
        BOOKTITLE = Cognitive18,
        YEAR = "2018",
        PAGES = "2024-20248",
        BIBSOURCE = "http://www.visionbib.com/bibliography/match607ic1.html#TT107162"}

@inproceedings{bb110873,
  author    = {Yan, S. and Wu, F. and Smith, J.S. and Lu, W. and Zhang, B.},
  title     = {Image Captioning using Adversarial Networks and Reinforcement Learning},
  booktitle = ICPR18,
  year      = {2018},
  pages     = {248-253},
  bibsource = {http://www.visionbib.com/bibliography/match607ic1.html#TT107163},
}

@inproceedings{bb110874,
  author    = {Wang, F. and Gong, X. and Huang, L.},
  title     = {Time-Dependent Pre-attention Model for Image Captioning},
  booktitle = ICPR18,
  year      = {2018},
  pages     = {3297-3302},
  bibsource = {http://www.visionbib.com/bibliography/match607ic1.html#TT107164},
}

@inproceedings{bb110875,
  author    = {Luo, R. and Shakhnarovich, G. and Cohen, S. and Price, B.},
  title     = {Discriminability Objective for Training Descriptive Captions},
  booktitle = CVPR18,
  year      = {2018},
  pages     = {6964-6974},
  bibsource = {http://www.visionbib.com/bibliography/match607ic1.html#TT107165},
}

@inproceedings{bb110876,
  author    = {Cui, Y. and Yang, G. and Veit, A. and Huang, X. and Belongie, S.},
  title     = {Learning to Evaluate Image Captioning},
  booktitle = CVPR18,
  year      = {2018},
  pages     = {5804-5812},
  bibsource = {http://www.visionbib.com/bibliography/match607ic1.html#TT107166},
}

@inproceedings{bb110877,
  author    = {Aneja, J. and Deshpande, A. and Schwing, A.G.},
  title     = {Convolutional Image Captioning},
  booktitle = CVPR18,
  year      = {2018},
  pages     = {5561-5570},
  bibsource = {http://www.visionbib.com/bibliography/match607ic1.html#TT107167},
}

@inproceedings{bb110878,
  author    = {Chen, F. and Ji, R. and Sun, X. and Wu, Y. and Su, J.},
  title     = {{GroupCap}: Group-Based Image Captioning with Structured Relevance and Diversity Constraints},
  booktitle = CVPR18,
  year      = {2018},
  pages     = {1345-1353},
  bibsource = {http://www.visionbib.com/bibliography/match607ic1.html#TT107168},
}

@inproceedings{bb110879,
  author    = {Chen, X. and Ma, L. and Jiang, W. and Yao, J. and Liu, W.},
  title     = {Regularizing {RNNs} for Caption Generation by Reconstructing the Past with the Present},
  booktitle = CVPR18,
  year      = {2018},
  pages     = {7995-8003},
  bibsource = {http://www.visionbib.com/bibliography/match607ic1.html#TT107169},
}

@inproceedings{bb110880,
  author    = {Yao, T. and Pan, Y.W. and Li, Y. and Mei, T.},
  title     = {Exploring Visual Relationship for Image Captioning},
  booktitle = ECCV18,
  year      = {2018},
  pages     = {XIV:711-727},
  bibsource = {http://www.visionbib.com/bibliography/match607ic1.html#TT107170},
}

@inproceedings{bb110881,
  author    = {Shah, S.A.A.},
  title     = {{NNEval}: Neural Network Based Evaluation Metric for Image Captioning},
  booktitle = ECCV18,
  year      = {2018},
  pages     = {VIII:39-55},
  bibsource = {http://www.visionbib.com/bibliography/match607ic1.html#TT107171},
}

@inproceedings{bb110882,
  author    = {Jiang, W.H. and Ma, L. and Jiang, Y.G. and Liu, W. and Zhang, T.},
  title     = {Recurrent Fusion Network for Image Captioning},
  booktitle = ECCV18,
  year      = {2018},
  pages     = {II:510-526},
  bibsource = {http://www.visionbib.com/bibliography/match607ic1.html#TT107172},
}

@inproceedings{bb110883,
  author    = {Chatterjee, M. and Schwing, A.G.},
  title     = {Diverse and Coherent Paragraph Generation from Images},
  booktitle = ECCV18,
  year      = {2018},
  pages     = {II:747-763},
  bibsource = {http://www.visionbib.com/bibliography/match607ic1.html#TT107173},
}

@inproceedings{bb110884,
  author    = {Chen, S. and Zhao, Q.},
  title     = {Boosted Attention: Leveraging Human Attention for Image Captioning},
  booktitle = ECCV18,
  year      = {2018},
  pages     = {XI:72-88},
  bibsource = {http://www.visionbib.com/bibliography/match607ic1.html#TT107174},
}

@inproceedings{bb110885,
  author    = {Dai, B. and Ye, D. and Lin, D.},
  title     = {Rethinking the Form of Latent States in Image Captioning},
  booktitle = ECCV18,
  year      = {2018},
  pages     = {VI:294-310},
  bibsource = {http://www.visionbib.com/bibliography/match607ic1.html#TT107175},
}

@inproceedings{bb110886,
  author    = {Liu, X.H. and Li, H.S. and Shao, J. and Chen, D.P. and Wang, X.G.},
  title     = {Show, Tell and Discriminate: Image Captioning by Self-retrieval with Partially Labeled Data},
  booktitle = ECCV18,
  year      = {2018},
  pages     = {XV:353-369},
  bibsource = {http://www.visionbib.com/bibliography/match607ic1.html#TT107176},
}

@inproceedings{bb110887,
  author    = {Fang, F. and Wang, H. and Tang, P.},
  title     = {Image Captioning with Word Level Attention},
  booktitle = ICIP18,
  year      = {2018},
  pages     = {1278-1282},
  bibsource = {http://www.visionbib.com/bibliography/match607ic1.html#TT107177},
}

@inproceedings{bb110888,
  author    = {Zhu, Z. and Xue, Z. and Yuan, Z.},
  title     = {Topic-Guided Attention for Image Captioning},
  booktitle = ICIP18,
  year      = {2018},
  pages     = {2615-2619},
  bibsource = {http://www.visionbib.com/bibliography/match607ic1.html#TT107178},
}

@inproceedings{bb110889,
  author    = {Gomez Garay, A. and Raducanu, B. and Salas, J.},
  title     = {Dense Captioning of Natural Scenes in {Spanish}},
  booktitle = MCPR18,
  year      = {2018},
  pages     = {145-154},
  bibsource = {http://www.visionbib.com/bibliography/match607ic1.html#TT107179},
}

@inproceedings{bb110890,
  author    = {Yao, L. and Ballas, N. and Cho, K. and Smith, J. and Bengio, Y.},
  title     = {Oracle Performance for Visual Captioning},
  booktitle = BMVC16,
  year      = {2016},
  bibsource = {http://www.visionbib.com/bibliography/match607ic1.html#TT107180},
}

@inproceedings{bb110891,
  author    = {Khatchatoorian, A.G. and Jamzad, M.},
  title     = {Post Rectifying Methods to Improve the Accuracy of Image Annotation},
  booktitle = DICTA17,
  year      = {2017},
  pages     = {1-7},
  bibsource = {http://www.visionbib.com/bibliography/match607ic1.html#TT107181},
}

@inproceedings{bb110892,
  author    = {Dong, H. and Zhang, J.Q. and McIlwraith, D. and Guo, Y.},
  title     = {{I2T2I}: Learning text to image synthesis with textual data augmentation},
  booktitle = ICIP17,
  year      = {2017},
  pages     = {2015-2019},
  bibsource = {http://www.visionbib.com/bibliography/match607ic1.html#TT107182},
}

@inproceedings{bb110893,
  author    = {Pellegrin, L. and Escalante, H.J. and Montes y Gomez, M. and Villegas, M. and Gonzalez, F.A.},
  title     = {A Flexible Framework for the Evaluation of Unsupervised Image Annotation},
  booktitle = CIARP17,
  year      = {2017},
  pages     = {508-516},
  bibsource = {http://www.visionbib.com/bibliography/match607ic1.html#TT107183},
}

@inproceedings{bb110894,
  author    = {Jia, Y.H. and Bai, L. and Wang, P. and Guo, J.L. and Xie, Y.X.},
  title     = {Deep Convolutional Neural Network for Correlating Images and Sentences},
  booktitle = MMMod18,
  year      = {2018},
  pages     = {I:154-165},
  bibsource = {http://www.visionbib.com/bibliography/match607ic1.html#TT107184},
}

@inproceedings{bb110895,
  author    = {Liu, J.Y. and Wang, L. and Yang, M.H.},
  title     = {Referring Expression Generation and Comprehension via Attributes},
  booktitle = ICCV17,
  year      = {2017},
  pages     = {4866-4874},
  bibsource = {http://www.visionbib.com/bibliography/match607ic1.html#TT107185},
}

@inproceedings{bb110896,
  author    = {Dai, B. and Fidler, S. and Urtasun, R. and Lin, D.},
  title     = {Towards Diverse and Natural Image Descriptions via a Conditional {GAN}},
  booktitle = ICCV17,
  year      = {2017},
  pages     = {2989-2998},
  bibsource = {http://www.visionbib.com/bibliography/match607ic1.html#TT107186},
}

@inproceedings{bb110897,
  author    = {Niu, Z.X. and Zhou, M. and Wang, L. and Gao, X. and Hua, G.},
  title     = {Hierarchical Multimodal {LSTM} for Dense Visual-Semantic Embedding},
  booktitle = ICCV17,
  year      = {2017},
  pages     = {1899-1907},
  bibsource = {http://www.visionbib.com/bibliography/match607ic1.html#TT107187},
}

@inproceedings{bb110898,
  author    = {Liang, X. and Hu, Z. and Zhang, H. and Gan, C. and Xing, E.P.},
  title     = {Recurrent Topic-Transition {GAN} for Visual Paragraph Generation},
  booktitle = ICCV17,
  year      = {2017},
  pages     = {3382-3391},
  bibsource = {http://www.visionbib.com/bibliography/match607ic1.html#TT107188},
}

@inproceedings{bb110899,
  author    = {Shetty, R. and Rohrbach, M. and Hendricks, L.A. and Fritz, M. and Schiele, B.},
  title     = {Speaking the Same Language: Matching Machine to Human Captions by Adversarial Training},
  booktitle = ICCV17,
  year      = {2017},
  pages     = {4155-4164},
  bibsource = {http://www.visionbib.com/bibliography/match607ic1.html#TT107189},
}

Last update: