@inproceedings{bb95500,
        AUTHOR = "Ren, L. and Qi, G. and Hua, K.",
        TITLE = "Improving Diversity of Image Captioning Through Variational
Autoencoders and Adversarial Learning",
        BOOKTITLE = WACV19,
        YEAR = "2019",
        PAGES = "263--272",
        BIBSOURCE = "http://www.visionbib.com/bibliography/match607ic1.html#TT92018"}

@inproceedings{bb95501,
        AUTHOR = "Zhou, Y. and Sun, Y. and Honavar, V.",
        TITLE = "Improving Image Captioning by Leveraging Knowledge Graphs",
        BOOKTITLE = WACV19,
        YEAR = "2019",
        PAGES = "283--293",
        BIBSOURCE = "http://www.visionbib.com/bibliography/match607ic1.html#TT92019"}

@inproceedings{bb95502,
        AUTHOR = "Rapson, C. J. and Seet, B. and Naeem, M. A. and Lee, J. E. and Al Sarayreh, M. and Klette, R.",
        TITLE = "Reducing the Pain: A Novel Tool for Efficient Ground-Truth Labelling
in Images",
        BOOKTITLE = IVCNZ18,
        YEAR = "2018",
        PAGES = "1--9",
        BIBSOURCE = "http://www.visionbib.com/bibliography/match607ic1.html#TT92020"}

@inproceedings{bb95503,
        AUTHOR = "Lu, J. S. and Yang, J. W. and Batra, D. and Parikh, D.",
        TITLE = "Neural Baby Talk",
        BOOKTITLE = CVPR18,
        YEAR = "2018",
        PAGES = "7219--7228",
        BIBSOURCE = "http://www.visionbib.com/bibliography/match607ic1.html#TT92021"}

@inproceedings{bb95504,
        AUTHOR = "Wu, B. Y. and Chen, W. D. and Sun, P. and Liu, W. and Ghanem, B. and Lyu, S. W.",
        TITLE = "Tagging Like Humans: Diverse and Distinct Image Annotation",
        BOOKTITLE = CVPR18,
        YEAR = "2018",
        PAGES = "7967--7975",
        BIBSOURCE = "http://www.visionbib.com/bibliography/match607ic1.html#TT92022"}

@inproceedings{bb95505,
        AUTHOR = "Wu, X. J. and Zhang, L. and Li, F. Z. and Wang, B. J.",
        TITLE = "A Novel Model for Multi-label Image Annotation",
        BOOKTITLE = ICPR18,
        YEAR = "2018",
        PAGES = "1953--1958",
        BIBSOURCE = "http://www.visionbib.com/bibliography/match607ic1.html#TT92023"}

@inproceedings{bb95506,
        AUTHOR = "Jiu, M. and Sahbi, H. and Qi, L.",
        TITLE = "Deep Context Networks for Image Annotation",
        BOOKTITLE = ICPR18,
        YEAR = "2018",
        PAGES = "2422--2427",
        BIBSOURCE = "http://www.visionbib.com/bibliography/match607ic1.html#TT92024"}

% NOTE(review): the end page 20248 is implausible for a range starting at 2024
% (it would span roughly 18000 pages) -- looks like a typo; verify against the
% publisher record before citing.
@inproceedings{bb95507,
        AUTHOR = "Khademi, M. and Schulte, O.",
        TITLE = "Image Caption Generation with Hierarchical Contextual Visual Spatial
Attention",
        BOOKTITLE = Cognitive18,
        YEAR = "2018",
        PAGES = "2024--20248",
        BIBSOURCE = "http://www.visionbib.com/bibliography/match607ic1.html#TT92025"}

@inproceedings{bb95508,
        AUTHOR = "Yan, S. and Wu, F. and Smith, J. S. and Lu, W. and Zhang, B.",
        TITLE = "Image Captioning using Adversarial Networks and Reinforcement
Learning",
        BOOKTITLE = ICPR18,
        YEAR = "2018",
        PAGES = "248--253",
        BIBSOURCE = "http://www.visionbib.com/bibliography/match607ic1.html#TT92026"}

@inproceedings{bb95509,
        AUTHOR = "Wang, F. and Gong, X. and Huang, L.",
        TITLE = "Time-Dependent Pre-attention Model for Image Captioning",
        BOOKTITLE = ICPR18,
        YEAR = "2018",
        PAGES = "3297--3302",
        BIBSOURCE = "http://www.visionbib.com/bibliography/match607ic1.html#TT92027"}

@inproceedings{bb95510,
        AUTHOR = "Luo, R. and Shakhnarovich, G. and Cohen, S. and Price, B.",
        TITLE = "Discriminability Objective for Training Descriptive Captions",
        BOOKTITLE = CVPR18,
        YEAR = "2018",
        PAGES = "6964--6974",
        BIBSOURCE = "http://www.visionbib.com/bibliography/match607ic1.html#TT92028"}

@inproceedings{bb95511,
        AUTHOR = "Cui, Y. and Yang, G. and Veit, A. and Huang, X. and Belongie, S.",
        TITLE = "Learning to Evaluate Image Captioning",
        BOOKTITLE = CVPR18,
        YEAR = "2018",
        PAGES = "5804--5812",
        BIBSOURCE = "http://www.visionbib.com/bibliography/match607ic1.html#TT92029"}

@inproceedings{bb95512,
        AUTHOR = "Aneja, J. and Deshpande, A. and Schwing, A. G.",
        TITLE = "Convolutional Image Captioning",
        BOOKTITLE = CVPR18,
        YEAR = "2018",
        PAGES = "5561--5570",
        BIBSOURCE = "http://www.visionbib.com/bibliography/match607ic1.html#TT92030"}

@inproceedings{bb95513,
        AUTHOR = "Chen, F. and Ji, R. and Sun, X. and Wu, Y. and Su, J.",
        TITLE = "{GroupCap}: Group-Based Image Captioning with Structured Relevance and
Diversity Constraints",
        BOOKTITLE = CVPR18,
        YEAR = "2018",
        PAGES = "1345--1353",
        BIBSOURCE = "http://www.visionbib.com/bibliography/match607ic1.html#TT92031"}

@inproceedings{bb95514,
        AUTHOR = "Chen, X. and Ma, L. and Jiang, W. and Yao, J. and Liu, W.",
        TITLE = "Regularizing {RNNs} for Caption Generation by Reconstructing the Past
with the Present",
        BOOKTITLE = CVPR18,
        YEAR = "2018",
        PAGES = "7995--8003",
        BIBSOURCE = "http://www.visionbib.com/bibliography/match607ic1.html#TT92032"}

@inproceedings{bb95515,
        AUTHOR = "Yao, T. and Pan, Y. W. and Li, Y. and Mei, T.",
        TITLE = "Exploring Visual Relationship for Image Captioning",
        BOOKTITLE = ECCV18,
        YEAR = "2018",
        PAGES = "XIV: 711--727",
        BIBSOURCE = "http://www.visionbib.com/bibliography/match607ic1.html#TT92033"}

@inproceedings{bb95516,
        AUTHOR = "Shah, S. A. A.",
        TITLE = "{NNEval}: Neural Network Based Evaluation Metric for Image Captioning",
        BOOKTITLE = ECCV18,
        YEAR = "2018",
        PAGES = "VIII: 39--55",
        BIBSOURCE = "http://www.visionbib.com/bibliography/match607ic1.html#TT92034"}

@inproceedings{bb95517,
        AUTHOR = "Jiang, W. H. and Ma, L. and Jiang, Y. G. and Liu, W. and Zhang, T.",
        TITLE = "Recurrent Fusion Network for Image Captioning",
        BOOKTITLE = ECCV18,
        YEAR = "2018",
        PAGES = "II: 510--526",
        BIBSOURCE = "http://www.visionbib.com/bibliography/match607ic1.html#TT92035"}

@inproceedings{bb95518,
        AUTHOR = "Chatterjee, M. and Schwing, A. G.",
        TITLE = "Diverse and Coherent Paragraph Generation from Images",
        BOOKTITLE = ECCV18,
        YEAR = "2018",
        PAGES = "II: 747--763",
        BIBSOURCE = "http://www.visionbib.com/bibliography/match607ic1.html#TT92036"}

@inproceedings{bb95519,
        AUTHOR = "Chen, S. and Zhao, Q.",
        TITLE = "Boosted Attention: Leveraging Human Attention for Image Captioning",
        BOOKTITLE = ECCV18,
        YEAR = "2018",
        PAGES = "XI: 72--88",
        BIBSOURCE = "http://www.visionbib.com/bibliography/match607ic1.html#TT92037"}

@inproceedings{bb95520,
        AUTHOR = "Dai, B. and Ye, D. and Lin, D.",
        TITLE = "Rethinking the Form of Latent States in Image Captioning",
        BOOKTITLE = ECCV18,
        YEAR = "2018",
        PAGES = "VI: 294--310",
        BIBSOURCE = "http://www.visionbib.com/bibliography/match607ic1.html#TT92038"}

@inproceedings{bb95521,
        AUTHOR = "Liu, X. and Li, H. S. and Shao, J. and Chen, D. P. and Wang, X. G.",
        TITLE = "Show, Tell and Discriminate:
Image Captioning by Self-retrieval with Partially Labeled Data",
        BOOKTITLE = ECCV18,
        YEAR = "2018",
        PAGES = "XV: 353--369",
        BIBSOURCE = "http://www.visionbib.com/bibliography/match607ic1.html#TT92039"}

@inproceedings{bb95522,
        AUTHOR = "Fang, F. and Wang, H. and Tang, P.",
        TITLE = "Image Captioning with Word Level Attention",
        BOOKTITLE = ICIP18,
        YEAR = "2018",
        PAGES = "1278--1282",
        BIBSOURCE = "http://www.visionbib.com/bibliography/match607ic1.html#TT92040"}

@inproceedings{bb95523,
        AUTHOR = "Zhu, Z. and Xue, Z. and Yuan, Z.",
        TITLE = "Topic-Guided Attention for Image Captioning",
        BOOKTITLE = ICIP18,
        YEAR = "2018",
        PAGES = "2615--2619",
        BIBSOURCE = "http://www.visionbib.com/bibliography/match607ic1.html#TT92041"}

@inproceedings{bb95524,
        AUTHOR = "Gomez Garay, A. and Raducanu, B. and Salas, J.",
        TITLE = "Dense Captioning of Natural Scenes in {Spanish}",
        BOOKTITLE = MCPR18,
        YEAR = "2018",
        PAGES = "145--154",
        BIBSOURCE = "http://www.visionbib.com/bibliography/match607ic1.html#TT92042"}

% Page numbers unknown: the placeholder value xx-yy was dropped so that it is
% not printed verbatim in the bibliography.
@inproceedings{bb95525,
        AUTHOR = "Yao, L. and Ballas, N. and Cho, K. and Smith, J. and Bengio, Y.",
        TITLE = "Oracle Performance for Visual Captioning",
        BOOKTITLE = BMVC16,
        YEAR = "2016",
        BIBSOURCE = "http://www.visionbib.com/bibliography/match607ic1.html#TT92043"}

@inproceedings{bb95526,
        AUTHOR = "Khatchatoorian, A. G. and Jamzad, M.",
        TITLE = "Post Rectifying Methods to Improve the Accuracy of Image Annotation",
        BOOKTITLE = DICTA17,
        YEAR = "2017",
        PAGES = "1--7",
        BIBSOURCE = "http://www.visionbib.com/bibliography/match607ic1.html#TT92044"}

@inproceedings{bb95527,
        AUTHOR = "Dong, H. and Zhang, J. Q. and McIlwraith, D. and Guo, Y.",
        TITLE = "{I2T2I}: Learning text to image synthesis with textual data
augmentation",
        BOOKTITLE = ICIP17,
        YEAR = "2017",
        PAGES = "2015--2019",
        BIBSOURCE = "http://www.visionbib.com/bibliography/match607ic1.html#TT92045"}

% The compound surname is braced: unbraced, BibTeX reads the lowercase "y" as
% the end of a von-part and takes only "Gomez" as the last name.
@inproceedings{bb95528,
        AUTHOR = "Pellegrin, L. and Escalante, H. J. and {Montes y Gomez}, M. and Villegas, M. and Gonzalez, F. A.",
        TITLE = "A Flexible Framework for the Evaluation of Unsupervised Image
Annotation",
        BOOKTITLE = CIARP17,
        YEAR = "2017",
        PAGES = "508--516",
        BIBSOURCE = "http://www.visionbib.com/bibliography/match607ic1.html#TT92046"}

@inproceedings{bb95529,
        AUTHOR = "Jia, Y. H. and Bai, L. and Wang, P. and Guo, J. L. and Xie, Y. X.",
        TITLE = "Deep Convolutional Neural Network for Correlating Images and Sentences",
        BOOKTITLE = MMMod18,
        YEAR = "2018",
        PAGES = "I:154--165",
        BIBSOURCE = "http://www.visionbib.com/bibliography/match607ic1.html#TT92047"}

@inproceedings{bb95530,
        AUTHOR = "Liu, J. Y. and Wang, L. and Yang, M. H.",
        TITLE = "Referring Expression Generation and Comprehension via Attributes",
        BOOKTITLE = ICCV17,
        YEAR = "2017",
        PAGES = "4866--4874",
        BIBSOURCE = "http://www.visionbib.com/bibliography/match607ic1.html#TT92048"}

@inproceedings{bb95531,
        AUTHOR = "Dai, B. and Fidler, S. and Urtasun, R. and Lin, D.",
        TITLE = "Towards Diverse and Natural Image Descriptions via a Conditional {GAN}",
        BOOKTITLE = ICCV17,
        YEAR = "2017",
        PAGES = "2989--2998",
        BIBSOURCE = "http://www.visionbib.com/bibliography/match607ic1.html#TT92049"}

@inproceedings{bb95532,
        AUTHOR = "Niu, Z. X. and Zhou, M. and Wang, L. and Gao, X. and Hua, G.",
        TITLE = "Hierarchical Multimodal {LSTM} for Dense Visual-Semantic Embedding",
        BOOKTITLE = ICCV17,
        YEAR = "2017",
        PAGES = "1899--1907",
        BIBSOURCE = "http://www.visionbib.com/bibliography/match607ic1.html#TT92050"}

@inproceedings{bb95533,
        AUTHOR = "Liang, X. and Hu, Z. and Zhang, H. and Gan, C. and Xing, E. P.",
        TITLE = "Recurrent Topic-Transition {GAN} for Visual Paragraph Generation",
        BOOKTITLE = ICCV17,
        YEAR = "2017",
        PAGES = "3382--3391",
        BIBSOURCE = "http://www.visionbib.com/bibliography/match607ic1.html#TT92051"}

@inproceedings{bb95534,
        AUTHOR = "Shetty, R. and Rohrbach, M. and Hendricks, L. A. and Fritz, M. and Schiele, B.",
        TITLE = "Speaking the Same Language:
Matching Machine to Human Captions by Adversarial Training",
        BOOKTITLE = ICCV17,
        YEAR = "2017",
        PAGES = "4155--4164",
        BIBSOURCE = "http://www.visionbib.com/bibliography/match607ic1.html#TT92052"}

@inproceedings{bb95535,
        AUTHOR = "Liu, S. and Zhu, Z. and Ye, N. and Guadarrama, S. and Murphy, K.",
        TITLE = "Improved Image Captioning via Policy Gradient optimization of {SPIDEr}",
        BOOKTITLE = ICCV17,
        YEAR = "2017",
        PAGES = "873--881",
        BIBSOURCE = "http://www.visionbib.com/bibliography/match607ic1.html#TT92053"}

@inproceedings{bb95536,
        AUTHOR = "Gu, J. X. and Joty, S. and Cai, J. F. and Wang, G.",
        TITLE = "Unpaired Image Captioning by Language Pivoting",
        BOOKTITLE = ECCV18,
        YEAR = "2018",
        PAGES = "I: 519--535",
        BIBSOURCE = "http://www.visionbib.com/bibliography/match607ic1.html#TT92054"}

@inproceedings{bb95537,
        AUTHOR = "Gu, J. X. and Wang, G. and Cai, J. F. and Chen, T.",
        TITLE = "An Empirical Study of Language {CNN} for Image Captioning",
        BOOKTITLE = ICCV17,
        YEAR = "2017",
        PAGES = "1231--1240",
        BIBSOURCE = "http://www.visionbib.com/bibliography/match607ic1.html#TT92055"}

@inproceedings{bb95538,
        AUTHOR = "Pedersoli, M. and Lucas, T. and Schmid, C. and Verbeek, J.",
        TITLE = "Areas of Attention for Image Captioning",
        BOOKTITLE = ICCV17,
        YEAR = "2017",
        PAGES = "1251--1259",
        BIBSOURCE = "http://www.visionbib.com/bibliography/match607ic1.html#TT92056"}

@inproceedings{bb95539,
        AUTHOR = "Li, Y. and Ouyang, W. and Zhou, B. and Wang, K. and Wang, X.",
        TITLE = "Scene Graph Generation from Objects, Phrases and Region Captions",
        BOOKTITLE = ICCV17,
        YEAR = "2017",
        PAGES = "1270--1279",
        BIBSOURCE = "http://www.visionbib.com/bibliography/match607ic1.html#TT92057"}

@inproceedings{bb95540,
        AUTHOR = "Zhang, Z. and Wu, J. J. and Li, Q. and Huang, Z. and Traer, J. and McDermott, J. H. and Tenenbaum, J. B. and Freeman, W. T.",
        TITLE = "Generative Modeling of Audible Shapes for Object Perception",
        BOOKTITLE = ICCV17,
        YEAR = "2017",
        PAGES = "1260--1269",
        BIBSOURCE = "http://www.visionbib.com/bibliography/match607ic1.html#TT92058"}

@inproceedings{bb95541,
        AUTHOR = "Liu, Z. J. and Freeman, W. T. and Tenenbaum, J. B. and Wu, J. J.",
        TITLE = "Physical Primitive Decomposition",
        BOOKTITLE = ECCV18,
        YEAR = "2018",
        PAGES = "XII: 3--20",
        BIBSOURCE = "http://www.visionbib.com/bibliography/match607ic1.html#TT92059"}

% Page numbers unknown: the placeholder value xx-yy was dropped so that it is
% not printed verbatim in the bibliography.
@inproceedings{bb95542,
        AUTHOR = "Wu, J. J. and Lim, J. and Zhang, H. Y. and Tenenbaum, J. B. and Freeman, W. T.",
        TITLE = "Physics 101: Learning Physical Object Properties from Unlabeled Videos",
        BOOKTITLE = BMVC16,
        YEAR = "2016",
        BIBSOURCE = "http://www.visionbib.com/bibliography/match607ic1.html#TT92060"}

% NOTE(review): first author's surname corrected from "Tavakoliy"; the trailing
% "y" looks like a footnote-marker artefact -- confirm against the paper.
@inproceedings{bb95543,
        AUTHOR = "Tavakoli, H. R. and Shetty, R. and Borji, A. and Laaksonen, J.",
        TITLE = "Paying Attention to Descriptions Generated by Image Captioning Models",
        BOOKTITLE = ICCV17,
        YEAR = "2017",
        PAGES = "2506--2515",
        BIBSOURCE = "http://www.visionbib.com/bibliography/match607ic1.html#TT92061"}

@inproceedings{bb95544,
        AUTHOR = "Chen, T. H. and Liao, Y. H. and Chuang, C. Y. and Hsu, W. T. and Fu, J. and Sun, M.",
        TITLE = "Show, Adapt and Tell:
Adversarial Training of Cross-Domain Image Captioner",
        BOOKTITLE = ICCV17,
        YEAR = "2017",
        PAGES = "521--530",
        BIBSOURCE = "http://www.visionbib.com/bibliography/match607ic1.html#TT92062"}

@inproceedings{bb95545,
        AUTHOR = "Tripathi, A. and Gupta, A. and Chaudhary, S. and Lall, B.",
        TITLE = "Image Annotation Using Latent Components and Transmedia Association",
        BOOKTITLE = PReMI17,
        YEAR = "2017",
        PAGES = "493--500",
        BIBSOURCE = "http://www.visionbib.com/bibliography/match607ic1.html#TT92063"}

@inproceedings{bb95546,
        AUTHOR = "Pini, S. and Cornia, M. and Baraldi, L. and Cucchiara, R.",
        TITLE = "Towards Video Captioning with Naming:
A Novel Dataset and a Multi-modal Approach",
        BOOKTITLE = CIAP17,
        YEAR = "2017",
        PAGES = "II:384--395",
        BIBSOURCE = "http://www.visionbib.com/bibliography/match607ic1.html#TT92064"}

@inproceedings{bb95547,
        AUTHOR = "Wu, B. Y. and Jia, F. and Liu, W. and Ghanem, B.",
        TITLE = "Diverse Image Annotation",
        BOOKTITLE = CVPR17,
        YEAR = "2017",
        PAGES = "6194--6202",
        BIBSOURCE = "http://www.visionbib.com/bibliography/match607ic1.html#TT92065"}

@inproceedings{bb95548,
        AUTHOR = "Krause, J. and Johnson, J. and Krishna, R. and Fei Fei, L.",
        TITLE = "A Hierarchical Approach for Generating Descriptive Image Paragraphs",
        BOOKTITLE = CVPR17,
        YEAR = "2017",
        PAGES = "3337--3345",
        BIBSOURCE = "http://www.visionbib.com/bibliography/match607ic1.html#TT92066"}

@inproceedings{bb95549,
        AUTHOR = "Vedantam, R. and Bengio, S. and Murphy, K. and Parikh, D. and Chechik, G.",
        TITLE = "Context-Aware Captions from Context-Agnostic Supervision",
        BOOKTITLE = CVPR17,
        YEAR = "2017",
        PAGES = "1070--1079",
        BIBSOURCE = "http://www.visionbib.com/bibliography/match607ic1.html#TT92067"}

@inproceedings{bb95550,
        AUTHOR = "Gan, Z. and Gan, C. and He, X. and Pu, Y. and Tran, K. and Gao, J. and Carin, L. and Deng, L.",
        TITLE = "Semantic Compositional Networks for Visual Captioning",
        BOOKTITLE = CVPR17,
        YEAR = "2017",
        PAGES = "1141--1150",
        BIBSOURCE = "http://www.visionbib.com/bibliography/match607ic1.html#TT92068"}

@inproceedings{bb95551,
        AUTHOR = "Ren, Z. and Wang, X. and Zhang, N. and Lv, X. and Li, L. J.",
        TITLE = "Deep Reinforcement Learning-Based Image Captioning with Embedding
Reward",
        BOOKTITLE = CVPR17,
        YEAR = "2017",
        PAGES = "1151--1159",
        BIBSOURCE = "http://www.visionbib.com/bibliography/match607ic1.html#TT92069"}

@inproceedings{bb95552,
        AUTHOR = "Rennie, S. J. and Marcheret, E. and Mroueh, Y. and Ross, J. and Goel, V.",
        TITLE = "Self-Critical Sequence Training for Image Captioning",
        BOOKTITLE = CVPR17,
        YEAR = "2017",
        PAGES = "1179--1195",
        BIBSOURCE = "http://www.visionbib.com/bibliography/match607ic1.html#TT92070"}

@inproceedings{bb95553,
        AUTHOR = "Yang, L. and Tang, K. and Yang, J. and Li, L. J.",
        TITLE = "Dense Captioning with Joint Inference and Visual Context",
        BOOKTITLE = CVPR17,
        YEAR = "2017",
        PAGES = "1978--1987",
        BIBSOURCE = "http://www.visionbib.com/bibliography/match607ic1.html#TT92071"}

@inproceedings{bb95554,
        AUTHOR = "Lu, J. and Xiong, C. and Parikh, D. and Socher, R.",
        TITLE = "Knowing When to Look: Adaptive Attention via a Visual Sentinel for
Image Captioning",
        BOOKTITLE = CVPR17,
        YEAR = "2017",
        PAGES = "3242--3250",
        BIBSOURCE = "http://www.visionbib.com/bibliography/match607ic1.html#TT92072"}

@inproceedings{bb95555,
        AUTHOR = "Yao, T. and Pan, Y. and Li, Y. and Mei, T.",
        TITLE = "Incorporating Copying Mechanism in Image Captioning for Learning
Novel Objects",
        BOOKTITLE = CVPR17,
        YEAR = "2017",
        PAGES = "5263--5271",
        BIBSOURCE = "http://www.visionbib.com/bibliography/match607ic1.html#TT92073"}

@inproceedings{bb95556,
        AUTHOR = "Chen, L. and Zhang, H. and Xiao, J. and Nie, L. and Shao, J. and Liu, W. and Chua, T. S.",
        TITLE = "{SCA-CNN}: Spatial and Channel-Wise Attention in Convolutional Networks
for Image Captioning",
        BOOKTITLE = CVPR17,
        YEAR = "2017",
        PAGES = "6298--6306",
        BIBSOURCE = "http://www.visionbib.com/bibliography/match607ic1.html#TT92074"}

@inproceedings{bb95557,
        AUTHOR = "Sun, Q. and Lee, S. and Batra, D.",
        TITLE = "Bidirectional Beam Search: Forward-Backward Inference in Neural
Sequence Models for Fill-in-the-Blank Image Captioning",
        BOOKTITLE = CVPR17,
        YEAR = "2017",
        PAGES = "7215--7223",
        BIBSOURCE = "http://www.visionbib.com/bibliography/match607ic1.html#TT92075"}

@inproceedings{bb95558,
        AUTHOR = "Wang, Y. and Lin, Z. and Shen, X. and Cohen, S. and Cottrell, G. W.",
        TITLE = "Skeleton Key: Image Captioning by Skeleton-Attribute Decomposition",
        BOOKTITLE = CVPR17,
        YEAR = "2017",
        PAGES = "7378--7387",
        BIBSOURCE = "http://www.visionbib.com/bibliography/match607ic1.html#TT92076"}

@inproceedings{bb95559,
        AUTHOR = "Zanfir, M. and Marinoiu, E. and Sminchisescu, C.",
        TITLE = "Spatio-Temporal Attention Models for Grounded Video Captioning",
        BOOKTITLE = ACCV16,
        YEAR = "2016",
        PAGES = "IV: 104--119",
        BIBSOURCE = "http://www.visionbib.com/bibliography/match607ic1.html#TT92077"}

@inproceedings{bb95560,
        AUTHOR = "Chen, T. H. and Zeng, K. H. and Hsu, W. T. and Sun, M.",
        TITLE = "Video Captioning via Sentence Augmentation and Spatio-Temporal
Attention",
        BOOKTITLE = Assist16,
        YEAR = "2016",
        PAGES = "I: 269--286",
        BIBSOURCE = "http://www.visionbib.com/bibliography/match607ic1.html#TT92078"}

@inproceedings{bb95561,
        AUTHOR = "Tan, Y. H. and Chan, C. S.",
        TITLE = "{phi-LSTM}: A Phrase-Based Hierarchical {LSTM} Model for Image Captioning",
        BOOKTITLE = ACCV16,
        YEAR = "2016",
        PAGES = "V: 101--117",
        BIBSOURCE = "http://www.visionbib.com/bibliography/match607ic1.html#TT92079"}

@inproceedings{bb95562,
        AUTHOR = "Weiland, L. and Hulpus, I. and Ponzetto, S. P. and Dietz, L.",
        TITLE = "Using Object Detection, {NLP}, and Knowledge Bases to Understand the
Message of Images",
        BOOKTITLE = MMMod17,
        YEAR = "2017",
        PAGES = "II: 405--418",
        BIBSOURCE = "http://www.visionbib.com/bibliography/match607ic1.html#TT92080"}

@inproceedings{bb95563,
        AUTHOR = "Liu, Y. and Guo, Y. M. and Lew, M. S.",
        TITLE = "What Convnets Make for Image Captioning?",
        BOOKTITLE = MMMod17,
        YEAR = "2017",
        PAGES = "I: 416--428",
        BIBSOURCE = "http://www.visionbib.com/bibliography/match607ic1.html#TT92081"}

@inproceedings{bb95564,
        AUTHOR = "Tran, K. and He, X. and Zhang, L. and Sun, J.",
        TITLE = "Rich Image Captioning in the Wild",
        BOOKTITLE = DeepLearn-C16,
        YEAR = "2016",
        PAGES = "434--441",
        BIBSOURCE = "http://www.visionbib.com/bibliography/match607ic1.html#TT92082"}

@inproceedings{bb95565,
        AUTHOR = "Wang, Y. L. and Wang, S. H. and Tang, J. L. and Liu, H. and Li, B. X.",
        TITLE = "{PPP}: Joint Pointwise and Pairwise Image Label Prediction",
        BOOKTITLE = CVPR16,
        YEAR = "2016",
        PAGES = "6005--6013",
        BIBSOURCE = "http://www.visionbib.com/bibliography/match607ic1.html#TT92083"}

@inproceedings{bb95566,
        AUTHOR = "Yatskar, M. and Ordonez, V. and Zettlemoyer, L. and Farhadi, A.",
        TITLE = "Commonly Uncommon: Semantic Sparsity in Situation Recognition",
        BOOKTITLE = CVPR17,
        YEAR = "2017",
        PAGES = "6335--6344",
        BIBSOURCE = "http://www.visionbib.com/bibliography/match607ic1.html#TT92084"}

@inproceedings{bb95567,
        AUTHOR = "Yatskar, M. and Zettlemoyer, L. and Farhadi, A.",
        TITLE = "Situation Recognition: Visual Semantic Role Labeling for Image
Understanding",
        BOOKTITLE = CVPR16,
        YEAR = "2016",
        PAGES = "5534--5542",
        BIBSOURCE = "http://www.visionbib.com/bibliography/match607ic1.html#TT92085"}

@inproceedings{bb95568,
        AUTHOR = "Kottur, S. and Vedantam, R. and Moura, J. M. F. and Parikh, D.",
        TITLE = "{VisualWord2Vec} ({Vis-W2V}):
Learning Visually Grounded Word Embeddings Using Abstract Scenes",
        BOOKTITLE = CVPR16,
        YEAR = "2016",
        PAGES = "4985--4994",
        BIBSOURCE = "http://www.visionbib.com/bibliography/match607ic1.html#TT92086"}

@inproceedings{bb95569,
        AUTHOR = "Zhu, Y. and Groth, O. and Bernstein, M. and Fei Fei, L.",
        TITLE = "{Visual7W}: Grounded Question Answering in Images",
        BOOKTITLE = CVPR16,
        YEAR = "2016",
        PAGES = "4995--5004",
        BIBSOURCE = "http://www.visionbib.com/bibliography/match607ic1.html#TT92087"}

@inproceedings{bb95570,
        AUTHOR = "Zhang, P. and Goyal, Y. and Summers Stay, D. and Batra, D. and Parikh, D.",
        TITLE = "Yin and Yang: Balancing and Answering Binary Visual Questions",
        BOOKTITLE = CVPR16,
        YEAR = "2016",
        PAGES = "5014--5022",
        BIBSOURCE = "http://www.visionbib.com/bibliography/match607ic1.html#TT92088"}

@inproceedings{bb95571,
        AUTHOR = "Venugopalan, S. and Hendricks, L. A. and Rohrbach, M. and Mooney, R. and Darrell, T. J. and Saenko, K.",
        TITLE = "Captioning Images with Diverse Objects",
        BOOKTITLE = CVPR17,
        YEAR = "2017",
        PAGES = "1170--1178",
        BIBSOURCE = "http://www.visionbib.com/bibliography/match607ic1.html#TT92089"}

@inproceedings{bb95572,
        AUTHOR = "Hendricks, L. A. and Venugopalan, S. and Rohrbach, M. and Mooney, R. and Saenko, K. and Darrell, T. J.",
        TITLE = "Deep Compositional Captioning: Describing Novel Object Categories
without Paired Training Data",
        BOOKTITLE = CVPR16,
        YEAR = "2016",
        PAGES = "1--10",
        BIBSOURCE = "http://www.visionbib.com/bibliography/match607ic1.html#TT92090"}

@inproceedings{bb95573,
        AUTHOR = "Johnson, J. and Karpathy, A. and Fei Fei, L.",
        TITLE = "{DenseCap}:
Fully Convolutional Localization Networks for Dense Captioning",
        BOOKTITLE = CVPR16,
        YEAR = "2016",
        PAGES = "4565--4574",
        BIBSOURCE = "http://www.visionbib.com/bibliography/match607ic1.html#TT92091"}

@inproceedings{bb95574,
        AUTHOR = "Wang, M. and Song, L. and Yang, X. K. and Luo, C. F.",
        TITLE = "A parallel-fusion {RNN-LSTM} architecture for image caption generation",
        BOOKTITLE = ICIP16,
        YEAR = "2016",
        PAGES = "4448--4452",
        BIBSOURCE = "http://www.visionbib.com/bibliography/match607ic1.html#TT92092"}

@inproceedings{bb95575,
        AUTHOR = "Lin, X. and Parikh, D.",
        TITLE = "Leveraging Visual Question Answering for Image-Caption Ranking",
        BOOKTITLE = ECCV16,
        YEAR = "2016",
        PAGES = "II: 261--277",
        BIBSOURCE = "http://www.visionbib.com/bibliography/match607ic1.html#TT92093"}

@inproceedings{bb95576,
        AUTHOR = "Lin, X. and Parikh, D.",
        TITLE = "Don't just listen, use your imagination:
Leveraging visual common sense for non-visual tasks",
        BOOKTITLE = CVPR15,
        YEAR = "2015",
        PAGES = "2984--2993",
        BIBSOURCE = "http://www.visionbib.com/bibliography/match607ic1.html#TT92094"}

@inproceedings{bb95577,
        AUTHOR = "Chen, T. L. and Zhang, Z. P. and You, Q. Z. and Fang, C. and Wang, Z. W. and Jin, H. L. and Luo, J. B.",
        TITLE = "'Factual' or 'Emotional':
Stylized Image Captioning with Adaptive Learning and Attention",
        BOOKTITLE = ECCV18,
        YEAR = "2018",
        PAGES = "X: 527--543",
        BIBSOURCE = "http://www.visionbib.com/bibliography/match607ic1.html#TT92095"}

@inproceedings{bb95578,
        AUTHOR = "You, Q. Z. and Jin, H. L. and Wang, Z. W. and Fang, C. and Luo, J. B.",
        TITLE = "Image Captioning with Semantic Attention",
        BOOKTITLE = CVPR16,
        YEAR = "2016",
        PAGES = "4651--4659",
        BIBSOURCE = "http://www.visionbib.com/bibliography/match607ic1.html#TT92096"}

@inproceedings{bb95579,
        AUTHOR = "Jia, X. and Gavves, E. and Fernando, B. and Tuytelaars, T.",
        TITLE = "Guiding the Long-Short Term Memory Model for Image Caption Generation",
        BOOKTITLE = ICCV15,
        YEAR = "2015",
        PAGES = "2407--2415",
        BIBSOURCE = "http://www.visionbib.com/bibliography/match607ic1.html#TT92097"}

@inproceedings{bb95580,
        AUTHOR = "Chen, X. L. and Zitnick, C. L.",
        TITLE = "Mind's eye:
A recurrent visual representation for image caption generation",
        BOOKTITLE = CVPR15,
        YEAR = "2015",
        PAGES = "2422--2431",
        BIBSOURCE = "http://www.visionbib.com/bibliography/match607ic1.html#TT92098"}

@inproceedings{bb95581,
        AUTHOR = "Vedantam, R. and Zitnick, C. L. and Parikh, D.",
        TITLE = "{CIDEr}: Consensus-based image description evaluation",
        BOOKTITLE = CVPR15,
        YEAR = "2015",
        PAGES = "4566--4575",
        BIBSOURCE = "http://www.visionbib.com/bibliography/match607ic1.html#TT92099"}

@inproceedings{bb95582,
        AUTHOR = "Fang, H. and Gupta, S. and Iandola, F. and Srivastava, R. K. and Deng, L. and Dollar, P. and Gao, J. F. and He, X. D. and Mitchell, M. and Platt, J. C. and Zitnick, C. L. and Zweig, G.",
        TITLE = "From captions to visual concepts and back",
        BOOKTITLE = CVPR15,
        YEAR = "2015",
        PAGES = "1473--1482",
        BIBSOURCE = "http://www.visionbib.com/bibliography/match607ic1.html#TT92100"}

@inproceedings{bb95583,
        AUTHOR = "Ramnath, K. and Baker, S. and Vanderwende, L. and El Saban, M. and Sinha, S. N. and Kannan, A. and Hassan, N. and Galley, M. and Yang, Y. and Ramanan, D. and Bergamo, A. and Torresani, L.",
        TITLE = "{AutoCaption}: Automatic caption generation for personal photos",
        BOOKTITLE = WACV14,
        YEAR = "2014",
        PAGES = "1050--1057",
        BIBSOURCE = "http://www.visionbib.com/bibliography/match607ic1.html#TT92101"}

% NOTE(review): this entry has no YEAR field, which the entry type requires.
% The CMU-CS-TR venue code suggests a technical report, so a report entry type
% may fit better -- confirm the year and report number against the source.
@inproceedings{bb95584,
        AUTHOR = "Pan, J. Y. and Yang, H. J. and Faloutsos, C.",
        TITLE = "{MMSS}: Graph-based Multi-modal Story-oriented Video Summarization and
Retrieval",
        BOOKTITLE = CMU-CS-TR,
        BIBSOURCE = "http://www.visionbib.com/bibliography/match607ic1.html#TT92102"}

@inproceedings{bb95585,
        AUTHOR = "Pan, J. Y. and Yang, H. J. and Faloutsos, C. and Duygulu, P.",
        TITLE = "{GCap}: Graph-based Automatic Image Captioning",
        BOOKTITLE = MMDE04,
        YEAR = "2004",
        PAGES = "146",
        BIBSOURCE = "http://www.visionbib.com/bibliography/match607ic1.html#TT92103"}

% NOTE(review): entry bb95587 repeats this author, title, year and BIBSOURCE
% anchor and differs only in BOOKTITLE (CMU-CS here, Ph.D. there) -- presumably
% the report and thesis forms of one work; confirm whether both keys are needed.
@inproceedings{bb95586,
        AUTHOR = "Pan, J. Y.",
        TITLE = "Advanced Tools for Video and Multimedia Mining",
        BOOKTITLE = CMU-CS,
        YEAR = "2006",
        BIBSOURCE = "http://www.visionbib.com/bibliography/match607ic1.html#TT92104"}

% NOTE(review): entry bb95586 repeats this author, title, year and BIBSOURCE
% anchor and differs only in BOOKTITLE (Ph.D. here, CMU-CS there). The Ph.D.
% venue code suggests a thesis entry type would fit better -- confirm the
% school before converting.
@inproceedings{bb95587,
        AUTHOR = "Pan, J. Y.",
        TITLE = "Advanced Tools for Video and Multimedia Mining",
        BOOKTITLE = Ph.D.,
        YEAR = "2006",
        BIBSOURCE = "http://www.visionbib.com/bibliography/match607ic1.html#TT92104"}

@article{bb95588,
        AUTHOR = "Suetens, P. and Fua, P. V. and Hanson, A. J.",
        TITLE = "Some Computational Strategies for Object Recognition",
        JOURNAL = Surveys,
        VOLUME = "24",
        YEAR = "1992",
        NUMBER = "1",
        MONTH = mar,
        PAGES = "5--62",
        BIBSOURCE = "http://www.visionbib.com/bibliography/match607.html#TT92105"}

@article{bb95589,
        AUTHOR = "Lindenbaum, M.",
        TITLE = "Bounds on Shape-Recognition Performance",
        JOURNAL = PAMI,
        VOLUME = "17",
        YEAR = "1995",
        NUMBER = "7",
        MONTH = jul,
        PAGES = "666--680",
        BIBSOURCE = "http://www.visionbib.com/bibliography/match607.html#TT92106"}

@article{bb95590,
        AUTHOR = "Lindenbaum, M. and Ben David, S.",
        TITLE = "{VC}-Dimension Analysis of Object Recognition Tasks",
        JOURNAL = JMIV,
        VOLUME = "10",
        YEAR = "1999",
        NUMBER = "1",
        MONTH = jan,
        PAGES = "27--49",
        BIBSOURCE = "http://www.visionbib.com/bibliography/match607.html#TT92107"}

@inproceedings{bb95591,
        AUTHOR = "Lindenbaum, M. and Ben David, S.",
        TITLE = "Applying {VC}-Dimension Analysis to Object Recognition",
        BOOKTITLE = ECCV94,
        YEAR = "1994",
        PAGES = "A:237--250",
        BIBSOURCE = "http://www.visionbib.com/bibliography/match607.html#TT92108"}

@inproceedings{bb95592,
        AUTHOR = "Lindenbaum, M. and Ben David, S.",
        TITLE = "Applying {VC}-Dimension Analysis to {3D} Object Recognition from
Perspective Projections",
        BOOKTITLE = AAAI-94,
        YEAR = "1994",
        PAGES = "985--991",
        BIBSOURCE = "http://www.visionbib.com/bibliography/match607.html#TT92109"}

@article{bb95593,
        AUTHOR = "Shum, H. Y. and Ikeuchi, K. and Reddy, R.",
        TITLE = "Principal Component Analysis with Missing Data and Its
Application to Polyhedral Object Modeling",
        JOURNAL = PAMI,
        VOLUME = "17",
        YEAR = "1995",
        NUMBER = "9",
        MONTH = sep,
        PAGES = "854--867",
        BIBSOURCE = "http://www.visionbib.com/bibliography/match607.html#TT92110"}

% PAGES holds a chapter label ("Chapter I-1"), not a page range, so its hyphen
% is intentionally left as a single hyphen.
@inproceedings{bb95594,
        AUTHOR = "Reddy, R. and Ikeuchi, K. and Shum, H. Y.",
        TITLE = "Principal Component Analysis with Missing Data and Its
Application to Polyhedral Object Modeling",
        BOOKTITLE = MfR01,
        YEAR = "2001",
        PAGES = "Chapter I-1",
        BIBSOURCE = "http://www.visionbib.com/bibliography/match607.html#TT92110"}

@inproceedings{bb95595,
        AUTHOR = "Shum, H. Y. and Ikeuchi, K. and Reddy, R.",
        TITLE = "Principal Component Analysis with Missing Data and Its
Application to Object Modeling",
        BOOKTITLE = CVPR94,
        YEAR = "1994",
        PAGES = "560--565",
        BIBSOURCE = "http://www.visionbib.com/bibliography/match607.html#TT92111"}

@inproceedings{bb95596,
        AUTHOR = "Shum, H. Y. and Ikeuchi, K. and Reddy, R.",
        TITLE = "Virtual Reality Modeling from a Sequence of Range Images",
        BOOKTITLE = ARPA94,
        YEAR = "1994",
        PAGES = "II:1189--1198",
        BIBSOURCE = "http://www.visionbib.com/bibliography/match607.html#TT92112"}

@article{bb95597,
        AUTHOR = "Liu, G. and Haralick, R. M.",
        TITLE = "Optimal matching problem in detection and recognition:
Performance Evaluation",
        JOURNAL = PR,
        VOLUME = "35",
        YEAR = "2002",
        NUMBER = "10",
        MONTH = oct,
        PAGES = "2125--2139",
        BIBSOURCE = "http://www.visionbib.com/bibliography/match607.html#TT92113"}

@article{bb95598,
        AUTHOR = "Kay, S. M. and Gabriel, J. R.",
        TITLE = "An invariance property of the generalized likelihood ratio test",
        JOURNAL = SPLetters,
        VOLUME = "10",
        YEAR = "2003",
        NUMBER = "12",
        MONTH = dec,
        PAGES = "352--355",
        BIBSOURCE = "http://www.visionbib.com/bibliography/match607.html#TT92114"}

@article{bb95599,
        AUTHOR = "Li, H. Z. and Liu, Z. Q. A. and Zhu, X. H.",
        TITLE = "Hidden {Markov} models with factored {Gaussian} mixtures densities",
        JOURNAL = PR,
        VOLUME = "38",
        YEAR = "2005",
        NUMBER = "11",
        MONTH = nov,
        PAGES = "2022--2031",
        BIBSOURCE = "http://www.visionbib.com/bibliography/match607.html#TT92115"}

Last update: Oct 1, 2019 at 15:23:24