% ICPR98 paper. The proceedings volume is kept in VOLUME so PAGES holds only the en-dash page range.
@inproceedings{bb120800,
        AUTHOR = "Takahashi, T. and Nakanishi, S. and Kuno, Y. and Shirai, Y.",
        TITLE = "Helping Computer Vision by Verbal and Nonverbal Communication",
        BOOKTITLE = ICPR98,
        VOLUME = "II",
        YEAR = "1998",
        PAGES = "1216--1218",
        BIBSOURCE = "http://www.visionbib.com/bibliography/match605.html#TT116920"}

% IJCAI97 paper. The system name is braced so sentence-casing styles keep its capitals.
@inproceedings{bb120801,
        AUTHOR = "Satoh, S. and Nakamura, Y. and Kanade, T.",
        TITLE = "{Name-It}: Naming and Detecting Faces in Video by the Integration of Image and Natural Language Processing",
        BOOKTITLE = IJCAI97,
        YEAR = "1997",
        PAGES = "1488--1495",
        BIBSOURCE = "http://www.visionbib.com/bibliography/match605.html#TT116921"}

% CVPR97 paper. The system name is brace-protected; PAGES is an en-dash range.
@inproceedings{bb120802,
        AUTHOR = "Satoh, S. and Kanade, T.",
        TITLE = "{Name-It}: Association Of Face And Name In Video",
        BOOKTITLE = CVPR97,
        YEAR = "1997",
        PAGES = "368--373",
        BIBSOURCE = "http://www.visionbib.com/bibliography/match605.html#TT116922"}

% ICIP96 paper. The proceedings volume is kept in VOLUME; initials are spaced so each is its own name token.
@inproceedings{bb120803,
        AUTHOR = "Socher, G. and Sagerer, G. F. and Kummert, F. and Fuhr, T.",
        TITLE = "Talking About {3D} Scenes: Integration of Image and Speech Understanding in a Hybrid Distributed System",
        BOOKTITLE = ICIP96,
        VOLUME = "II",
        YEAR = "1996",
        PAGES = "809--812",
        BIBSOURCE = "http://www.visionbib.com/bibliography/match605.html#TT116923"}

% Journal article. JOURNAL is the bare macro RA, which must be defined elsewhere in the database.
@article{bb120804,
        AUTHOR = "Kuniyoshi, Y. and Inaba, M. and Inoue, H.",
        TITLE = "Learning by Watching: Extracting Reusable Task Knowledge from Visual Observation of Human Performance",
        JOURNAL = RA,
        VOLUME = "10",
        YEAR = "1994",
        PAGES = "799--822",
        BIBSOURCE = "http://www.visionbib.com/bibliography/match606.html#TT116924"}

% ECCV92 paper. PAGES is an en-dash range.
@inproceedings{bb120805,
        AUTHOR = "Kuniyoshi, Y. and Inoue, H.",
        TITLE = "Indexicality and dynamic attention control in qualitative recognition of assembly actions",
        BOOKTITLE = ECCV92,
        YEAR = "1992",
        PAGES = "874--878",
        BIBSOURCE = "http://www.visionbib.com/bibliography/match606.html#TT116925"}

% IJCV article. MONTH uses the standard jun macro.
% NOTE(review): PAGES is still the xx-yy placeholder from the source data; look up the real page range.
@article{bb120806,
        AUTHOR = "Porway, J. and Wang, Q. C. and Zhu, S. C.",
        TITLE = "A Hierarchical and Contextual Model for Aerial Image Parsing",
        JOURNAL = IJCV,
        VOLUME = "88",
        YEAR = "2010",
        NUMBER = "2",
        MONTH = jun,
        PAGES = "xx-yy",
        BIBSOURCE = "http://www.visionbib.com/bibliography/match606.html#TT116926"}

% CVPR08 paper. PAGES is an en-dash range; initials are spaced for name parsing.
@inproceedings{bb120807,
        AUTHOR = "Porway, J. and Wang, K. and Yao, B. and Zhu, S. C.",
        TITLE = "A hierarchical and contextual model for aerial image understanding",
        BOOKTITLE = CVPR08,
        YEAR = "2008",
        PAGES = "1--8",
        BIBSOURCE = "http://www.visionbib.com/bibliography/match606.html#TT116927"}

% CVPR09 paper. PAGES is an en-dash range; initials are spaced for name parsing.
@inproceedings{bb120808,
        AUTHOR = "Si, Z. Z. and Gong, H. F. and Wu, Y. N. and Zhu, S. C.",
        TITLE = "Learning mixed templates for object recognition",
        BOOKTITLE = CVPR09,
        YEAR = "2009",
        PAGES = "272--279",
        BIBSOURCE = "http://www.visionbib.com/bibliography/match606.html#TT116928"}

% PAMI article. MONTH uses the oct macro; the acronym 3D is brace-protected against sentence-casing.
@article{bb120809,
        AUTHOR = "Tu, Z. W. and Bai, X.",
        TITLE = "Auto-Context and Its Application to High-Level Vision Tasks and {3D} Brain Image Segmentation",
        JOURNAL = PAMI,
        VOLUME = "32",
        YEAR = "2010",
        NUMBER = "10",
        MONTH = oct,
        PAGES = "1744--1757",
        BIBSOURCE = "http://www.visionbib.com/bibliography/match606.html#TT116929"}

% CVPR08 paper. PAGES is an en-dash range; initials are spaced for name parsing.
@inproceedings{bb120810,
        AUTHOR = "Tu, Z. W.",
        TITLE = "Auto-context and its application to high-level vision tasks",
        BOOKTITLE = CVPR08,
        YEAR = "2008",
        PAGES = "1--8",
        BIBSOURCE = "http://www.visionbib.com/bibliography/match606.html#TT116930"}

% WACV19 paper. PAGES is an en-dash range; initials are spaced for name parsing.
@inproceedings{bb120811,
        AUTHOR = "Jones, J. and Hager, G. D. and Khudanpur, S.",
        TITLE = "Toward Computer Vision Systems That Understand Real-World Assembly Processes",
        BOOKTITLE = WACV19,
        YEAR = "2019",
        PAGES = "426--434",
        BIBSOURCE = "http://www.visionbib.com/bibliography/match606.html#TT116931"}

% CVPR08 paper. PAGES is an en-dash range; initials are spaced for name parsing.
@inproceedings{bb120812,
        AUTHOR = "Lampert, C. H.",
        TITLE = "Partitioning of image datasets using discriminative context information",
        BOOKTITLE = CVPR08,
        YEAR = "2008",
        PAGES = "1--8",
        BIBSOURCE = "http://www.visionbib.com/bibliography/match606.html#TT116932"}

% ICCV88 paper. PAGES is an en-dash range; initials are spaced for name parsing.
@inproceedings{bb120813,
        AUTHOR = "Hansen, C. and Henderson, T. C.",
        TITLE = "Towards the Automatic Generation of Recognition Strategies",
        BOOKTITLE = ICCV88,
        YEAR = "1988",
        PAGES = "275--279",
        BIBSOURCE = "http://www.visionbib.com/bibliography/match606.html#TT116933"}

% ICPR88 paper. The proceedings volume is kept in VOLUME so PAGES holds only the en-dash page range.
@inproceedings{bb120814,
        AUTHOR = "Cantoni, V. and Cei, U. and Ferretti, M. and Lombardi, L.",
        TITLE = "Towards an Automatic Construction of Object Recognition Strategies",
        BOOKTITLE = ICPR88,
        VOLUME = "I",
        YEAR = "1988",
        PAGES = "371--374",
        BIBSOURCE = "http://www.visionbib.com/bibliography/match606.html#TT116934"}

% CIAP89 paper. PAGES is an en-dash range.
@inproceedings{bb120815,
        AUTHOR = "Cova, G. and Griffini, A. and Lombardi, L.",
        TITLE = "Object Recognition Strategy in a Multi-Resolution System",
        BOOKTITLE = CIAP89,
        YEAR = "1989",
        PAGES = "729--733",
        BIBSOURCE = "http://www.visionbib.com/bibliography/match606.html#TT116935"}

% PAMI article. MONTH uses the apr macro; PAGES is an en-dash range.
@article{bb120816,
        AUTHOR = "Feng, Y. S. and Lapata, M.",
        TITLE = "Automatic Caption Generation for News Images",
        JOURNAL = PAMI,
        VOLUME = "35",
        YEAR = "2013",
        NUMBER = "4",
        MONTH = apr,
        PAGES = "797--812",
        BIBSOURCE = "http://www.visionbib.com/bibliography/match607ic1.html#TT116936"}

% IEICE article. MONTH uses the jul macro; PAGES is an en-dash range.
@article{bb120817,
        AUTHOR = "Nakayama, H. and Harada, T. and Kuniyoshi, Y.",
        TITLE = "Dense Sampling Low-Level Statistics of Local Features",
        JOURNAL = IEICE,
        VOLUME = "E93-D",
        YEAR = "2010",
        NUMBER = "7",
        MONTH = jul,
        PAGES = "1727--1736",
        BIBSOURCE = "http://www.visionbib.com/bibliography/match607ic1.html#TT116937"}

% CIVR09 paper with the same title and BIBSOURCE anchor as the IEICE article bb120817.
% NOTE(review): the author order here is the reverse of bb120817 -- confirm against the proceedings.
@inproceedings{bb120818,
  author    = {Kuniyoshi, Y. and Harada, T. and Nakayama, H.},
  title     = {Dense Sampling Low-Level Statistics of Local Features},
  booktitle = CIVR09,
  pages     = {Article No 17},
  year      = {2009},
  bibsource = {http://www.visionbib.com/bibliography/match607ic1.html#TT116937}
}

% CVPR10 paper. The proper name Gaussian is brace-protected; PAGES is an en-dash range.
@inproceedings{bb120819,
        AUTHOR = "Nakayama, H. and Harada, T. and Kuniyoshi, Y.",
        TITLE = "Global {Gaussian} approach for scene categorization using information geometry",
        BOOKTITLE = CVPR10,
        YEAR = "2010",
        PAGES = "2336--2343",
        BIBSOURCE = "http://www.visionbib.com/bibliography/match607ic1.html#TT116938"}

% CRV09 paper. The system name is braced so a sentence-casing style cannot turn AI into Ai.
@inproceedings{bb120820,
        AUTHOR = "Nakayama, H. and Harada, T. and Kuniyoshi, Y.",
        TITLE = "{AI Goggles}: Real-time Description and Retrieval in the Real World with Online Learning",
        BOOKTITLE = CRV09,
        YEAR = "2009",
        PAGES = "184--191",
        BIBSOURCE = "http://www.visionbib.com/bibliography/match607ic1.html#TT116939"}

% ICCV15 paper. PAGES is an en-dash range; the title is kept on one line.
@inproceedings{bb120821,
        AUTHOR = "Ushiku, Y. and Yamaguchi, M. and Mukuta, Y. and Harada, T.",
        TITLE = "Common Subspace for Model and Similarity: Phrase Learning for Caption Generation from Images",
        BOOKTITLE = ICCV15,
        YEAR = "2015",
        PAGES = "2668--2676",
        BIBSOURCE = "http://www.visionbib.com/bibliography/match607ic1.html#TT116940"}

% ICPR16 paper. PAGES is an en-dash range; the title is kept on one line.
@inproceedings{bb120822,
        AUTHOR = "Jin, J. and Nakayama, H.",
        TITLE = "Annotation order matters: Recurrent Image Annotator for arbitrary length image tagging",
        BOOKTITLE = ICPR16,
        YEAR = "2016",
        PAGES = "2452--2457",
        BIBSOURCE = "http://www.visionbib.com/bibliography/match607ic1.html#TT116941"}

% ECCV10 paper. The proceedings volume is kept in VOLUME so PAGES holds only the en-dash page range.
@inproceedings{bb120823,
        AUTHOR = "Harada, T. and Nakayama, H. and Kuniyoshi, Y.",
        TITLE = "Improving Local Descriptors by Embedding Global and Local Spatial Information",
        BOOKTITLE = ECCV10,
        VOLUME = "IV",
        YEAR = "2010",
        PAGES = "736--749",
        BIBSOURCE = "http://www.visionbib.com/bibliography/match607ic1.html#TT116942"}

% BMVC10 paper.
% NOTE(review): pages is the xx-yy placeholder from the source data; the real page range needs looking up.
@inproceedings{bb120824,
  author    = {Nakayama, H. and Harada, T. and Kuniyoshi, Y.},
  title     = {Evaluation of dimensionality reduction methods for image auto-annotation},
  booktitle = BMVC10,
  pages     = {xx-yy},
  year      = {2010},
  bibsource = {http://www.visionbib.com/bibliography/match607ic1.html#TT116943}
}

% Journal article (bare macro IP). MONTH uses the feb macro; PAGES is an en-dash range.
@article{bb120825,
        AUTHOR = "Tariq, A. and Foroosh, H.",
        TITLE = "A Context-Driven Extractive Framework for Generating Realistic Image Descriptions",
        JOURNAL = IP,
        VOLUME = "26",
        YEAR = "2017",
        NUMBER = "2",
        MONTH = feb,
        PAGES = "619--632",
        BIBSOURCE = "http://www.visionbib.com/bibliography/match607ic1.html#TT116944"}

% PAMI article. The acronym MSCOCO is brace-protected; MONTH uses the apr macro.
@article{bb120826,
        AUTHOR = "Vinyals, O. and Toshev, A. and Bengio, S. and Erhan, D.",
        TITLE = "Show and Tell: Lessons Learned from the 2015 {MSCOCO} Image Captioning Challenge",
        JOURNAL = PAMI,
        VOLUME = "39",
        YEAR = "2017",
        NUMBER = "4",
        MONTH = apr,
        PAGES = "652--663",
        BIBSOURCE = "http://www.visionbib.com/bibliography/match607ic1.html#TT116945"}

% CVPR15 paper. PAGES is an en-dash range.
@inproceedings{bb120827,
        AUTHOR = "Vinyals, O. and Toshev, A. and Bengio, S. and Erhan, D.",
        TITLE = "Show and tell: A neural image caption generator",
        BOOKTITLE = CVPR15,
        YEAR = "2015",
        PAGES = "3156--3164",
        BIBSOURCE = "http://www.visionbib.com/bibliography/match607ic1.html#TT116946"}

% Journal article (bare macro AI). PAGES is an en-dash range; initials are spaced for name parsing.
@article{bb120828,
        AUTHOR = "Wang, J. Y. and Zhu, X. T. and Gong, S. G.",
        TITLE = "Discovering visual concept structure with sparse and incomplete tags",
        JOURNAL = AI,
        VOLUME = "250",
        YEAR = "2017",
        NUMBER = "1",
        PAGES = "16--36",
        BIBSOURCE = "http://www.visionbib.com/bibliography/match607ic1.html#TT116947"}

% Journal article (bare macro IET-CV). MONTH uses the sep macro; initials are spaced for name parsing.
@article{bb120829,
        AUTHOR = "Kilickaya, M. and Akkus, B. K. and Cakici, R. and Erdem, A. and Erdem, E. and Ikizler Cinbis, N.",
        TITLE = "Data-driven image captioning via salient region discovery",
        JOURNAL = IET-CV,
        VOLUME = "11",
        YEAR = "2017",
        NUMBER = "6",
        MONTH = sep,
        PAGES = "398--406",
        BIBSOURCE = "http://www.visionbib.com/bibliography/match607ic1.html#TT116948"}

% Journal article (bare macro SPMag). MONTH uses the nov macro; PAGES is an en-dash range.
@article{bb120830,
        AUTHOR = "He, X. D. and Deng, L.",
        TITLE = "Deep Learning for Image-to-Text Generation: A Technical Overview",
        JOURNAL = SPMag,
        VOLUME = "34",
        YEAR = "2017",
        NUMBER = "6",
        MONTH = nov,
        PAGES = "109--116",
        BIBSOURCE = "http://www.visionbib.com/bibliography/match607ic1.html#TT116949"}

% Same title and BIBSOURCE anchor as bb120830, one issue later and a single page.
% NOTE(review): presumably a follow-up notice to bb120830 -- confirm before citing as a separate work.
@article{bb120831,
        AUTHOR = "Deng, L. and He, X. D.",
        TITLE = "Deep Learning for Image-to-Text Generation: A Technical Overview",
        JOURNAL = SPMag,
        VOLUME = "35",
        YEAR = "2018",
        NUMBER = "1",
        MONTH = jan,
        PAGES = "178",
        BIBSOURCE = "http://www.visionbib.com/bibliography/match607ic1.html#TT116949"}

% Journal article (bare macro MultMed). The acronym GLA is braced so sentence-casing cannot lowercase it.
@article{bb120832,
        AUTHOR = "Li, L. H. and Tang, S. and Zhang, Y. D. and Deng, L. X. and Tian, Q.",
        TITLE = "{GLA}: Global-Local Attention for Image Description",
        JOURNAL = MultMed,
        VOLUME = "20",
        YEAR = "2018",
        NUMBER = "3",
        MONTH = mar,
        PAGES = "726--737",
        BIBSOURCE = "http://www.visionbib.com/bibliography/match607ic1.html#TT116950"}

% Journal article (bare macro GeoRS). MONTH uses the apr macro; PAGES is an en-dash range.
@article{bb120833,
        AUTHOR = "Lu, X. and Wang, B. and Zheng, X. and Li, X.",
        TITLE = "Exploring Models and Data for Remote Sensing Image Caption Generation",
        JOURNAL = GeoRS,
        VOLUME = "56",
        YEAR = "2018",
        NUMBER = "4",
        MONTH = apr,
        PAGES = "2183--2195",
        BIBSOURCE = "http://www.visionbib.com/bibliography/match607ic1.html#TT116951"}

% Journal article (bare macro PR). PAGES is an en-dash range; initials are spaced for name parsing.
@article{bb120834,
        AUTHOR = "Cheng, Q. and Zhang, Q. and Fu, P. and Tu, C. H. and Li, S.",
        TITLE = "A survey and analysis on automatic image annotation",
        JOURNAL = PR,
        VOLUME = "79",
        YEAR = "2018",
        PAGES = "242--259",
        BIBSOURCE = "http://www.visionbib.com/bibliography/match607ic1.html#TT116952"}

% Journal article (bare macro SIViP). VA-Files is brace-protected; MONTH uses the jul macro.
@article{bb120835,
        AUTHOR = "Ben Rejeb, I. and Ouni, S. and Barhoumi, W. and Zagrouba, E.",
        TITLE = "Fuzzy {VA-Files} for multi-label image annotation based on visual content of regions",
        JOURNAL = SIViP,
        VOLUME = "12",
        YEAR = "2018",
        NUMBER = "5",
        MONTH = jul,
        PAGES = "877--884",
        BIBSOURCE = "http://www.visionbib.com/bibliography/match607ic1.html#TT116953"}

% Journal article (bare macro IJIG). MONTH uses the jul macro; PAGES carries an article identifier, not a range.
@article{bb120836,
        AUTHOR = "Helmy, T.",
        TITLE = "A Generic Framework for Semantic Annotation of Images",
        JOURNAL = IJIG,
        VOLUME = "18",
        YEAR = "2018",
        NUMBER = "3",
        MONTH = jul,
        PAGES = "Article 1850013",
        BIBSOURCE = "http://www.visionbib.com/bibliography/match607ic1.html#TT116954"}

% Journal article (bare macro SP:IC). PAGES is an en-dash range; initials are spaced for name parsing.
@article{bb120837,
        AUTHOR = "Wu, C. L. and Wei, Y. W. and Chu, X. L. and Su, F. and Wang, L. Q.",
        TITLE = "Modeling visual and word-conditional semantic attention for image captioning",
        JOURNAL = SP:IC,
        VOLUME = "67",
        YEAR = "2018",
        PAGES = "100--107",
        BIBSOURCE = "http://www.visionbib.com/bibliography/match607ic1.html#TT116955"}

% Journal article (bare macro IP). MONTH uses the jan macro; PAGES is an en-dash range.
@article{bb120838,
        AUTHOR = "Zhang, M. and Yang, Y. and Zhang, H. and Ji, Y. and Shen, H. T. and Chua, T.",
        TITLE = "More is Better: Precise and Detailed Image Captioning Using Online Positive Recall and Missing Concepts Mining",
        JOURNAL = IP,
        VOLUME = "28",
        YEAR = "2019",
        NUMBER = "1",
        MONTH = jan,
        PAGES = "32--44",
        BIBSOURCE = "http://www.visionbib.com/bibliography/match607ic1.html#TT116956"}

% Journal article (bare macro JVCIR). PAGES is an en-dash range; initials are spaced for name parsing.
@article{bb120839,
        AUTHOR = "Hu, J. and Lam, K. M. and Lou, P. and Liu, Q. and Deng, W. P.",
        TITLE = "Can a machine have two systems for recognition, like human beings?",
        JOURNAL = JVCIR,
        VOLUME = "56",
        YEAR = "2018",
        PAGES = "275--286",
        BIBSOURCE = "http://www.visionbib.com/bibliography/match607ic1.html#TT116957"}

% Journal article (bare macro IVC). PAGES is an en-dash range; initials are spaced for name parsing.
@article{bb120840,
        AUTHOR = "Bhagat, P. K. and Choudhary, P.",
        TITLE = "Image annotation: Then and now",
        JOURNAL = IVC,
        VOLUME = "80",
        YEAR = "2018",
        PAGES = "1--23",
        BIBSOURCE = "http://www.visionbib.com/bibliography/match607ic1.html#TT116958"}

% Journal article (bare macro PRL). PAGES is an en-dash range.
@article{bb120841,
        AUTHOR = "Bazrafkan, S. and Javidnia, H. and Corcoran, P.",
        TITLE = "Latent space mapping for generation of object elements with corresponding data annotation",
        JOURNAL = PRL,
        VOLUME = "116",
        YEAR = "2018",
        PAGES = "179--186",
        BIBSOURCE = "http://www.visionbib.com/bibliography/match607ic1.html#TT116959"}

% PAMI article. MONTH uses the feb macro; PAGES is an en-dash range.
@article{bb120842,
        AUTHOR = "Gella, S. and Keller, F. and Lapata, M.",
        TITLE = "Disambiguating Visual Verbs",
        JOURNAL = PAMI,
        VOLUME = "41",
        YEAR = "2019",
        NUMBER = "2",
        MONTH = feb,
        PAGES = "311--322",
        BIBSOURCE = "http://www.visionbib.com/bibliography/match607ic1.html#TT116960"}

% Journal article (bare macro JVCIR). PAGES is an en-dash range; initials are spaced for name parsing.
@article{bb120843,
        AUTHOR = "Xu, N. and Liu, A. A. and Liu, J. and Nie, W. Z. and Su, Y. T.",
        TITLE = "Scene graph captioner: Image captioning based on structural visual representation",
        JOURNAL = JVCIR,
        VOLUME = "58",
        YEAR = "2019",
        PAGES = "477--485",
        BIBSOURCE = "http://www.visionbib.com/bibliography/match607ic1.html#TT116961"}

% Journal article (bare macro PR). PAGES is an en-dash range; initials are spaced for name parsing.
@article{bb120844,
        AUTHOR = "Jiu, M. Y. and Sahbi, H.",
        TITLE = "Deep representation design from deep kernel networks",
        JOURNAL = PR,
        VOLUME = "88",
        YEAR = "2019",
        PAGES = "447--457",
        BIBSOURCE = "http://www.visionbib.com/bibliography/match607ic1.html#TT116962"}

% Journal article (bare macro PRL). PAGES is an en-dash range; initials are spaced for name parsing.
@article{bb120845,
        AUTHOR = "He, X. W. and Shi, B. G. and Bai, X. and Xia, G. S. and Zhang, Z. X. and Dong, W. S.",
        TITLE = "Image Caption Generation with Part of Speech Guidance",
        JOURNAL = PRL,
        VOLUME = "119",
        YEAR = "2019",
        PAGES = "229--237",
        BIBSOURCE = "http://www.visionbib.com/bibliography/match607ic1.html#TT116963"}

% Journal article (bare macro PR). PAGES is an en-dash range; initials are spaced for name parsing.
@article{bb120846,
        AUTHOR = "Xiao, X. Y. and Wang, L. F. and Ding, K. and Xiang, S. M. and Pan, C.",
        TITLE = "Dense semantic embedding network for image captioning",
        JOURNAL = PR,
        VOLUME = "90",
        YEAR = "2019",
        PAGES = "285--296",
        BIBSOURCE = "http://www.visionbib.com/bibliography/match607ic1.html#TT116964"}

% Journal article (bare macro JVCIR). PAGES is an en-dash range; initials are spaced for name parsing.
@article{bb120847,
        AUTHOR = "Foumani, S. N. M. and Nickabadi, A.",
        TITLE = "A probabilistic topic model using deep visual word representation for simultaneous image classification and annotation",
        JOURNAL = JVCIR,
        VOLUME = "59",
        YEAR = "2019",
        PAGES = "195--203",
        BIBSOURCE = "http://www.visionbib.com/bibliography/match607ic1.html#TT116965"}

% Journal article (bare macro RS). Initials are spaced for name parsing.
% NOTE(review): PAGES is still the xx-yy placeholder from the source data; look up the real pages/article number.
@article{bb120848,
        AUTHOR = "Zhang, X. R. and Wang, X. and Tang, X. and Zhou, H. Y. and Li, C.",
        TITLE = "Description Generation for Remote Sensing Images Using Attribute Attention Mechanism",
        JOURNAL = RS,
        VOLUME = "11",
        YEAR = "2019",
        NUMBER = "6",
        PAGES = "xx-yy",
        BIBSOURCE = "http://www.visionbib.com/bibliography/match607ic1.html#TT116966"}

% Journal article (bare macro PRL). PAGES is an en-dash range; initials are spaced for name parsing.
@article{bb120849,
        AUTHOR = "Ding, S. T. and Qu, S. and Xi, Y. L. and Sangaiah, A. K. and Wan, S. H.",
        TITLE = "Image caption generation with high-level image features",
        JOURNAL = PRL,
        VOLUME = "123",
        YEAR = "2019",
        PAGES = "89--95",
        BIBSOURCE = "http://www.visionbib.com/bibliography/match607ic1.html#TT116967"}

% Journal article (bare macro VC). MONTH uses the mar macro; PAGES is an en-dash range.
@article{bb120850,
        AUTHOR = "Liu, X. X. and Xu, Q. Y. and Wang, N.",
        TITLE = "A survey on deep neural network-based image captioning",
        JOURNAL = VC,
        VOLUME = "35",
        YEAR = "2019",
        NUMBER = "3",
        MONTH = mar,
        PAGES = "445--470",
        BIBSOURCE = "http://www.visionbib.com/bibliography/match607ic1.html#TT116968"}

% Journal article (bare macro Surveys). MONTH uses the feb macro; PAGES carries an article number, not a range.
@article{bb120851,
        AUTHOR = "Hossain, M. Z. and Sohel, F. and Shiratuddin, M. F. and Laga, H.",
        TITLE = "A Comprehensive Survey of Deep Learning for Image Captioning",
        JOURNAL = Surveys,
        VOLUME = "51",
        YEAR = "2019",
        NUMBER = "6",
        MONTH = feb,
        PAGES = "Article No 118",
        BIBSOURCE = "http://www.visionbib.com/bibliography/match607ic1.html#TT116969"}

% Journal article (bare macro PR). PAGES is an en-dash range; initials are spaced for name parsing.
@article{bb120852,
        AUTHOR = "Zhang, J. J. and Wu, Q. and Zhang, J. and Shen, C. H. and Lu, J. F. and Wu, Q. A.",
        TITLE = "Heritage image annotation via collective knowledge",
        JOURNAL = PR,
        VOLUME = "93",
        YEAR = "2019",
        PAGES = "204--214",
        BIBSOURCE = "http://www.visionbib.com/bibliography/match607ic1.html#TT116970"}

% Journal article (bare macro PR). PAGES is an en-dash range.
@article{bb120853,
        AUTHOR = "Verma, Y.",
        TITLE = "Diverse image annotation with missing labels",
        JOURNAL = PR,
        VOLUME = "93",
        YEAR = "2019",
        PAGES = "470--484",
        BIBSOURCE = "http://www.visionbib.com/bibliography/match607ic1.html#TT116971"}

% Journal article (bare macro CirSysVideo). MONTH uses the jun macro; PAGES is an en-dash range.
@article{bb120854,
        AUTHOR = "Markatopoulou, F. and Mezaris, V. and Patras, I.",
        TITLE = "Implicit and Explicit Concept Relations in Deep Neural Networks for Multi-Label Video/Image Annotation",
        JOURNAL = CirSysVideo,
        VOLUME = "29",
        YEAR = "2019",
        NUMBER = "6",
        MONTH = jun,
        PAGES = "1631--1644",
        BIBSOURCE = "http://www.visionbib.com/bibliography/match607ic1.html#TT116972"}

% Journal article (bare macro MultMed). MONTH uses the jul macro; initials are spaced for name parsing.
@article{bb120855,
        AUTHOR = "Zhang, Z. J. and Wu, Q. and Wang, Y. and Chen, F.",
        TITLE = "High-Quality Image Captioning With Fine-Grained and Semantic-Guided Visual Attention",
        JOURNAL = MultMed,
        VOLUME = "21",
        YEAR = "2019",
        NUMBER = "7",
        MONTH = jul,
        PAGES = "1681--1693",
        BIBSOURCE = "http://www.visionbib.com/bibliography/match607ic1.html#TT116973"}

% WACV18 paper. PAGES is an en-dash range; initials are spaced for name parsing.
@inproceedings{bb120856,
        AUTHOR = "Zhang, Z. J. and Wu, Q. and Wang, Y. and Chen, F.",
        TITLE = "Fine-Grained and Semantic-Guided Visual Attention for Image Captioning",
        BOOKTITLE = WACV18,
        YEAR = "2018",
        PAGES = "1709--1717",
        BIBSOURCE = "http://www.visionbib.com/bibliography/match607ic1.html#TT116974"}

% Journal article (bare macro SP:IC). PAGES is an en-dash range; initials are spaced for name parsing.
@article{bb120857,
        AUTHOR = "Laib, L. and Allili, M. S. and Ait Aoudia, S.",
        TITLE = "A probabilistic topic model for event-based image classification and multi-label annotation",
        JOURNAL = SP:IC,
        VOLUME = "76",
        YEAR = "2019",
        PAGES = "283--294",
        BIBSOURCE = "http://www.visionbib.com/bibliography/match607ic1.html#TT116975"}

% Journal article (bare macro IET-IPR). MONTH uses the jun macro; PAGES is an en-dash range.
@article{bb120858,
        AUTHOR = "Olaode, A. and Naghdy, G.",
        TITLE = "Review of the application of machine learning to the automatic semantic annotation of images",
        JOURNAL = IET-IPR,
        VOLUME = "13",
        YEAR = "2019",
        NUMBER = "8",
        MONTH = jun,
        PAGES = "1232--1245",
        BIBSOURCE = "http://www.visionbib.com/bibliography/match607ic1.html#TT116976"}

% Journal article (bare macro MultMed). MONTH uses the aug macro; PAGES is an en-dash range.
@article{bb120859,
        AUTHOR = "Li, X. and Jiang, S.",
        TITLE = "Know More Say Less: Image Captioning Based on Scene Graphs",
        JOURNAL = MultMed,
        VOLUME = "21",
        YEAR = "2019",
        NUMBER = "8",
        MONTH = aug,
        PAGES = "2117--2130",
        BIBSOURCE = "http://www.visionbib.com/bibliography/match607ic1.html#TT116977"}

% Journal article (bare macro Cyber). MONTH uses the nov macro; initials are spaced for name parsing.
@article{bb120860,
        AUTHOR = "Zhang, C. J. and Cheng, J. and Tian, Q.",
        TITLE = "Multiview, Few-Labeled Object Categorization by Predicting Labels With View Consistency",
        JOURNAL = Cyber,
        VOLUME = "49",
        YEAR = "2019",
        NUMBER = "11",
        MONTH = nov,
        PAGES = "3834--3843",
        BIBSOURCE = "http://www.visionbib.com/bibliography/match607ic1.html#TT116978"}

% IJCV article. The metric name LCEval is brace-protected; MONTH uses the oct macro.
@article{bb120861,
        AUTHOR = "Sharif, N. and White, L. and Bennamoun, M. and Liu, W. and Shah, S. A. A.",
        TITLE = "{LCEval}: Learned Composite Metric for Caption Evaluation",
        JOURNAL = IJCV,
        VOLUME = "127",
        YEAR = "2019",
        NUMBER = "10",
        MONTH = oct,
        PAGES = "1586--1610",
        BIBSOURCE = "http://www.visionbib.com/bibliography/match607ic1.html#TT116979"}

% Journal article (bare macro RS). The acronym LAM is brace-protected; initials are spaced for name parsing.
% NOTE(review): PAGES is still the xx-yy placeholder from the source data; look up the real pages/article number.
@article{bb120862,
        AUTHOR = "Zhang, Z. Y. and Diao, W. H. and Zhang, W. K. and Yan, M. L. and Gao, X. and Sun, X.",
        TITLE = "{LAM}: Remote Sensing Image Captioning with Label-Attention Mechanism",
        JOURNAL = RS,
        VOLUME = "11",
        YEAR = "2019",
        NUMBER = "20",
        PAGES = "xx-yy",
        BIBSOURCE = "http://www.visionbib.com/bibliography/match607ic1.html#TT116980"}

% Journal article (bare macro RS). Initials are spaced for name parsing.
% NOTE(review): PAGES is still the xx-yy placeholder from the source data; look up the real pages/article number.
@article{bb120863,
        AUTHOR = "Fu, K. and Li, Y. and Zhang, W. K. and Yu, H. F. and Sun, X.",
        TITLE = "Boosting Memory with a Persistent Memory Mechanism for Remote Sensing Image Captioning",
        JOURNAL = RS,
        VOLUME = "12",
        YEAR = "2020",
        NUMBER = "11",
        PAGES = "xx-yy",
        BIBSOURCE = "http://www.visionbib.com/bibliography/match607ic1.html#TT116981"}

% Journal article (bare macro MultMed). The acronym COMIC is brace-protected; MONTH uses the oct macro.
@article{bb120864,
        AUTHOR = "Tan, J. H. and Chan, C. S. and Chuah, J. H.",
        TITLE = "{COMIC}: Toward A Compact Image Captioning Model With Attention",
        JOURNAL = MultMed,
        VOLUME = "21",
        YEAR = "2019",
        NUMBER = "10",
        MONTH = oct,
        PAGES = "2686--2696",
        BIBSOURCE = "http://www.visionbib.com/bibliography/match607ic1.html#TT116982"}

% Journal article (bare macro IP). The method name is brace-protected; PAGES is an en-dash range.
@article{bb120865,
        AUTHOR = "Zhou, L. and Zhang, Y. and Jiang, Y. and Zhang, T. and Fan, W.",
        TITLE = "{Re-Caption}: Saliency-Enhanced Image Captioning Through Two-Phase Learning",
        JOURNAL = IP,
        VOLUME = "29",
        YEAR = "2020",
        NUMBER = "1",
        PAGES = "694--709",
        BIBSOURCE = "http://www.visionbib.com/bibliography/match607ic1.html#TT116983"}

% Journal article (bare macro CVIU). PAGES is a single identifier, not a range; initials are spaced for name parsing.
@article{bb120866,
        AUTHOR = "Yang, L. and Hu, H. F.",
        TITLE = "Visual Skeleton and Reparative Attention for Part-of-Speech image captioning system",
        JOURNAL = CVIU,
        VOLUME = "189",
        YEAR = "2019",
        PAGES = "102819",
        BIBSOURCE = "http://www.visionbib.com/bibliography/match607ic1.html#TT116984"}

% Journal article (bare macro PR). PAGES is a single identifier, not a range; initials are spaced for name parsing.
@article{bb120867,
        AUTHOR = "Wang, J. B. and Wang, W. and Wang, L. and Wang, Z. Y. and Feng, D. D. and Tan, T. N.",
        TITLE = "Learning Visual Relationship and Context-Aware Attention for Image Captioning",
        JOURNAL = PR,
        VOLUME = "98",
        YEAR = "2020",
        PAGES = "107075",
        BIBSOURCE = "http://www.visionbib.com/bibliography/match607ic1.html#TT116985"}

% Journal article (bare macro MultMed). MONTH uses the nov macro; PAGES is an en-dash range.
@article{bb120868,
        AUTHOR = "Xiao, X. and Wang, L. and Ding, K. and Xiang, S. and Pan, C.",
        TITLE = "Deep Hierarchical Encoder-Decoder Network for Image Captioning",
        JOURNAL = MultMed,
        VOLUME = "21",
        YEAR = "2019",
        NUMBER = "11",
        MONTH = nov,
        PAGES = "2942--2956",
        BIBSOURCE = "http://www.visionbib.com/bibliography/match607ic1.html#TT116986"}

% Journal article (bare macro VC). MONTH uses the nov macro; PAGES is an en-dash range.
% NOTE(review): YEAR changed from 2018 to 2019 so volume 35 agrees with bb120850 (VC 35, 2019) -- confirm.
@article{bb120869,
        AUTHOR = "Jiang, T. and Zhang, Z. and Yang, Y.",
        TITLE = "Modeling coverage with semantic embedding for image caption generation",
        JOURNAL = VC,
        VOLUME = "35",
        YEAR = "2019",
        NUMBER = "11",
        MONTH = nov,
        PAGES = "1655--1665",
        BIBSOURCE = "http://www.visionbib.com/bibliography/match607ic1.html#TT116987"}

% Journal article (bare macro MultMed). MONTH uses the nov macro; PAGES is an en-dash range.
@article{bb120870,
        AUTHOR = "Tang, C. and Liu, X. and Wang, P. and Zhang, C. and Li, M. and Wang, L.",
        TITLE = "Adaptive Hypergraph Embedded Semi-Supervised Multi-Label Image Annotation",
        JOURNAL = MultMed,
        VOLUME = "21",
        YEAR = "2019",
        NUMBER = "11",
        MONTH = nov,
        PAGES = "2837--2849",
        BIBSOURCE = "http://www.visionbib.com/bibliography/match607ic1.html#TT116988"}

% Journal article (bare macro PRL). PAGES is an en-dash range; initials are spaced for name parsing.
@article{bb120871,
        AUTHOR = "Mundnich, K. and Booth, B. M. and Girault, B. and Narayanan, S.",
        TITLE = "Generating labels for regression of subjective constructs using triplet embeddings",
        JOURNAL = PRL,
        VOLUME = "128",
        YEAR = "2019",
        PAGES = "385--392",
        BIBSOURCE = "http://www.visionbib.com/bibliography/match607ic1.html#TT116989"}

% Journal article (bare macro GeoRS). MONTH uses the mar macro; PAGES is an en-dash range.
@article{bb120872,
        AUTHOR = "Lu, X. and Wang, B. and Zheng, X.",
        TITLE = "Sound Active Attention Framework for Remote Sensing Image Captioning",
        JOURNAL = GeoRS,
        VOLUME = "58",
        YEAR = "2020",
        NUMBER = "3",
        MONTH = mar,
        PAGES = "1985--2000",
        BIBSOURCE = "http://www.visionbib.com/bibliography/match607ic1.html#TT116990"}

% Journal article (bare macro RS). Initials are spaced for name parsing.
% NOTE(review): PAGES is still the xx-yy placeholder from the source data; look up the real pages/article number.
@article{bb120873,
        AUTHOR = "Li, Y. Y. and Fang, S. K. and Jiao, L. C. and Liu, R. J. and Shang, R. H.",
        TITLE = "A Multi-Level Attention Model for Remote Sensing Image Captions",
        JOURNAL = RS,
        VOLUME = "12",
        YEAR = "2020",
        NUMBER = "6",
        PAGES = "xx-yy",
        BIBSOURCE = "http://www.visionbib.com/bibliography/match607ic1.html#TT116991"}

% Journal article (bare macro MultMed). MONTH uses the apr macro; initials are spaced for name parsing.
@article{bb120874,
        AUTHOR = "Chaudhary, C. and Goyal, P. and Prasad, D. N. and Chen, Y. P.",
        TITLE = "Enhancing the Quality of Image Tagging Using a Visio-Textual Knowledge Base",
        JOURNAL = MultMed,
        VOLUME = "22",
        YEAR = "2020",
        NUMBER = "4",
        MONTH = apr,
        PAGES = "897--911",
        BIBSOURCE = "http://www.visionbib.com/bibliography/match607ic1.html#TT116992"}

% Journal article (bare macro PRL). PAGES is an en-dash range; initials are spaced for name parsing.
@article{bb120875,
        AUTHOR = "Chen, X. H. and Zhang, M. X. and Wang, Z. and Zuo, L. and Li, B. and Yang, Y.",
        TITLE = "Leveraging unpaired out-of-domain data for image captioning",
        JOURNAL = PRL,
        VOLUME = "132",
        YEAR = "2020",
        PAGES = "132--140",
        BIBSOURCE = "http://www.visionbib.com/bibliography/match607ic1.html#TT116993"}

% Journal article (bare macro MultMed). MONTH uses the may macro; PAGES is an en-dash range.
@article{bb120876,
        AUTHOR = "Xu, N. and Zhang, H. and Liu, A. and Nie, W. and Su, Y. and Nie, J. and Zhang, Y.",
        TITLE = "Multi-Level Policy and Reward-Based Deep Reinforcement Learning Framework for Image Captioning",
        JOURNAL = MultMed,
        VOLUME = "22",
        YEAR = "2020",
        NUMBER = "5",
        MONTH = may,
        PAGES = "1372--1383",
        BIBSOURCE = "http://www.visionbib.com/bibliography/match607ic1.html#TT116994"}

% Journal article (bare macro MultMed). MONTH uses the aug macro; PAGES is an en-dash range.
@article{bb120877,
        AUTHOR = "Guo, L. and Liu, J. and Lu, S. and Lu, H.",
        TITLE = "Show, Tell, and Polish: Ruminant Decoding for Image Captioning",
        JOURNAL = MultMed,
        VOLUME = "22",
        YEAR = "2020",
        NUMBER = "8",
        MONTH = aug,
        PAGES = "2149--2162",
        BIBSOURCE = "http://www.visionbib.com/bibliography/match607ic1.html#TT116995"}

% Journal article (bare macro IET-CV). MONTH uses the aug macro; initials are spaced for name parsing.
@article{bb120878,
        AUTHOR = "Khatchatoorian, A. G. and Jamzad, M.",
        TITLE = "Architecture to improve the accuracy of automatic image annotation systems",
        JOURNAL = IET-CV,
        VOLUME = "14",
        YEAR = "2020",
        NUMBER = "5",
        MONTH = aug,
        PAGES = "214--223",
        BIBSOURCE = "http://www.visionbib.com/bibliography/match607ic1.html#TT116996"}

% Journal article (bare macro MultInfoRetr). MONTH uses the sep macro; PAGES is an en-dash range.
@article{bb120879,
        AUTHOR = "Theodosiou, Z. and Tsapatsoulis, N.",
        TITLE = "Image annotation: the effects of content, lexicon and annotation method",
        JOURNAL = MultInfoRetr,
        VOLUME = "9",
        YEAR = "2020",
        NUMBER = "3",
        MONTH = sep,
        PAGES = "191--203",
        BIBSOURCE = "http://www.visionbib.com/bibliography/match607ic1.html#TT116997"}

% Journal article (bare macro CirSysVideo). MONTH uses the oct macro; PAGES is an en-dash range.
@article{bb120880,
        AUTHOR = "Feng, Q. and Wu, Y. and Fan, H. and Yan, C. and Xu, M. and Yang, Y.",
        TITLE = "Cascaded Revision Network for Novel Object Captioning",
        JOURNAL = CirSysVideo,
        VOLUME = "30",
        YEAR = "2020",
        NUMBER = "10",
        MONTH = oct,
        PAGES = "3413--3421",
        BIBSOURCE = "http://www.visionbib.com/bibliography/match607ic1.html#TT116998"}

% Journal article (bare macro CVIU). PAGES is a single identifier, not a range; initials are spaced for name parsing.
@article{bb120881,
        AUTHOR = "Wei, H. Y. and Li, Z. X. and Zhang, C. L. and Ma, H. F.",
        TITLE = "The synergy of double attention: Combine sentence-level and word-level attention for image captioning",
        JOURNAL = CVIU,
        VOLUME = "201",
        YEAR = "2020",
        PAGES = "103068",
        BIBSOURCE = "http://www.visionbib.com/bibliography/match607ic1.html#TT116999"}

% Journal article (bare macro IET-IPR). MONTH uses the nov macro; initials are spaced for name parsing.
@article{bb120882,
        AUTHOR = "Shilpa, M. and He, J. and Zhao, Y. J. and Sun, B. and Yu, L. J.",
        TITLE = "Feedback evaluations to promote image captioning",
        JOURNAL = IET-IPR,
        VOLUME = "14",
        YEAR = "2020",
        NUMBER = "13",
        MONTH = nov,
        PAGES = "3021--3027",
        BIBSOURCE = "http://www.visionbib.com/bibliography/match607ic1.html#TT117000"}

% Journal article (bare macro IP). PAGES is an en-dash range.
@article{bb120883,
        AUTHOR = "Liu, H. and Zhang, S. and Lin, K. and Wen, J. and Li, J. and Hu, X.",
        TITLE = "Vocabulary-Wide Credit Assignment for Training Image Captioning Models",
        JOURNAL = IP,
        VOLUME = "30",
        YEAR = "2021",
        PAGES = "2450--2460",
        BIBSOURCE = "http://www.visionbib.com/bibliography/match607ic1.html#TT117001"}

@article{bb120884,
        AUTHOR = "Xu, N. and Tian, H. S. and Wang, Y. H. and Nie, W. Z. and Song, D. and Liu, A. A. and Liu, W.",
        TITLE = "Coupled-dynamic learning for vision and language:
Exploring Interaction between different tasks",
        JOURNAL = PR,
        VOLUME = "113",
        YEAR = "2021",
        PAGES = "107829",
        BIBSOURCE = "http://www.visionbib.com/bibliography/match607ic1.html#TT117002"}

@article{bb120885,
        AUTHOR = "Yang, L. and Wang, H. and Tang, P. and Li, Q.",
        TITLE = "{CaptionNet}: A Tailor-made Recurrent Neural Network for Generating
Image Descriptions",
        JOURNAL = MultMed,
        VOLUME = "23",
        YEAR = "2021",
        PAGES = "835--845",
        BIBSOURCE = "http://www.visionbib.com/bibliography/match607ic1.html#TT117003"}

@article{bb120886,
        AUTHOR = "Liu, A. A. and Wang, Y. H. and Xu, N. and Liu, S. and Li, X.",
        TITLE = "Scene-Graph-Guided message passing network for dense captioning",
        JOURNAL = PRL,
        VOLUME = "145",
        YEAR = "2021",
        PAGES = "187--193",
        BIBSOURCE = "http://www.visionbib.com/bibliography/match607ic1.html#TT117004"}

@article{bb120887,
        AUTHOR = "Zhang, L. and Zhang, Y. S. and Zhao, X. and Zou, Z. X.",
        TITLE = "Image captioning via proximal policy optimization",
        JOURNAL = IVC,
        VOLUME = "108",
        YEAR = "2021",
        PAGES = "104126",
        BIBSOURCE = "http://www.visionbib.com/bibliography/match607ic1.html#TT117005"}

@article{bb120888,
        AUTHOR = "Ji, J. Z. and Du, Z. R. and Zhang, X. D.",
        TITLE = "Divergent-convergent attention for image captioning",
        JOURNAL = PR,
        VOLUME = "115",
        YEAR = "2021",
        PAGES = "107928",
        BIBSOURCE = "http://www.visionbib.com/bibliography/match607ic1.html#TT117006"}

@article{bb120889,
        AUTHOR = "Wei, Y. W. and Wu, C. L. and Jia, Z. Y. and Hu, X. and Guo, S. and Shi, H. T.",
        TITLE = "Past is important: Improved image captioning by looking back in time",
        JOURNAL = SP:IC,
        VOLUME = "94",
        YEAR = "2021",
        PAGES = "116183",
        BIBSOURCE = "http://www.visionbib.com/bibliography/match607ic1.html#TT117007"}

@article{bb120890,
        AUTHOR = "Zhang, Z. J. and Wu, Q. and Wang, Y. and Chen, F.",
        TITLE = "Exploring region relationships implicitly:
Image captioning with visual relationship attention",
        JOURNAL = IVC,
        VOLUME = "109",
        YEAR = "2021",
        PAGES = "104146",
        BIBSOURCE = "http://www.visionbib.com/bibliography/match607ic1.html#TT117008"}

@article{bb120891,
        AUTHOR = "Zhang, Z. J. and Wu, Q. and Wang, Y. and Chen, F.",
        TITLE = "Exploring Pairwise Relationships Adaptively From Linguistic Context
in Image Captioning",
        JOURNAL = MultMed,
        VOLUME = "24",
        YEAR = "2022",
        PAGES = "3101--3113",
        BIBSOURCE = "http://www.visionbib.com/bibliography/match607ic1.html#TT117009"}

@article{bb120892,
        AUTHOR = "Li, X. L. and Zhang, X. T. and Huang, W. and Wang, Q.",
        TITLE = "Truncation Cross Entropy Loss for Remote Sensing Image Captioning",
        JOURNAL = GeoRS,
        VOLUME = "59",
        YEAR = "2021",
        NUMBER = "6",
        MONTH = jun,
        PAGES = "5246--5257",
        BIBSOURCE = "http://www.visionbib.com/bibliography/match607ic1.html#TT117010"}

@article{bb120893,
        AUTHOR = "Zhong, X. and Nie, G. Z. and Huang, W. X. and Liu, W. X. and Ma, B. and Lin, C. W.",
        TITLE = "Attention-guided image captioning with adaptive global and local
feature fusion",
        JOURNAL = JVCIR,
        VOLUME = "78",
        YEAR = "2021",
        PAGES = "103138",
        BIBSOURCE = "http://www.visionbib.com/bibliography/match607ic1.html#TT117011"}

@article{bb120894,
        AUTHOR = "Sumbul, G. and Nayak, S. and Demir, B.",
        TITLE = "{SD-RSIC}: Summarization-Driven Deep Remote Sensing Image Captioning",
        JOURNAL = GeoRS,
        VOLUME = "59",
        YEAR = "2021",
        NUMBER = "8",
        MONTH = aug,
        PAGES = "6922--6934",
        BIBSOURCE = "http://www.visionbib.com/bibliography/match607ic1.html#TT117012"}

@article{bb120895,
        AUTHOR = "Wu, J. and Chen, T. S. and Wu, H. F. and Yang, Z. and Luo, G. C. and Lin, L.",
        TITLE = "Fine-Grained Image Captioning With Global-Local Discriminative
Objective",
        JOURNAL = MultMed,
        VOLUME = "23",
        YEAR = "2021",
        PAGES = "2413--2427",
        BIBSOURCE = "http://www.visionbib.com/bibliography/match607ic1.html#TT117013"}

@article{bb120896,
        AUTHOR = "Wu, L. X. and Xu, M. and Sang, L. and Yao, T. and Mei, T.",
        TITLE = "Noise Augmented Double-Stream Graph Convolutional Networks for Image
Captioning",
        JOURNAL = CirSysVideo,
        VOLUME = "31",
        YEAR = "2021",
        NUMBER = "8",
        MONTH = aug,
        PAGES = "3118--3127",
        BIBSOURCE = "http://www.visionbib.com/bibliography/match607ic1.html#TT117014"}

@article{bb120897,
        AUTHOR = "Nivedita, M. and Chandrashekar, P. and Mahapatra, S. and Phamila, Y. A. V. and Selvaperumal, S. K.",
        TITLE = "Image Captioning for Video Surveillance System using Neural Networks",
        JOURNAL = IJIG,
        VOLUME = "21",
        YEAR = "2021",
        NUMBER = "4",
        MONTH = oct,
        PAGES = "2150044",
        BIBSOURCE = "http://www.visionbib.com/bibliography/match607ic1.html#TT117015"}

@article{bb120898,
        AUTHOR = "Haghighi, F. and Taher, M. R. H. and Zhou, Z. W. and Gotway, M. B. and Liang, J. M.",
        TITLE = "Transferable Visual Words: Exploiting the Semantics of Anatomical
Patterns for Self-Supervised Learning",
        JOURNAL = MedImg,
        VOLUME = "40",
        YEAR = "2021",
        NUMBER = "10",
        MONTH = oct,
        PAGES = "2857--2868",
        BIBSOURCE = "http://www.visionbib.com/bibliography/match607ic1.html#TT117016"}

@article{bb120899,
        AUTHOR = "Wang, Q. and Huang, W. and Zhang, X. T. and Li, X. L.",
        TITLE = "Word-Sentence Framework for Remote Sensing Image Captioning",
        JOURNAL = GeoRS,
        VOLUME = "59",
        YEAR = "2021",
        NUMBER = "12",
        MONTH = dec,
        PAGES = "10532--10543",
        BIBSOURCE = "http://www.visionbib.com/bibliography/match607ic1.html#TT117017"}

Last update: Feb 29, 2024 at 09:13:14