% Entries bb114600-bb114699, laid out one field per line.
% JOURNAL / BOOKTITLE values are bare macro names (IP, PAMI, CVPR10, ...); no
% @string definitions appear in this span, so they are presumably defined
% elsewhere -- verify before compiling this span on its own.
% PAGES = "xx-yy" looks like a "pages unknown" placeholder in the source data;
% it is kept verbatim -- TODO replace with real page/article numbers.
% bb114616 and bb114617 share the same BIBSOURCE anchor in the source data.
% bb114659: YEAR is 2019 so that it agrees with bb114639 (same journal macro
% VC, same VOLUME 35, issue 3 dated March 2019).

@inproceedings{bb114600,
  AUTHOR = "Nakayama, H. and Harada, T. and Kuniyoshi, Y.",
  TITLE = "Global Gaussian approach for scene categorization using information geometry",
  BOOKTITLE = CVPR10,
  YEAR = "2010",
  PAGES = "2336--2343",
  BIBSOURCE = "http://www.visionbib.com/bibliography/match607ic1.html#TT110826"
}

@inproceedings{bb114601,
  AUTHOR = "Nakayama, H. and Harada, T. and Kuniyoshi, Y.",
  TITLE = "AI Goggles: Real-time Description and Retrieval in the Real World with Online Learning",
  BOOKTITLE = CRV09,
  YEAR = "2009",
  PAGES = "184--191",
  BIBSOURCE = "http://www.visionbib.com/bibliography/match607ic1.html#TT110827"
}

@inproceedings{bb114602,
  AUTHOR = "Ushiku, Y. and Yamaguchi, M. and Mukuta, Y. and Harada, T.",
  TITLE = "Common Subspace for Model and Similarity: Phrase Learning for Caption Generation from Images",
  BOOKTITLE = ICCV15,
  YEAR = "2015",
  PAGES = "2668--2676",
  BIBSOURCE = "http://www.visionbib.com/bibliography/match607ic1.html#TT110828"
}

@inproceedings{bb114603,
  AUTHOR = "Jin, J. and Nakayama, H.",
  TITLE = "Annotation order matters: Recurrent Image Annotator for arbitrary length image tagging",
  BOOKTITLE = ICPR16,
  YEAR = "2016",
  PAGES = "2452--2457",
  BIBSOURCE = "http://www.visionbib.com/bibliography/match607ic1.html#TT110829"
}

@inproceedings{bb114604,
  AUTHOR = "Harada, T. and Nakayama, H. and Kuniyoshi, Y.",
  TITLE = "Improving Local Descriptors by Embedding Global and Local Spatial Information",
  BOOKTITLE = ECCV10,
  YEAR = "2010",
  PAGES = "IV: 736--749",
  BIBSOURCE = "http://www.visionbib.com/bibliography/match607ic1.html#TT110830"
}

@inproceedings{bb114605,
  AUTHOR = "Nakayama, H. and Harada, T. and Kuniyoshi, Y.",
  TITLE = "Evaluation of dimensionality reduction methods for image auto-annotation",
  BOOKTITLE = BMVC10,
  YEAR = "2010",
  PAGES = "xx-yy",
  BIBSOURCE = "http://www.visionbib.com/bibliography/match607ic1.html#TT110831"
}

@article{bb114606,
  AUTHOR = "Tariq, A. and Foroosh, H.",
  TITLE = "A Context-Driven Extractive Framework for Generating Realistic Image Descriptions",
  JOURNAL = IP,
  VOLUME = "26",
  YEAR = "2017",
  NUMBER = "2",
  MONTH = "February",
  PAGES = "619--632",
  BIBSOURCE = "http://www.visionbib.com/bibliography/match607ic1.html#TT110832"
}

@article{bb114607,
  AUTHOR = "Vinyals, O. and Toshev, A. and Bengio, S. and Erhan, D.",
  TITLE = "Show and Tell: Lessons Learned from the 2015 MSCOCO Image Captioning Challenge",
  JOURNAL = PAMI,
  VOLUME = "39",
  YEAR = "2017",
  NUMBER = "4",
  MONTH = "April",
  PAGES = "652--663",
  BIBSOURCE = "http://www.visionbib.com/bibliography/match607ic1.html#TT110833"
}

@inproceedings{bb114608,
  AUTHOR = "Vinyals, O. and Toshev, A. and Bengio, S. and Erhan, D.",
  TITLE = "Show and tell: A neural image caption generator",
  BOOKTITLE = CVPR15,
  YEAR = "2015",
  PAGES = "3156--3164",
  BIBSOURCE = "http://www.visionbib.com/bibliography/match607ic1.html#TT110834"
}

@article{bb114609,
  AUTHOR = "Gao, L.L. and Guo, Z. and Zhang, H.W. and Xu, X. and Shen, H.T.",
  TITLE = "Video Captioning With Attention-Based LSTM and Semantic Consistency",
  JOURNAL = MultMed,
  VOLUME = "19",
  YEAR = "2017",
  NUMBER = "9",
  MONTH = "September",
  PAGES = "2045--2055",
  BIBSOURCE = "http://www.visionbib.com/bibliography/match607ic1.html#TT110835"
}

@article{bb114610,
  AUTHOR = "Hu, M. and Yang, Y. and Shen, F. and Zhang, L. and Shen, H.T. and Li, X.",
  TITLE = "Robust Web Image Annotation via Exploring Multi-Facet and Structural Knowledge",
  JOURNAL = IP,
  VOLUME = "26",
  YEAR = "2017",
  NUMBER = "10",
  MONTH = "October",
  PAGES = "4871--4884",
  BIBSOURCE = "http://www.visionbib.com/bibliography/match607ic1.html#TT110836"
}

@article{bb114611,
  AUTHOR = "Bin, Y. and Yang, Y. and Shen, F. and Xie, N. and Shen, H.T. and Li, X.",
  TITLE = "Describing Video With Attention-Based Bidirectional LSTM",
  JOURNAL = Cyber,
  VOLUME = "49",
  YEAR = "2019",
  NUMBER = "7",
  MONTH = "July",
  PAGES = "2631--2641",
  BIBSOURCE = "http://www.visionbib.com/bibliography/match607ic1.html#TT110837"
}

@article{bb114612,
  AUTHOR = "Wang, J.Y. and Zhu, X.T. and Gong, S.G.",
  TITLE = "Discovering visual concept structure with sparse and incomplete tags",
  JOURNAL = AI,
  VOLUME = "250",
  YEAR = "2017",
  NUMBER = "1",
  PAGES = "16--36",
  BIBSOURCE = "http://www.visionbib.com/bibliography/match607ic1.html#TT110838"
}

@article{bb114613,
  AUTHOR = "Kilickaya, M. and Akkus, B.K. and Cakici, R. and Erdem, A. and Erdem, E. and Ikizler Cinbis, N.",
  TITLE = "Data-driven image captioning via salient region discovery",
  JOURNAL = IET-CV,
  VOLUME = "11",
  YEAR = "2017",
  NUMBER = "6",
  MONTH = "September",
  PAGES = "398--406",
  BIBSOURCE = "http://www.visionbib.com/bibliography/match607ic1.html#TT110839"
}

@article{bb114614,
  AUTHOR = "Fu, K. and Jin, J.Q. and Cui, R.P. and Sha, F. and Zhang, C.S.",
  TITLE = "Aligning Where to See and What to Tell: Image Captioning with Region-Based Attention and Scene-Specific Contexts",
  JOURNAL = PAMI,
  VOLUME = "39",
  YEAR = "2017",
  NUMBER = "12",
  MONTH = "December",
  PAGES = "2321--2334",
  BIBSOURCE = "http://www.visionbib.com/bibliography/match607ic1.html#TT110840"
}

@article{bb114615,
  AUTHOR = "Nian, F.D. and Li, T. and Wang, Y. and Wu, X.Y. and Ni, B.B. and Xu, C.S.",
  TITLE = "Learning explicit video attributes from mid-level representation for video captioning",
  JOURNAL = CVIU,
  VOLUME = "163",
  YEAR = "2017",
  NUMBER = "1",
  PAGES = "126--138",
  BIBSOURCE = "http://www.visionbib.com/bibliography/match607ic1.html#TT110841"
}

@article{bb114616,
  AUTHOR = "He, X.D. and Deng, L.",
  TITLE = "Deep Learning for Image-to-Text Generation: A Technical Overview",
  JOURNAL = SPMag,
  VOLUME = "34",
  YEAR = "2017",
  NUMBER = "6",
  MONTH = "November",
  PAGES = "109--116",
  BIBSOURCE = "http://www.visionbib.com/bibliography/match607ic1.html#TT110842"
}

@article{bb114617,
  AUTHOR = "Deng, L. and He, X.D.",
  TITLE = "Deep Learning for Image-to-Text Generation: A Technical Overview",
  JOURNAL = SPMag,
  VOLUME = "35",
  YEAR = "2018",
  NUMBER = "1",
  MONTH = "January",
  PAGES = "178",
  BIBSOURCE = "http://www.visionbib.com/bibliography/match607ic1.html#TT110842"
}

@article{bb114618,
  AUTHOR = "Li, L.H. and Tang, S. and Zhang, Y.D. and Deng, L.X. and Tian, Q.",
  TITLE = "GLA: Global-Local Attention for Image Description",
  JOURNAL = MultMed,
  VOLUME = "20",
  YEAR = "2018",
  NUMBER = "3",
  MONTH = "March",
  PAGES = "726--737",
  BIBSOURCE = "http://www.visionbib.com/bibliography/match607ic1.html#TT110843"
}

@article{bb114619,
  AUTHOR = "Lu, X. and Wang, B. and Zheng, X. and Li, X.",
  TITLE = "Exploring Models and Data for Remote Sensing Image Caption Generation",
  JOURNAL = GeoRS,
  VOLUME = "56",
  YEAR = "2018",
  NUMBER = "4",
  MONTH = "April",
  PAGES = "2183--2195",
  BIBSOURCE = "http://www.visionbib.com/bibliography/match607ic1.html#TT110844"
}

@article{bb114620,
  AUTHOR = "Cheng, Q. and Zhang, Q. and Fu, P. and Tu, C.H. and Li, S.",
  TITLE = "A survey and analysis on automatic image annotation",
  JOURNAL = PR,
  VOLUME = "79",
  YEAR = "2018",
  PAGES = "242--259",
  BIBSOURCE = "http://www.visionbib.com/bibliography/match607ic1.html#TT110845"
}

@article{bb114621,
  AUTHOR = "Ben Rejeb, I. and Ouni, S. and Barhoumi, W. and Zagrouba, E.",
  TITLE = "Fuzzy VA-Files for multi-label image annotation based on visual content of regions",
  JOURNAL = SIViP,
  VOLUME = "12",
  YEAR = "2018",
  NUMBER = "5",
  MONTH = "July",
  PAGES = "877--884",
  BIBSOURCE = "http://www.visionbib.com/bibliography/match607ic1.html#TT110846"
}

@article{bb114622,
  AUTHOR = "Helmy, T.",
  TITLE = "A Generic Framework for Semantic Annotation of Images",
  JOURNAL = IJIG,
  VOLUME = "18",
  YEAR = "2018",
  NUMBER = "3",
  MONTH = "July",
  PAGES = "Article 1850013",
  BIBSOURCE = "http://www.visionbib.com/bibliography/match607ic1.html#TT110847"
}

@article{bb114623,
  AUTHOR = "Wu, C.L. and Wei, Y. and Chu, X.L. and Su, F. and Wang, L.",
  TITLE = "Modeling visual and word-conditional semantic attention for image captioning",
  JOURNAL = SP:IC,
  VOLUME = "67",
  YEAR = "2018",
  PAGES = "100--107",
  BIBSOURCE = "http://www.visionbib.com/bibliography/match607ic1.html#TT110848"
}

@article{bb114624,
  AUTHOR = "Ye, S. and Han, J. and Liu, N.",
  TITLE = "Attentive Linear Transformation for Image Captioning",
  JOURNAL = IP,
  VOLUME = "27",
  YEAR = "2018",
  NUMBER = "11",
  MONTH = "November",
  PAGES = "5514--5524",
  BIBSOURCE = "http://www.visionbib.com/bibliography/match607ic1.html#TT110849"
}

@article{bb114625,
  AUTHOR = "Zhang, M. and Yang, Y. and Zhang, H. and Ji, Y. and Shen, H.T. and Chua, T.",
  TITLE = "More is Better: Precise and Detailed Image Captioning Using Online Positive Recall and Missing Concepts Mining",
  JOURNAL = IP,
  VOLUME = "28",
  YEAR = "2019",
  NUMBER = "1",
  MONTH = "January",
  PAGES = "32--44",
  BIBSOURCE = "http://www.visionbib.com/bibliography/match607ic1.html#TT110850"
}

@article{bb114626,
  AUTHOR = "Hu, J. and Lam, K.M. and Lou, P. and Liu, Q. and Deng, W.P.",
  TITLE = "Can a machine have two systems for recognition, like human beings?",
  JOURNAL = JVCIR,
  VOLUME = "56",
  YEAR = "2018",
  PAGES = "275--286",
  BIBSOURCE = "http://www.visionbib.com/bibliography/match607ic1.html#TT110851"
}

@article{bb114627,
  AUTHOR = "Bhagat, P.K. and Choudhary, P.",
  TITLE = "Image annotation: Then and now",
  JOURNAL = IVC,
  VOLUME = "80",
  YEAR = "2018",
  PAGES = "1--23",
  BIBSOURCE = "http://www.visionbib.com/bibliography/match607ic1.html#TT110852"
}

@article{bb114628,
  AUTHOR = "Gil Gonzalez, J. and Alvarez Meza, A. and Orozco Gutierrez, A.",
  TITLE = "Learning from multiple annotators using kernel alignment",
  JOURNAL = PRL,
  VOLUME = "116",
  YEAR = "2018",
  PAGES = "150--156",
  BIBSOURCE = "http://www.visionbib.com/bibliography/match607ic1.html#TT110853"
}

@article{bb114629,
  AUTHOR = "Bazrafkan, S. and Javidnia, H. and Corcoran, P.",
  TITLE = "Latent space mapping for generation of object elements with corresponding data annotation",
  JOURNAL = PRL,
  VOLUME = "116",
  YEAR = "2018",
  PAGES = "179--186",
  BIBSOURCE = "http://www.visionbib.com/bibliography/match607ic1.html#TT110854"
}

@article{bb114630,
  AUTHOR = "Gella, S. and Keller, F. and Lapata, M.",
  TITLE = "Disambiguating Visual Verbs",
  JOURNAL = PAMI,
  VOLUME = "41",
  YEAR = "2019",
  NUMBER = "2",
  MONTH = "February",
  PAGES = "311--322",
  BIBSOURCE = "http://www.visionbib.com/bibliography/match607ic1.html#TT110855"
}

@article{bb114631,
  AUTHOR = "Xu, N. and Liu, A.A. and Liu, J. and Nie, W.Z. and Su, Y.T.",
  TITLE = "Scene graph captioner: Image captioning based on structural visual representation",
  JOURNAL = JVCIR,
  VOLUME = "58",
  YEAR = "2019",
  PAGES = "477--485",
  BIBSOURCE = "http://www.visionbib.com/bibliography/match607ic1.html#TT110856"
}

@article{bb114632,
  AUTHOR = "Jiu, M.Y. and Sahbi, H.",
  TITLE = "Deep representation design from deep kernel networks",
  JOURNAL = PR,
  VOLUME = "88",
  YEAR = "2019",
  PAGES = "447--457",
  BIBSOURCE = "http://www.visionbib.com/bibliography/match607ic1.html#TT110857"
}

@article{bb114633,
  AUTHOR = "He, X.W. and Shi, B.G. and Bai, X. and Xia, G.S. and Zhang, Z.X. and Dong, W.S.",
  TITLE = "Image Caption Generation with Part of Speech Guidance",
  JOURNAL = PRL,
  VOLUME = "119",
  YEAR = "2019",
  PAGES = "229--237",
  BIBSOURCE = "http://www.visionbib.com/bibliography/match607ic1.html#TT110858"
}

@article{bb114634,
  AUTHOR = "Xiao, X.Y. and Wang, L.F. and Ding, K. and Xiang, S.M. and Pan, C.",
  TITLE = "Dense semantic embedding network for image captioning",
  JOURNAL = PR,
  VOLUME = "90",
  YEAR = "2019",
  PAGES = "285--296",
  BIBSOURCE = "http://www.visionbib.com/bibliography/match607ic1.html#TT110859"
}

@article{bb114635,
  AUTHOR = "Foumani, S.N.M. and Nickabadi, A.",
  TITLE = "A probabilistic topic model using deep visual word representation for simultaneous image classification and annotation",
  JOURNAL = JVCIR,
  VOLUME = "59",
  YEAR = "2019",
  PAGES = "195--203",
  BIBSOURCE = "http://www.visionbib.com/bibliography/match607ic1.html#TT110860"
}

@article{bb114636,
  AUTHOR = "Zhang, X.R. and Wang, X. and Tang, X. and Zhou, H.Y. and Li, C.",
  TITLE = "Description Generation for Remote Sensing Images Using Attribute Attention Mechanism",
  JOURNAL = RS,
  VOLUME = "11",
  YEAR = "2019",
  NUMBER = "6",
  PAGES = "xx-yy",
  BIBSOURCE = "http://www.visionbib.com/bibliography/match607ic1.html#TT110861"
}

@article{bb114637,
  AUTHOR = "Zheng, H. and Wu, J.H. and Liang, R. and Li, Y. and Li, X.Z.",
  TITLE = "Multi-task learning for captioning images with novel words",
  JOURNAL = IET-CV,
  VOLUME = "13",
  YEAR = "2019",
  NUMBER = "3",
  MONTH = "April",
  PAGES = "294--301",
  BIBSOURCE = "http://www.visionbib.com/bibliography/match607ic1.html#TT110862"
}

@article{bb114638,
  AUTHOR = "Ding, S.T. and Qu, S. and Xi, Y.L. and Sangaiah, A.K. and Wan, S.H.",
  TITLE = "Image caption generation with high-level image features",
  JOURNAL = PRL,
  VOLUME = "123",
  YEAR = "2019",
  PAGES = "89--95",
  BIBSOURCE = "http://www.visionbib.com/bibliography/match607ic1.html#TT110863"
}

@article{bb114639,
  AUTHOR = "Liu, X.X. and Xu, Q.Y. and Wang, N.",
  TITLE = "A survey on deep neural network-based image captioning",
  JOURNAL = VC,
  VOLUME = "35",
  YEAR = "2019",
  NUMBER = "3",
  MONTH = "March",
  PAGES = "445--470",
  BIBSOURCE = "http://www.visionbib.com/bibliography/match607ic1.html#TT110864"
}

@article{bb114640,
  AUTHOR = "Hossain, M.Z. and Sohel, F. and Shiratuddin, M.F. and Laga, H.",
  TITLE = "A Comprehensive Survey of Deep Learning for Image Captioning",
  JOURNAL = Surveys,
  VOLUME = "51",
  YEAR = "2019",
  NUMBER = "6",
  MONTH = "February",
  PAGES = "Article No 118",
  BIBSOURCE = "http://www.visionbib.com/bibliography/match607ic1.html#TT110865"
}

@article{bb114641,
  AUTHOR = "Peng, Y.Q. and Liu, X. and Wang, W.H. and Zhao, X.S. and Wei, M.",
  TITLE = "Image caption model of double LSTM with scene factors",
  JOURNAL = IVC,
  VOLUME = "86",
  YEAR = "2019",
  PAGES = "38--44",
  BIBSOURCE = "http://www.visionbib.com/bibliography/match607ic1.html#TT110866"
}

@article{bb114642,
  AUTHOR = "Zhang, J.J. and Wu, Q. and Zhang, J. and Shen, C.H. and Lu, J.F. and Wu, Q.A.",
  TITLE = "Heritage image annotation via collective knowledge",
  JOURNAL = PR,
  VOLUME = "93",
  YEAR = "2019",
  PAGES = "204--214",
  BIBSOURCE = "http://www.visionbib.com/bibliography/match607ic1.html#TT110867"
}

@article{bb114643,
  AUTHOR = "Verma, Y.",
  TITLE = "Diverse image annotation with missing labels",
  JOURNAL = PR,
  VOLUME = "93",
  YEAR = "2019",
  PAGES = "470--484",
  BIBSOURCE = "http://www.visionbib.com/bibliography/match607ic1.html#TT110868"
}

@article{bb114644,
  AUTHOR = "Markatopoulou, F. and Mezaris, V. and Patras, I.",
  TITLE = "Implicit and Explicit Concept Relations in Deep Neural Networks for Multi-Label Video/Image Annotation",
  JOURNAL = CirSysVideo,
  VOLUME = "29",
  YEAR = "2019",
  NUMBER = "6",
  MONTH = "June",
  PAGES = "1631--1644",
  BIBSOURCE = "http://www.visionbib.com/bibliography/match607ic1.html#TT110869"
}

@article{bb114645,
  AUTHOR = "Zhang, Z.J. and Wu, Q. and Wang, Y. and Chen, F.",
  TITLE = "High-Quality Image Captioning With Fine-Grained and Semantic-Guided Visual Attention",
  JOURNAL = MultMed,
  VOLUME = "21",
  YEAR = "2019",
  NUMBER = "7",
  MONTH = "July",
  PAGES = "1681--1693",
  BIBSOURCE = "http://www.visionbib.com/bibliography/match607ic1.html#TT110870"
}

@inproceedings{bb114646,
  AUTHOR = "Zhang, Z.J. and Wu, Q. and Wang, Y. and Chen, F.",
  TITLE = "Fine-Grained and Semantic-Guided Visual Attention for Image Captioning",
  BOOKTITLE = WACV18,
  YEAR = "2018",
  PAGES = "1709--1717",
  BIBSOURCE = "http://www.visionbib.com/bibliography/match607ic1.html#TT110871"
}

@article{bb114647,
  AUTHOR = "Laib, L. and Allili, M.S. and Ait Aoudia, S.",
  TITLE = "A probabilistic topic model for event-based image classification and multi-label annotation",
  JOURNAL = SP:IC,
  VOLUME = "76",
  YEAR = "2019",
  PAGES = "283--294",
  BIBSOURCE = "http://www.visionbib.com/bibliography/match607ic1.html#TT110872"
}

@article{bb114648,
  AUTHOR = "Olaode, A. and Naghdy, G.",
  TITLE = "Review of the application of machine learning to the automatic semantic annotation of images",
  JOURNAL = IET-IPR,
  VOLUME = "13",
  YEAR = "2019",
  NUMBER = "8",
  MONTH = "June",
  PAGES = "1232--1245",
  BIBSOURCE = "http://www.visionbib.com/bibliography/match607ic1.html#TT110873"
}

@article{bb114649,
  AUTHOR = "Li, X. and Jiang, S.",
  TITLE = "Know More Say Less: Image Captioning Based on Scene Graphs",
  JOURNAL = MultMed,
  VOLUME = "21",
  YEAR = "2019",
  NUMBER = "8",
  MONTH = "August",
  PAGES = "2117--2130",
  BIBSOURCE = "http://www.visionbib.com/bibliography/match607ic1.html#TT110874"
}

@article{bb114650,
  AUTHOR = "Zhang, C.J. and Cheng, J. and Tian, Q.",
  TITLE = "Multiview, Few-Labeled Object Categorization by Predicting Labels With View Consistency",
  JOURNAL = Cyber,
  VOLUME = "49",
  YEAR = "2019",
  NUMBER = "11",
  MONTH = "November",
  PAGES = "3834--3843",
  BIBSOURCE = "http://www.visionbib.com/bibliography/match607ic1.html#TT110875"
}

@article{bb114651,
  AUTHOR = "Sharif, N. and White, L. and Bennamoun, M. and Liu, W. and Shah, S.A.A.",
  TITLE = "LCEval: Learned Composite Metric for Caption Evaluation",
  JOURNAL = IJCV,
  VOLUME = "127",
  YEAR = "2019",
  NUMBER = "10",
  MONTH = "October",
  PAGES = "1586--1610",
  BIBSOURCE = "http://www.visionbib.com/bibliography/match607ic1.html#TT110876"
}

@article{bb114652,
  AUTHOR = "Zhang, Z.Y. and Diao, W.H. and Zhang, W.K. and Yan, M.L. and Gao, X. and Sun, X.",
  TITLE = "LAM: Remote Sensing Image Captioning with Label-Attention Mechanism",
  JOURNAL = RS,
  VOLUME = "11",
  YEAR = "2019",
  NUMBER = "20",
  PAGES = "xx-yy",
  BIBSOURCE = "http://www.visionbib.com/bibliography/match607ic1.html#TT110877"
}

@article{bb114653,
  AUTHOR = "Fu, K. and Li, Y. and Zhang, W.K. and Yu, H.F. and Sun, X.",
  TITLE = "Boosting Memory with a Persistent Memory Mechanism for Remote Sensing Image Captioning",
  JOURNAL = RS,
  VOLUME = "12",
  YEAR = "2020",
  NUMBER = "11",
  PAGES = "xx-yy",
  BIBSOURCE = "http://www.visionbib.com/bibliography/match607ic1.html#TT110878"
}

@article{bb114654,
  AUTHOR = "Tan, J.H. and Chan, C.S. and Chuah, J.H.",
  TITLE = "COMIC: Toward A Compact Image Captioning Model With Attention",
  JOURNAL = MultMed,
  VOLUME = "21",
  YEAR = "2019",
  NUMBER = "10",
  MONTH = "October",
  PAGES = "2686--2696",
  BIBSOURCE = "http://www.visionbib.com/bibliography/match607ic1.html#TT110879"
}

@article{bb114655,
  AUTHOR = "Zhou, L. and Zhang, Y. and Jiang, Y. and Zhang, T. and Fan, W.",
  TITLE = "Re-Caption: Saliency-Enhanced Image Captioning Through Two-Phase Learning",
  JOURNAL = IP,
  VOLUME = "29",
  YEAR = "2020",
  NUMBER = "1",
  PAGES = "694--709",
  BIBSOURCE = "http://www.visionbib.com/bibliography/match607ic1.html#TT110880"
}

@article{bb114656,
  AUTHOR = "Yang, L. and Hu, H.F.",
  TITLE = "Visual Skeleton and Reparative Attention for Part-of-Speech image captioning system",
  JOURNAL = CVIU,
  VOLUME = "189",
  YEAR = "2019",
  PAGES = "102819",
  BIBSOURCE = "http://www.visionbib.com/bibliography/match607ic1.html#TT110881"
}

@article{bb114657,
  AUTHOR = "Wang, J.B. and Wang, W. and Wang, L. and Wang, Z.Y. and Feng, D.D. and Tan, T.N.",
  TITLE = "Learning visual relationship and context-aware attention for image captioning",
  JOURNAL = PR,
  VOLUME = "98",
  YEAR = "2020",
  PAGES = "107075",
  BIBSOURCE = "http://www.visionbib.com/bibliography/match607ic1.html#TT110882"
}

@article{bb114658,
  AUTHOR = "Xiao, X. and Wang, L. and Ding, K. and Xiang, S. and Pan, C.",
  TITLE = "Deep Hierarchical Encoder-Decoder Network for Image Captioning",
  JOURNAL = MultMed,
  VOLUME = "21",
  YEAR = "2019",
  NUMBER = "11",
  MONTH = "November",
  PAGES = "2942--2956",
  BIBSOURCE = "http://www.visionbib.com/bibliography/match607ic1.html#TT110883"
}

@article{bb114659,
  AUTHOR = "Jiang, T. and Zhang, Z. and Yang, Y.",
  TITLE = "Modeling coverage with semantic embedding for image caption generation",
  JOURNAL = VC,
  VOLUME = "35",
  YEAR = "2019",
  NUMBER = "11",
  MONTH = "November",
  PAGES = "1655--1665",
  BIBSOURCE = "http://www.visionbib.com/bibliography/match607ic1.html#TT110884"
}

@article{bb114660,
  AUTHOR = "Tang, C. and Liu, X. and Wang, P. and Zhang, C. and Li, M. and Wang, L.",
  TITLE = "Adaptive Hypergraph Embedded Semi-Supervised Multi-Label Image Annotation",
  JOURNAL = MultMed,
  VOLUME = "21",
  YEAR = "2019",
  NUMBER = "11",
  MONTH = "November",
  PAGES = "2837--2849",
  BIBSOURCE = "http://www.visionbib.com/bibliography/match607ic1.html#TT110885"
}

@article{bb114661,
  AUTHOR = "Mundnich, K. and Booth, B.M. and Girault, B. and Narayanan, S.",
  TITLE = "Generating labels for regression of subjective constructs using triplet embeddings",
  JOURNAL = PRL,
  VOLUME = "128",
  YEAR = "2019",
  PAGES = "385--392",
  BIBSOURCE = "http://www.visionbib.com/bibliography/match607ic1.html#TT110886"
}

@article{bb114662,
  AUTHOR = "Lu, X. and Wang, B. and Zheng, X.",
  TITLE = "Sound Active Attention Framework for Remote Sensing Image Captioning",
  JOURNAL = GeoRS,
  VOLUME = "58",
  YEAR = "2020",
  NUMBER = "3",
  MONTH = "March",
  PAGES = "1985--2000",
  BIBSOURCE = "http://www.visionbib.com/bibliography/match607ic1.html#TT110887"
}

@article{bb114663,
  AUTHOR = "Wu, L. and Xu, M. and Wang, J. and Perry, S.",
  TITLE = "Recall What You See Continually Using GridLSTM in Image Captioning",
  JOURNAL = MultMed,
  VOLUME = "22",
  YEAR = "2020",
  NUMBER = "3",
  MONTH = "March",
  PAGES = "808--818",
  BIBSOURCE = "http://www.visionbib.com/bibliography/match607ic1.html#TT110888"
}

@article{bb114664,
  AUTHOR = "Li, Y.Y. and Fang, S.K. and Jiao, L.C. and Liu, R.J. and Shang, R.H.",
  TITLE = "A Multi-Level Attention Model for Remote Sensing Image Captions",
  JOURNAL = RS,
  VOLUME = "12",
  YEAR = "2020",
  NUMBER = "6",
  PAGES = "xx-yy",
  BIBSOURCE = "http://www.visionbib.com/bibliography/match607ic1.html#TT110889"
}

@article{bb114665,
  AUTHOR = "Chaudhary, C. and Goyal, P. and Prasad, D.N. and Chen, Y.P.",
  TITLE = "Enhancing the Quality of Image Tagging Using a Visio-Textual Knowledge Base",
  JOURNAL = MultMed,
  VOLUME = "22",
  YEAR = "2020",
  NUMBER = "4",
  MONTH = "April",
  PAGES = "897--911",
  BIBSOURCE = "http://www.visionbib.com/bibliography/match607ic1.html#TT110890"
}

@article{bb114666,
  AUTHOR = "Chen, X.H. and Zhang, M.X. and Wang, Z. and Zuo, L. and Li, B. and Yang, Y.",
  TITLE = "Leveraging unpaired out-of-domain data for image captioning",
  JOURNAL = PRL,
  VOLUME = "132",
  YEAR = "2020",
  PAGES = "132--140",
  BIBSOURCE = "http://www.visionbib.com/bibliography/match607ic1.html#TT110891"
}

@article{bb114667,
  AUTHOR = "Xu, N. and Zhang, H. and Liu, A. and Nie, W. and Su, Y. and Nie, J. and Zhang, Y.",
  TITLE = "Multi-Level Policy and Reward-Based Deep Reinforcement Learning Framework for Image Captioning",
  JOURNAL = MultMed,
  VOLUME = "22",
  YEAR = "2020",
  NUMBER = "5",
  MONTH = "May",
  PAGES = "1372--1383",
  BIBSOURCE = "http://www.visionbib.com/bibliography/match607ic1.html#TT110892"
}

@article{bb114668,
  AUTHOR = "Deng, Z.R. and Jiang, Z.Q. and Lan, R. and Huang, W.M. and Luo, X.N.",
  TITLE = "Image captioning using DenseNet network and adaptive attention",
  JOURNAL = SP:IC,
  VOLUME = "85",
  YEAR = "2020",
  PAGES = "115836",
  BIBSOURCE = "http://www.visionbib.com/bibliography/match607ic1.html#TT110893"
}

@article{bb114669,
  AUTHOR = "Ji, J. and Xu, C. and Zhang, X. and Wang, B. and Song, X.",
  TITLE = "Spatio-Temporal Memory Attention for Image Captioning",
  JOURNAL = IP,
  VOLUME = "29",
  YEAR = "2020",
  PAGES = "7615--7628",
  BIBSOURCE = "http://www.visionbib.com/bibliography/match607ic1.html#TT110894"
}

@article{bb114670,
  AUTHOR = "Guo, L. and Liu, J. and Lu, S. and Lu, H.",
  TITLE = "Show, Tell, and Polish: Ruminant Decoding for Image Captioning",
  JOURNAL = MultMed,
  VOLUME = "22",
  YEAR = "2020",
  NUMBER = "8",
  MONTH = "August",
  PAGES = "2149--2162",
  BIBSOURCE = "http://www.visionbib.com/bibliography/match607ic1.html#TT110895"
}

@article{bb114671,
  AUTHOR = "Khatchatoorian, A.G. and Jamzad, M.",
  TITLE = "Architecture to improve the accuracy of automatic image annotation systems",
  JOURNAL = IET-CV,
  VOLUME = "14",
  YEAR = "2020",
  NUMBER = "5",
  MONTH = "August",
  PAGES = "214--223",
  BIBSOURCE = "http://www.visionbib.com/bibliography/match607ic1.html#TT110896"
}

@article{bb114672,
  AUTHOR = "Theodosiou, Z. and Tsapatsoulis, N.",
  TITLE = "Image annotation: the effects of content, lexicon and annotation method",
  JOURNAL = MultInfoRetr,
  VOLUME = "9",
  YEAR = "2020",
  NUMBER = "3",
  MONTH = "September",
  PAGES = "191--203",
  BIBSOURCE = "http://www.visionbib.com/bibliography/match607ic1.html#TT110897"
}

@article{bb114673,
  AUTHOR = "Che, W.B. and Fan, X.P. and Xiong, R.Q. and Zhao, D.B.",
  TITLE = "Visual Relationship Embedding Network for Image Paragraph Generation",
  JOURNAL = MultMed,
  VOLUME = "22",
  YEAR = "2020",
  NUMBER = "9",
  MONTH = "September",
  PAGES = "2307--2320",
  BIBSOURCE = "http://www.visionbib.com/bibliography/match607ic1.html#TT110898"
}

@article{bb114674,
  AUTHOR = "Feng, Q. and Wu, Y. and Fan, H. and Yan, C. and Xu, M. and Yang, Y.",
  TITLE = "Cascaded Revision Network for Novel Object Captioning",
  JOURNAL = CirSysVideo,
  VOLUME = "30",
  YEAR = "2020",
  NUMBER = "10",
  MONTH = "October",
  PAGES = "3413--3421",
  BIBSOURCE = "http://www.visionbib.com/bibliography/match607ic1.html#TT110899"
}

@article{bb114675,
  AUTHOR = "Wei, H.Y. and Li, Z.X. and Zhang, C.L. and Ma, H.F.",
  TITLE = "The synergy of double attention: Combine sentence-level and word-level attention for image captioning",
  JOURNAL = CVIU,
  VOLUME = "201",
  YEAR = "2020",
  PAGES = "103068",
  BIBSOURCE = "http://www.visionbib.com/bibliography/match607ic1.html#TT110900"
}

@article{bb114676,
  AUTHOR = "Shilpa, M. and He, J. and Zhao, Y. and Sun, B. and Yu, L.J.",
  TITLE = "Feedback evaluations to promote image captioning",
  JOURNAL = IET-IPR,
  VOLUME = "14",
  YEAR = "2020",
  NUMBER = "13",
  MONTH = "November",
  PAGES = "3021--3027",
  BIBSOURCE = "http://www.visionbib.com/bibliography/match607ic1.html#TT110901"
}

@article{bb114677,
  AUTHOR = "Zhang, J. and Mei, K. and Zheng, Y. and Fan, J.",
  TITLE = "Integrating Part of Speech Guidance for Image Captioning",
  JOURNAL = MultMed,
  VOLUME = "23",
  YEAR = "2021",
  PAGES = "92--104",
  BIBSOURCE = "http://www.visionbib.com/bibliography/match607ic1.html#TT110902"
}

@inproceedings{bb114678,
  AUTHOR = "Sharif, N. and Jalwana, M.A.A.K. and Bennamoun, M. and Liu, W. and Shah, S.A.A.",
  TITLE = "Leveraging Linguistically-aware Object Relations and NASNet for Image Captioning",
  BOOKTITLE = IVCNZ20,
  YEAR = "2020",
  PAGES = "1--6",
  BIBSOURCE = "http://www.visionbib.com/bibliography/match607ic1.html#TT110903"
}

@article{bb114679,
  AUTHOR = "Gouthaman, K.V. and Nambiar, A. and Srinivas, K.S. and Mittal, A.",
  TITLE = "Linguistically-aware attention for reducing the semantic gap in vision-language tasks",
  JOURNAL = PR,
  VOLUME = "112",
  YEAR = "2021",
  PAGES = "107812",
  BIBSOURCE = "http://www.visionbib.com/bibliography/match607ic1.html#TT110904"
}

@article{bb114680,
  AUTHOR = "Liu, H. and Zhang, S. and Lin, K. and Wen, J. and Li, J. and Hu, X.",
  TITLE = "Vocabulary-Wide Credit Assignment for Training Image Captioning Models",
  JOURNAL = IP,
  VOLUME = "30",
  YEAR = "2021",
  PAGES = "2450--2460",
  BIBSOURCE = "http://www.visionbib.com/bibliography/match607ic1.html#TT110905"
}

@article{bb114681,
  AUTHOR = "Xu, N. and Tian, H.S. and Wang, Y.H. and Nie, W.Z. and Song, D. and Liu, A.A. and Liu, W.",
  TITLE = "Coupled-dynamic learning for vision and language: Exploring Interaction between different tasks",
  JOURNAL = PR,
  VOLUME = "113",
  YEAR = "2021",
  PAGES = "107829",
  BIBSOURCE = "http://www.visionbib.com/bibliography/match607ic1.html#TT110906"
}

@article{bb114682,
  AUTHOR = "Zhang, J. and Li, K.K. and Wang, Z.",
  TITLE = "Parallel-fusion LSTM with synchronous semantic and visual information for image captioning",
  JOURNAL = JVCIR,
  VOLUME = "75",
  YEAR = "2021",
  PAGES = "103044",
  BIBSOURCE = "http://www.visionbib.com/bibliography/match607ic1.html#TT110907"
}

@article{bb114683,
  AUTHOR = "Yang, L. and Wang, H. and Tang, P. and Li, Q.",
  TITLE = "CaptionNet: A Tailor-made Recurrent Neural Network for Generating Image Descriptions",
  JOURNAL = MultMed,
  VOLUME = "23",
  YEAR = "2021",
  PAGES = "835--845",
  BIBSOURCE = "http://www.visionbib.com/bibliography/match607ic1.html#TT110908"
}

@article{bb114684,
  AUTHOR = "Liu, A.A. and Wang, Y.H. and Xu, N. and Liu, S. and Li, X.",
  TITLE = "Scene-Graph-Guided message passing network for dense captioning",
  JOURNAL = PRL,
  VOLUME = "145",
  YEAR = "2021",
  PAGES = "187--193",
  BIBSOURCE = "http://www.visionbib.com/bibliography/match607ic1.html#TT110909"
}

@article{bb114685,
  AUTHOR = "Zhang, L. and Zhang, Y.S. and Zhao, X. and Zou, Z.X.",
  TITLE = "Image captioning via proximal policy optimization",
  JOURNAL = IVC,
  VOLUME = "108",
  YEAR = "2021",
  PAGES = "104126",
  BIBSOURCE = "http://www.visionbib.com/bibliography/match607ic1.html#TT110910"
}

@article{bb114686,
  AUTHOR = "Ji, J.Z. and Du, Z.R. and Zhang, X.D.",
  TITLE = "Divergent-convergent attention for image captioning",
  JOURNAL = PR,
  VOLUME = "115",
  YEAR = "2021",
  PAGES = "107928",
  BIBSOURCE = "http://www.visionbib.com/bibliography/match607ic1.html#TT110911"
}

@article{bb114687,
  AUTHOR = "Wei, Y.W. and Wu, C.L. and Jia, Z.Y. and Hu, X. and Guo, S. and Shi, H.T.",
  TITLE = "Past is important: Improved image captioning by looking back in time",
  JOURNAL = SP:IC,
  VOLUME = "94",
  YEAR = "2021",
  PAGES = "116183",
  BIBSOURCE = "http://www.visionbib.com/bibliography/match607ic1.html#TT110912"
}

@article{bb114688,
  AUTHOR = "Zhang, Z.J. and Wu, Q. and Wang, Y. and Chen, F.",
  TITLE = "Exploring region relationships implicitly: Image captioning with visual relationship attention",
  JOURNAL = IVC,
  VOLUME = "109",
  YEAR = "2021",
  PAGES = "104146",
  BIBSOURCE = "http://www.visionbib.com/bibliography/match607ic1.html#TT110913"
}

@article{bb114689,
  AUTHOR = "Zhang, Z.J. and Wu, Q. and Wang, Y. and Chen, F.",
  TITLE = "Exploring Pairwise Relationships Adaptively From Linguistic Context in Image Captioning",
  JOURNAL = MultMed,
  VOLUME = "24",
  YEAR = "2022",
  PAGES = "3101--3113",
  BIBSOURCE = "http://www.visionbib.com/bibliography/match607ic1.html#TT110914"
}

@article{bb114690,
  AUTHOR = "Li, X.L. and Zhang, X.T. and Huang, W. and Wang, Q.",
  TITLE = "Truncation Cross Entropy Loss for Remote Sensing Image Captioning",
  JOURNAL = GeoRS,
  VOLUME = "59",
  YEAR = "2021",
  NUMBER = "6",
  MONTH = "June",
  PAGES = "5246--5257",
  BIBSOURCE = "http://www.visionbib.com/bibliography/match607ic1.html#TT110915"
}

@article{bb114691,
  AUTHOR = "He, S. and Lu, Y.Y. and Chen, S.N.",
  TITLE = "Image Captioning Algorithm Based on Multi-Branch CNN and Bi-LSTM",
  JOURNAL = IEICE,
  VOLUME = "E104-D",
  YEAR = "2021",
  NUMBER = "7",
  MONTH = "July",
  PAGES = "941--947",
  BIBSOURCE = "http://www.visionbib.com/bibliography/match607ic1.html#TT110916"
}

@article{bb114692,
  AUTHOR = "Zhong, X. and Nie, G.Z. and Huang, W.X. and Liu, W.X. and Ma, B. and Lin, C.W.",
  TITLE = "Attention-guided image captioning with adaptive global and local feature fusion",
  JOURNAL = JVCIR,
  VOLUME = "78",
  YEAR = "2021",
  PAGES = "103138",
  BIBSOURCE = "http://www.visionbib.com/bibliography/match607ic1.html#TT110917"
}

@article{bb114693,
  AUTHOR = "Sumbul, G. and Nayak, S. and Demir, B.",
  TITLE = "SD-RSIC: Summarization-Driven Deep Remote Sensing Image Captioning",
  JOURNAL = GeoRS,
  VOLUME = "59",
  YEAR = "2021",
  NUMBER = "8",
  MONTH = "August",
  PAGES = "6922--6934",
  BIBSOURCE = "http://www.visionbib.com/bibliography/match607ic1.html#TT110918"
}

@article{bb114694,
  AUTHOR = "Wu, J. and Chen, T.S. and Wu, H.F. and Yang, Z. and Luo, G.C. and Lin, L.",
  TITLE = "Fine-Grained Image Captioning With Global-Local Discriminative Objective",
  JOURNAL = MultMed,
  VOLUME = "23",
  YEAR = "2021",
  PAGES = "2413--2427",
  BIBSOURCE = "http://www.visionbib.com/bibliography/match607ic1.html#TT110919"
}

@article{bb114695,
  AUTHOR = "Wu, L.X. and Xu, M. and Sang, L. and Yao, T. and Mei, T.",
  TITLE = "Noise Augmented Double-Stream Graph Convolutional Networks for Image Captioning",
  JOURNAL = CirSysVideo,
  VOLUME = "31",
  YEAR = "2021",
  NUMBER = "8",
  MONTH = "August",
  PAGES = "3118--3127",
  BIBSOURCE = "http://www.visionbib.com/bibliography/match607ic1.html#TT110920"
}

@article{bb114696,
  AUTHOR = "Nivedita, M. and Chandrashekar, P. and Mahapatra, S. and Phamila, Y.A.V. and Selvaperumal, S.K.",
  TITLE = "Image Captioning for Video Surveillance System using Neural Networks",
  JOURNAL = IJIG,
  VOLUME = "21",
  YEAR = "2021",
  NUMBER = "4",
  MONTH = "October",
  PAGES = "2150044",
  BIBSOURCE = "http://www.visionbib.com/bibliography/match607ic1.html#TT110921"
}

@article{bb114697,
  AUTHOR = "Haghighi, F. and Taher, M.R.H. and Zhou, Z.W. and Gotway, M.B. and Liang, J.M.",
  TITLE = "Transferable Visual Words: Exploiting the Semantics of Anatomical Patterns for Self-Supervised Learning",
  JOURNAL = MedImg,
  VOLUME = "40",
  YEAR = "2021",
  NUMBER = "10",
  MONTH = "October",
  PAGES = "2857--2868",
  BIBSOURCE = "http://www.visionbib.com/bibliography/match607ic1.html#TT110922"
}

@article{bb114698,
  AUTHOR = "Wang, Q. and Huang, W. and Zhang, X. and Li, X.L.",
  TITLE = "Word-Sentence Framework for Remote Sensing Image Captioning",
  JOURNAL = GeoRS,
  VOLUME = "59",
  YEAR = "2021",
  NUMBER = "12",
  MONTH = "December",
  PAGES = "10532--10543",
  BIBSOURCE = "http://www.visionbib.com/bibliography/match607ic1.html#TT110923"
}

@article{bb114699,
  AUTHOR = "Wan, B.Y. and Jiang, W.H. and Fang, Y.M. and Zhu, M.W. and Li, Q. and Liu, Y.",
  TITLE = "Revisiting image captioning via maximum discrepancy competition",
  JOURNAL = PR,
  VOLUME = "122",
  YEAR = "2022",
  PAGES = "108358",
  BIBSOURCE = "http://www.visionbib.com/bibliography/match607ic1.html#TT110924"
}