@article{bb122700,
  author    = {Chen, X.H. and Zhang, M.X. and Wang, Z. and Zuo, L. and Li, B. and Yang, Y.},
  title     = {Leveraging unpaired out-of-domain data for image captioning},
  journal   = PRL,
  volume    = {132},
  year      = {2020},
  pages     = {132-140},
  bibsource = {http://www.visionbib.com/bibliography/match607ic1.html#TT118804},
}

@article{bb122701,
  author    = {Xu, N. and Zhang, H. and Liu, A. and Nie, W. and Su, Y. and Nie, J. and Zhang, Y.},
  title     = {Multi-Level Policy and Reward-Based Deep Reinforcement Learning Framework for Image Captioning},
  journal   = MultMed,
  volume    = {22},
  year      = {2020},
  number    = {5},
  month     = {May},
  pages     = {1372-1383},
  bibsource = {http://www.visionbib.com/bibliography/match607ic1.html#TT118805},
}

@article{bb122702,
  author    = {Guo, L. and Liu, J. and Lu, S. and Lu, H.},
  title     = {Show, Tell, and Polish: Ruminant Decoding for Image Captioning},
  journal   = MultMed,
  volume    = {22},
  year      = {2020},
  number    = {8},
  month     = {August},
  pages     = {2149-2162},
  bibsource = {http://www.visionbib.com/bibliography/match607ic1.html#TT118806},
}

@article{bb122703,
  author    = {Feng, Q. and Wu, Y. and Fan, H. and Yan, C. and Xu, M. and Yang, Y.},
  title     = {Cascaded Revision Network for Novel Object Captioning},
  journal   = CirSysVideo,
  volume    = {30},
  year      = {2020},
  number    = {10},
  month     = {October},
  pages     = {3413-3421},
  bibsource = {http://www.visionbib.com/bibliography/match607ic1.html#TT118807},
}

@article{bb122704,
  author    = {Wei, H.Y. and Li, Z.X. and Zhang, C.L. and Ma, H.F.},
  title     = {The synergy of double attention: Combine sentence-level and word-level attention for image captioning},
  journal   = CVIU,
  volume    = {201},
  year      = {2020},
  pages     = {103068},
  bibsource = {http://www.visionbib.com/bibliography/match607ic1.html#TT118808},
}

@article{bb122705,
  author    = {Shilpa, M. and He, J. and Zhao, Y.J. and Sun, B. and Yu, L.J.},
  title     = {Feedback evaluations to promote image captioning},
  journal   = IET-IPR,
  volume    = {14},
  year      = {2020},
  number    = {13},
  month     = {November},
  pages     = {3021-3027},
  bibsource = {http://www.visionbib.com/bibliography/match607ic1.html#TT118809},
}

@article{bb122706,
  author    = {Liu, H. and Zhang, S. and Lin, K. and Wen, J. and Li, J. and Hu, X.},
  title     = {Vocabulary-Wide Credit Assignment for Training Image Captioning Models},
  journal   = IP,
  volume    = {30},
  year      = {2021},
  pages     = {2450-2460},
  bibsource = {http://www.visionbib.com/bibliography/match607ic1.html#TT118810},
}

@article{bb122707,
  author    = {Xu, N. and Tian, H.S. and Wang, Y.H. and Nie, W.Z. and Song, D. and Liu, A.A. and Liu, W.},
  title     = {Coupled-dynamic learning for vision and language: Exploring Interaction between different tasks},
  journal   = PR,
  volume    = {113},
  year      = {2021},
  pages     = {107829},
  bibsource = {http://www.visionbib.com/bibliography/match607ic1.html#TT118811},
}

@article{bb122708,
  author    = {Yang, L. and Wang, H. and Tang, P. and Li, Q.},
  title     = {CaptionNet: A Tailor-made Recurrent Neural Network for Generating Image Descriptions},
  journal   = MultMed,
  volume    = {23},
  year      = {2021},
  pages     = {835-845},
  bibsource = {http://www.visionbib.com/bibliography/match607ic1.html#TT118812},
}

@article{bb122709,
  author    = {Liu, A.A. and Wang, Y.H. and Xu, N. and Liu, S. and Li, X.},
  title     = {Scene-Graph-Guided message passing network for dense captioning},
  journal   = PRL,
  volume    = {145},
  year      = {2021},
  pages     = {187-193},
  bibsource = {http://www.visionbib.com/bibliography/match607ic1.html#TT118813},
}

@article{bb122710,
  author    = {Zhang, L. and Zhang, Y.S. and Zhao, X. and Zou, Z.X.},
  title     = {Image captioning via proximal policy optimization},
  journal   = IVC,
  volume    = {108},
  year      = {2021},
  pages     = {104126},
  bibsource = {http://www.visionbib.com/bibliography/match607ic1.html#TT118814},
}

@article{bb122711,
  author    = {Ji, J.Z. and Du, Z.R. and Zhang, X.D.},
  title     = {Divergent-convergent attention for image captioning},
  journal   = PR,
  volume    = {115},
  year      = {2021},
  pages     = {107928},
  bibsource = {http://www.visionbib.com/bibliography/match607ic1.html#TT118815},
}

@article{bb122712,
  author    = {Wei, Y.W. and Wu, C.L. and Jia, Z.Y. and Hu, X. and Guo, S. and Shi, H.T.},
  title     = {Past is important: Improved image captioning by looking back in time},
  journal   = SP:IC,
  volume    = {94},
  year      = {2021},
  pages     = {116183},
  bibsource = {http://www.visionbib.com/bibliography/match607ic1.html#TT118816},
}

@article{bb122713,
  author    = {Zhang, Z.J. and Wu, Q. and Wang, Y. and Chen, F.},
  title     = {Exploring region relationships implicitly: Image captioning with visual relationship attention},
  journal   = IVC,
  volume    = {109},
  year      = {2021},
  pages     = {104146},
  bibsource = {http://www.visionbib.com/bibliography/match607ic1.html#TT118817},
}

@article{bb122714,
  author    = {Zhang, Z.J. and Wu, Q. and Wang, Y. and Chen, F.},
  title     = {Exploring Pairwise Relationships Adaptively From Linguistic Context in Image Captioning},
  journal   = MultMed,
  volume    = {24},
  year      = {2022},
  pages     = {3101-3113},
  bibsource = {http://www.visionbib.com/bibliography/match607ic1.html#TT118818},
}

@article{bb122715,
  author    = {Li, X.L. and Zhang, X.T. and Huang, W. and Wang, Q.},
  title     = {Truncation Cross Entropy Loss for Remote Sensing Image Captioning},
  journal   = GeoRS,
  volume    = {59},
  year      = {2021},
  number    = {6},
  month     = {June},
  pages     = {5246-5257},
  bibsource = {http://www.visionbib.com/bibliography/match607ic1.html#TT118819},
}

@article{bb122716,
  author    = {Zhong, X. and Nie, G.Z. and Huang, W.X. and Liu, W.X. and Ma, B. and Lin, C.W.},
  title     = {Attention-guided image captioning with adaptive global and local feature fusion},
  journal   = JVCIR,
  volume    = {78},
  year      = {2021},
  pages     = {103138},
  bibsource = {http://www.visionbib.com/bibliography/match607ic1.html#TT118820},
}

@article{bb122717,
  author    = {Sumbul, G. and Nayak, S. and Demir, B.},
  title     = {SD-RSIC: Summarization-Driven Deep Remote Sensing Image Captioning},
  journal   = GeoRS,
  volume    = {59},
  year      = {2021},
  number    = {8},
  month     = {August},
  pages     = {6922-6934},
  bibsource = {http://www.visionbib.com/bibliography/match607ic1.html#TT118821},
}

@article{bb122718,
  author    = {Wu, J. and Chen, T.S. and Wu, H.F. and Yang, Z. and Luo, G.C. and Lin, L.},
  title     = {Fine-Grained Image Captioning With Global-Local Discriminative Objective},
  journal   = MultMed,
  volume    = {23},
  year      = {2021},
  pages     = {2413-2427},
  bibsource = {http://www.visionbib.com/bibliography/match607ic1.html#TT118822},
}

@article{bb122719,
  author    = {Wu, L.X. and Xu, M. and Sang, L. and Yao, T. and Mei, T.},
  title     = {Noise Augmented Double-Stream Graph Convolutional Networks for Image Captioning},
  journal   = CirSysVideo,
  volume    = {31},
  year      = {2021},
  number    = {8},
  month     = {August},
  pages     = {3118-3127},
  bibsource = {http://www.visionbib.com/bibliography/match607ic1.html#TT118823},
}

@article{bb122720,
  author    = {Nivedita, M. and Chandrashekar, P. and Mahapatra, S. and Phamila, Y.A.V. and Selvaperumal, S.K.},
  title     = {Image Captioning for Video Surveillance System using Neural Networks},
  journal   = IJIG,
  volume    = {21},
  year      = {2021},
  number    = {4},
  month     = {October},
  pages     = {2150044},
  bibsource = {http://www.visionbib.com/bibliography/match607ic1.html#TT118824},
}

@article{bb122721,
  author    = {Wang, Q. and Huang, W. and Zhang, X.T. and Li, X.L.},
  title     = {Word-Sentence Framework for Remote Sensing Image Captioning},
  journal   = GeoRS,
  volume    = {59},
  year      = {2021},
  number    = {12},
  month     = {December},
  pages     = {10532-10543},
  bibsource = {http://www.visionbib.com/bibliography/match607ic1.html#TT118825},
}

@article{bb122722,
  author    = {Wan, B.Y. and Jiang, W.H. and Fang, Y.M. and Zhu, M.W. and Li, Q. and Liu, Y.},
  title     = {Revisiting image captioning via maximum discrepancy competition},
  journal   = PR,
  volume    = {122},
  year      = {2022},
  pages     = {108358},
  bibsource = {http://www.visionbib.com/bibliography/match607ic1.html#TT118826},
}

@article{bb122723,
  author    = {Chen, T.Y. and Li, Z.X. and Wu, J.L. and Ma, H.F. and Su, B.P.},
  title     = {Improving image captioning with Pyramid Attention and SC-GAN},
  journal   = IVC,
  volume    = {117},
  year      = {2022},
  pages     = {104340},
  bibsource = {http://www.visionbib.com/bibliography/match607ic1.html#TT118827},
}

@article{bb122724,
  author    = {Zhou, Y.J. and Long, J.F. and Xu, S.P. and Shang, L.},
  title     = {Attribute-driven image captioning via soft-switch pointer},
  journal   = PRL,
  volume    = {152},
  year      = {2021},
  pages     = {34-41},
  bibsource = {http://www.visionbib.com/bibliography/match607ic1.html#TT118828},
}

@article{bb122725,
  author    = {Zha, Z.J. and Liu, D. and Zhang, H.W. and Zhang, Y.D. and Wu, F.},
  title     = {Context-Aware Visual Policy Network for Fine-Grained Image Captioning},
  journal   = PAMI,
  volume    = {44},
  year      = {2022},
  number    = {2},
  month     = {February},
  pages     = {710-722},
  bibsource = {http://www.visionbib.com/bibliography/match607ic1.html#TT118829},
}

@article{bb122726,
  author    = {Wang, Q.Z. and Wan, J. and Chan, A.B.},
  title     = {On Diversity in Image Captioning: Metrics and Methods},
  journal   = PAMI,
  volume    = {44},
  year      = {2022},
  number    = {2},
  month     = {February},
  pages     = {1035-1049},
  bibsource = {http://www.visionbib.com/bibliography/match607ic1.html#TT118830},
}

@inproceedings{bb122727,
  author    = {Wang, J. and Xu, W.J. and Wang, Q.Z. and Chan, A.B.},
  title     = {Compare and Reweight: Distinctive Image Captioning Using Similar Images Sets},
  booktitle = ECCV20,
  year      = {2020},
  pages     = {I:370-386},
  bibsource = {http://www.visionbib.com/bibliography/match607ic1.html#TT118831},
}

@article{bb122728,
  author    = {Luo, G.F. and Cheng, L.J. and Jing, C. and Zhao, C. and Song, G.Z.},
  title     = {A thorough review of models, evaluation metrics, and datasets on image captioning},
  journal   = IET-IPR,
  volume    = {16},
  year      = {2022},
  number    = {2},
  pages     = {311-332},
  bibsource = {http://www.visionbib.com/bibliography/match607ic1.html#TT118832},
}

@article{bb122729,
        AUTHOR = "Ben, H.X. and Pan, Y.W. and Li, Y. and Yao, T. and Hong, R.C. and Wang, M. and Mei, T.",
        TITLE = "Unpaired Image Captioning With Semantic-Constrained Self-Learning",
        JOURNAL = MultMed,
        VOLUME = "24",
        YEAR = "2022",
        PAGES = "904-916",
        BIBSOURCE = "http://www.visionbib.com/bibliography/match607ic1.html#TT118833"}

@article{bb122730,
  author    = {Song, P.P. and Guo, D. and Zhou, J.X. and Xu, M.L. and Wang, M.},
  title     = {Memorial GAN With Joint Semantic Optimization for Unpaired Image Captioning},
  journal   = Cyber,
  volume    = {53},
  year      = {2023},
  number    = {7},
  month     = {July},
  pages     = {4388-4399},
  bibsource = {http://www.visionbib.com/bibliography/match607ic1.html#TT118834},
}

@inproceedings{bb122731,
  author    = {Li, Y. and Yao, T. and Pan, Y.W. and Chao, H.Y. and Mei, T.},
  title     = {Pointing Novel Objects in Image Captioning},
  booktitle = CVPR19,
  year      = {2019},
  pages     = {12489-12498},
  bibsource = {http://www.visionbib.com/bibliography/match607ic1.html#TT118835},
}

@article{bb122732,
  author    = {Liu, M.F. and Hu, H.J. and Li, L.J. and Yu, Y. and Guan, W.L.},
  title     = {Chinese Image Caption Generation via Visual Attention and Topic Modeling},
  journal   = Cyber,
  volume    = {52},
  year      = {2022},
  number    = {2},
  month     = {February},
  pages     = {1247-1257},
  bibsource = {http://www.visionbib.com/bibliography/match607ic1.html#TT118836},
}

@article{bb122733,
  author    = {Yang, Q.Q. and Ni, Z.H. and Ren, P.},
  title     = {Meta captioning: A meta learning based remote sensing image captioning framework},
  journal   = PandRS,
  volume    = {186},
  year      = {2022},
  pages     = {190-200},
  bibsource = {http://www.visionbib.com/bibliography/match607ic1.html#TT118837},
}

@article{bb122734,
  author    = {Yang, X. and Zhang, H.W. and Cai, J.F.},
  title     = {Auto-Encoding and Distilling Scene Graphs for Image Captioning},
  journal   = PAMI,
  volume    = {44},
  year      = {2022},
  number    = {5},
  month     = {May},
  pages     = {2313-2327},
  bibsource = {http://www.visionbib.com/bibliography/match607ic1.html#TT118838},
}

@article{bb122735,
  author    = {Yang, X. and Zhang, H.W. and Cai, J.F.},
  title     = {Deconfounded Image Captioning: A Causal Retrospect},
  journal   = PAMI,
  volume    = {45},
  year      = {2023},
  number    = {11},
  month     = {November},
  pages     = {12996-13010},
  bibsource = {http://www.visionbib.com/bibliography/match607ic1.html#TT118839},
}

@inproceedings{bb122736,
  author    = {Yang, X. and Tang, K. and Zhang, H.W. and Cai, J.F.},
  title     = {Auto-Encoding Scene Graphs for Image Captioning},
  booktitle = CVPR19,
  year      = {2019},
  pages     = {10677-10686},
  bibsource = {http://www.visionbib.com/bibliography/match607ic1.html#TT118840},
}

@article{bb122737,
  author    = {Yang, Z.P. and Wang, P.B. and Chu, T.S. and Yang, J.},
  title     = {Human-Centric Image Captioning},
  journal   = PR,
  volume    = {126},
  year      = {2022},
  pages     = {108545},
  bibsource = {http://www.visionbib.com/bibliography/match607ic1.html#TT118841},
}

@article{bb122738,
  author    = {Li, X. and Zhang, W.K. and Sun, X. and Gao, X.},
  title     = {Without detection: Two-step clustering features with local-global attention for image captioning},
  journal   = IET-CV,
  volume    = {16},
  year      = {2022},
  number    = {3},
  pages     = {280-294},
  bibsource = {http://www.visionbib.com/bibliography/match607ic1.html#TT118842},
}

% NUMBER is intentionally absent: the upstream record repeated the year (2022)
% there, and the other MultMed entries from 2021 onward in this file carry no
% issue number.
@article{bb122739,
        AUTHOR = "Yu, L.T. and Zhang, J. and Wu, Q.",
        TITLE = "Dual Attention on Pyramid Feature Maps for Image Captioning",
        JOURNAL = MultMed,
        VOLUME = "24",
        YEAR = "2022",
        PAGES = "1775-1786",
        BIBSOURCE = "http://www.visionbib.com/bibliography/match607ic1.html#TT118843"}

@article{bb122740,
  author    = {Zhang, M. and Chen, J.X. and Li, P.F. and Jiang, M. and Zhou, Z.},
  title     = {Topic scene graphs for image captioning},
  journal   = IET-CV,
  volume    = {16},
  year      = {2022},
  number    = {4},
  pages     = {364-375},
  bibsource = {http://www.visionbib.com/bibliography/match607ic1.html#TT118844},
}

@article{bb122741,
  author    = {Yu, Q. and Zhang, C.X. and Weng, L. and Xiang, S.M. and Pan, C.H.},
  title     = {Scene captioning with deep fusion of images and point clouds},
  journal   = PRL,
  volume    = {158},
  year      = {2022},
  pages     = {9-15},
  bibsource = {http://www.visionbib.com/bibliography/match607ic1.html#TT118845},
}

@article{bb122742,
  author    = {Chaudhari, C.P. and Devane, S.},
  title     = {Improved Framework using Rider Optimization Algorithm for Precise Image Caption Generation},
  journal   = IJIG,
  volume    = {22},
  year      = {2022},
  number    = {2},
  month     = {April},
  pages     = {2250021},
  bibsource = {http://www.visionbib.com/bibliography/match607ic1.html#TT118846},
}

@article{bb122743,
  author    = {Shao, X.J. and Xiang, Z.L. and Li, Y.X. and Zhang, M.J.},
  title     = {Variational joint self-attention for image captioning},
  journal   = IET-IPR,
  volume    = {16},
  year      = {2022},
  number    = {8},
  pages     = {2075-2086},
  bibsource = {http://www.visionbib.com/bibliography/match607ic1.html#TT118847},
}

@article{bb122744,
  author    = {Li, Y.C. and Wu, C. and Li, L. and Liu, Y.H. and Zhu, J.},
  title     = {Caption Generation From Road Images for Traffic Scene Modeling},
  journal   = ITS,
  volume    = {23},
  year      = {2022},
  number    = {7},
  month     = {July},
  pages     = {7805-7816},
  bibsource = {http://www.visionbib.com/bibliography/match607ic1.html#TT118848},
}

@article{bb122745,
  author    = {Wang, Y.H. and Xu, N. and Liu, A.A. and Li, W.H. and Zhang, Y.D.},
  title     = {High-Order Interaction Learning for Image Captioning},
  journal   = CirSysVideo,
  volume    = {32},
  year      = {2022},
  number    = {7},
  month     = {July},
  pages     = {4417-4430},
  bibsource = {http://www.visionbib.com/bibliography/match607ic1.html#TT118849},
}

@article{bb122746,
  author    = {Guo, D.D. and Lu, R.Y. and Chen, B. and Zeng, Z.Q. and Zhou, M.Y.},
  title     = {Matching Visual Features to Hierarchical Semantic Topics for Image Paragraph Captioning},
  journal   = IJCV,
  volume    = {130},
  year      = {2022},
  number    = {8},
  month     = {August},
  pages     = {1920-1937},
  bibsource = {http://www.visionbib.com/bibliography/match607ic1.html#TT118850},
}

@article{bb122747,
  author    = {Demirel, B. and Cinbis, R.G.},
  title     = {Caption generation on scenes with seen and unseen object categories},
  journal   = IVC,
  volume    = {124},
  year      = {2022},
  pages     = {104515},
  bibsource = {http://www.visionbib.com/bibliography/match607ic1.html#TT118851},
}

@article{bb122748,
  author    = {Liu, Z.Y. and Dong, A.M. and Yu, J.G. and Han, Y.B. and Zhou, Y. and Zhao, K.},
  title     = {Scene classification for remote sensing images with self-attention augmented CNN},
  journal   = IET-IPR,
  volume    = {16},
  year      = {2022},
  number    = {11},
  pages     = {3085-3096},
  bibsource = {http://www.visionbib.com/bibliography/match607ic1.html#TT118852},
}

@article{bb122749,
  author    = {Wu, X.X. and Zhao, W.T. and Luo, J.B.},
  title     = {Learning Cooperative Neural Modules for Stylized Image Captioning},
  journal   = IJCV,
  volume    = {130},
  year      = {2022},
  number    = {9},
  month     = {September},
  pages     = {2305-2320},
  bibsource = {http://www.visionbib.com/bibliography/match607ic1.html#TT118853},
}

% NOTE(review): the upstream record carried the placeholder page range "xx-yy",
% which would be printed verbatim in a bibliography, so PAGES is omitted here.
% The publisher's article number (believed to be 4606 -- unverified) should be
% added as PAGES once confirmed against the journal's record.
@article{bb122750,
        AUTHOR = "Zhou, H. and Du, X.P. and Xia, L. and Li, S.",
        TITLE = "Self-Learning for Few-Shot Remote Sensing Image Captioning",
        JOURNAL = RS,
        VOLUME = "14",
        YEAR = "2022",
        NUMBER = "18",
        BIBSOURCE = "http://www.visionbib.com/bibliography/match607ic1.html#TT118854"}

@article{bb122751,
  author    = {Stefanini, M. and Cornia, M. and Baraldi, L. and Cascianelli, S. and Fiameni, G. and Cucchiara, R.},
  title     = {From Show to Tell: A Survey on Deep Learning-Based Image Captioning},
  journal   = PAMI,
  volume    = {45},
  year      = {2023},
  number    = {1},
  month     = {January},
  pages     = {539-559},
  bibsource = {http://www.visionbib.com/bibliography/match607ic1.html#TT118855},
}

@article{bb122752,
  author    = {Wu, Y. and Jiang, L. and Yang, Y.},
  title     = {Switchable Novel Object Captioner},
  journal   = PAMI,
  volume    = {45},
  year      = {2023},
  number    = {1},
  month     = {January},
  pages     = {1162-1173},
  bibsource = {http://www.visionbib.com/bibliography/match607ic1.html#TT118856},
}

@article{bb122753,
  author    = {Yang, X. and Zhang, H.W. and Gao, C.Y. and Cai, J.F.},
  title     = {Learning to Collocate Visual-Linguistic Neural Modules for Image Captioning},
  journal   = IJCV,
  volume    = {131},
  year      = {2023},
  number    = {1},
  month     = {January},
  pages     = {82-100},
  bibsource = {http://www.visionbib.com/bibliography/match607ic1.html#TT118857},
}

@inproceedings{bb122754,
  author    = {Yang, X. and Zhang, H.W. and Cai, J.F.},
  title     = {Learning to Collocate Neural Modules for Image Captioning},
  booktitle = ICCV19,
  year      = {2019},
  pages     = {4249-4259},
  bibsource = {http://www.visionbib.com/bibliography/match607ic1.html#TT118858},
}

@article{bb122755,
  author    = {Ma, Y.W. and Ji, J.Y. and Sun, X.S. and Zhou, Y. and Ji, R.R.},
  title     = {Towards local visual modeling for image captioning},
  journal   = PR,
  volume    = {138},
  year      = {2023},
  pages     = {109420},
  bibsource = {http://www.visionbib.com/bibliography/match607ic1.html#TT118859},
}

@article{bb122756,
  author    = {Barati, A. and Farsi, H. and Mohamadzadeh, S.},
  title     = {Integration of the latent variable knowledge into deep image captioning with Bayesian modeling},
  journal   = IET-IPR,
  volume    = {17},
  year      = {2023},
  number    = {7},
  pages     = {2256-2271},
  bibsource = {http://www.visionbib.com/bibliography/match607ic1.html#TT118860},
}

@article{bb122757,
  author    = {Feng, J.L. and Zhao, J.P.},
  title     = {Effectively Utilizing the Category Labels for Image Captioning},
  journal   = IEICE,
  volume    = {E106-D},
  year      = {2023},
  number    = {5},
  month     = {May},
  pages     = {617-624},
  bibsource = {http://www.visionbib.com/bibliography/match607ic1.html#TT118861},
}

@article{bb122758,
  author    = {Wang, D.P. and Hu, Z.Z. and Zhou, Y. and Hong, R.C. and Wang, M.},
  title     = {A Text-Guided Generation and Refinement Model for Image Captioning},
  journal   = MultMed,
  volume    = {25},
  year      = {2023},
  pages     = {2966-2977},
  bibsource = {http://www.visionbib.com/bibliography/match607ic1.html#TT118862},
}

@article{bb122759,
  author    = {Wang, Q. and Huang, W. and Zhang, X.T. and Li, X.L.},
  title     = {GLCM: Global-Local Captioning Model for Remote Sensing Image Captioning},
  journal   = Cyber,
  volume    = {53},
  year      = {2023},
  number    = {11},
  month     = {November},
  pages     = {6910-6922},
  bibsource = {http://www.visionbib.com/bibliography/match607ic1.html#TT118863},
}

@article{bb122760,
  author    = {Ji, J.Y. and Huang, X.Y. and Sun, X.S. and Zhou, Y. and Luo, G. and Cao, L.J. and Liu, J.Z. and Shao, L. and Ji, R.R.},
  title     = {Multi-Branch Distance-Sensitive Self-Attention Network for Image Captioning},
  journal   = MultMed,
  volume    = {25},
  year      = {2023},
  pages     = {3962-3974},
  bibsource = {http://www.visionbib.com/bibliography/match607ic1.html#TT118864},
}

@article{bb122761,
  author    = {Cornia, M. and Baraldi, L. and Tal, A. and Cucchiara, R.},
  title     = {Fully-attentive iterative networks for region-based controllable image and video captioning},
  journal   = CVIU,
  volume    = {237},
  year      = {2023},
  pages     = {103857},
  bibsource = {http://www.visionbib.com/bibliography/match607ic1.html#TT118865},
}

@article{bb122762,
  author    = {Li, Y.P. and Zhang, X.R. and Cheng, X. and Tang, X. and Jiao, L.C.},
  title     = {Learning consensus-aware semantic knowledge for remote sensing image captioning},
  journal   = PR,
  volume    = {145},
  year      = {2024},
  pages     = {109893},
  bibsource = {http://www.visionbib.com/bibliography/match607ic1.html#TT118866},
}

@article{bb122763,
  author    = {Al Qatf, M. and Wang, X. and Hawbani, A. and Abdussalam, A. and Alsamhi, S.H.},
  title     = {Image Captioning With Novel Topics Guidance and Retrieval-Based Topics Re-Weighting},
  journal   = MultMed,
  volume    = {25},
  year      = {2023},
  pages     = {5984-5999},
  bibsource = {http://www.visionbib.com/bibliography/match607ic1.html#TT118867},
}

@article{bb122764,
  author    = {Zhu, P.P. and Wang, X. and Luo, Y. and Sun, Z.L. and Zheng, W.S. and Wang, Y. and Chen, C.},
  title     = {Unpaired Image Captioning by Image-Level Weakly-Supervised Visual Concept Recognition},
  journal   = MultMed,
  volume    = {25},
  year      = {2023},
  pages     = {6702-6716},
  bibsource = {http://www.visionbib.com/bibliography/match607ic1.html#TT118868},
}

@article{bb122765,
  author    = {Hu, N.N. and Ming, Y. and Fan, C.X. and Feng, F. and Lyu, B.Y.},
  title     = {TSFNet: Triple-Steam Image Captioning},
  journal   = MultMed,
  volume    = {25},
  year      = {2023},
  pages     = {6904-6916},
  bibsource = {http://www.visionbib.com/bibliography/match607ic1.html#TT118869},
}

@article{bb122766,
  author    = {Gonzalez Chavez, O. and Ruiz, G. and Moctezuma, D. and Ramirez delReal, T.},
  title     = {Are metrics measuring what they should? An evaluation of Image Captioning task metrics},
  journal   = SP:IC,
  volume    = {120},
  year      = {2024},
  pages     = {117071},
  bibsource = {http://www.visionbib.com/bibliography/match607ic1.html#TT118870},
}

@article{bb122767,
        AUTHOR = "Padate, R. and Jain, A. and Kalla, M. and Sharma, A.",
        TITLE = "A Widespread Assessment and Open Issues on Image Captioning Models",
        JOURNAL = IJIG,
        VOLUME = "23",
        YEAR = "2023",
        NUMBER = "6",
        PAGES = "2350057",
        BIBSOURCE = "http://www.visionbib.com/bibliography/match607ic1.html#TT118871"}

@article{bb122768,
  author    = {Shao, Z. and Han, J.G. and Debattista, K. and Pang, Y.W.},
  title     = {Textual Context-Aware Dense Captioning With Diverse Words},
  journal   = MultMed,
  volume    = {25},
  year      = {2023},
  pages     = {8753-8766},
  bibsource = {http://www.visionbib.com/bibliography/match607ic1.html#TT118872},
}

@article{bb122769,
  author    = {Cheng, J. and Wu, F. and Liu, L. and Zhang, Q. and Rutkowski, L. and Tao, D.C.},
  title     = {InDecGAN: Learning to Generate Complex Images From Captions via Independent Object-Level Decomposition and Enhancement},
  journal   = MultMed,
  volume    = {25},
  year      = {2023},
  pages     = {8279-8293},
  bibsource = {http://www.visionbib.com/bibliography/match607ic1.html#TT118873},
}

@article{bb122770,
  author    = {Ding, N. and Deng, C.R. and Tan, M.K. and Du, Q. and Ge, Z.W. and Wu, Q.},
  title     = {Image Captioning With Controllable and Adaptive Length Levels},
  journal   = PAMI,
  volume    = {46},
  year      = {2024},
  number    = {2},
  month     = {February},
  pages     = {764-779},
  bibsource = {http://www.visionbib.com/bibliography/match607ic1.html#TT118874},
}

@inproceedings{bb122771,
  author    = {Xu, G.H. and Niu, S.C. and Tan, M.K. and Luo, Y.C. and Du, Q. and Wu, Q.},
  title     = {Towards Accurate Text-based Image Captioning with Content Diversity Exploration},
  booktitle = CVPR21,
  year      = {2021},
  pages     = {12632-12641},
  bibsource = {http://www.visionbib.com/bibliography/match607ic1.html#TT118875},
}

@article{bb122772,
  author    = {Zhu, P.P. and Wang, X. and Zhu, L. and Sun, Z.L. and Zheng, W.S. and Wang, Y. and Chen, C.W.},
  title     = {Prompt-Based Learning for Unpaired Image Captioning},
  journal   = MultMed,
  volume    = {26},
  year      = {2024},
  pages     = {379-393},
  bibsource = {http://www.visionbib.com/bibliography/match607ic1.html#TT118876},
}

@article{bb122773,
  author    = {Liu, A.A. and Zhai, Y.C. and Xu, N. and Tian, H. and Nie, W.Z. and Zhang, Y.D.},
  title     = {Event-Aware Retrospective Learning for Knowledge-Based Image Captioning},
  journal   = MultMed,
  volume    = {26},
  year      = {2024},
  pages     = {4898-4911},
  bibsource = {http://www.visionbib.com/bibliography/match607ic1.html#TT118877},
}

@article{bb122774,
  author    = {Song, L.F. and Li, F. and Wang, Y. and Liu, Y. and Wang, Y. and Xiang, S.M.},
  title     = {Image captioning: Semantic selection unit with stacked residual attention},
  journal   = IVC,
  volume    = {144},
  year      = {2024},
  pages     = {104965},
  bibsource = {http://www.visionbib.com/bibliography/match607ic1.html#TT118878},
}

@article{bb122775,
  author    = {Ajankar, S. and Dutta, T.},
  title     = {Image-Relevant Entities Knowledge-Aware News Image Captioning},
  journal   = MultMedMag,
  volume    = {31},
  year      = {2024},
  number    = {1},
  month     = {January},
  pages     = {88-98},
  bibsource = {http://www.visionbib.com/bibliography/match607ic1.html#TT118879},
}

@article{bb122776,
  author    = {Dai, Z.Z. and Tran, V. and Markham, A. and Trigoni, N. and Rahman, M.A. and Wijayasingha, L.N.S. and Stankovic, J. and Li, C.},
  title     = {EgoCap and EgoFormer: First-person image captioning with context fusion},
  journal   = PRL,
  volume    = {181},
  year      = {2024},
  pages     = {50-56},
  bibsource = {http://www.visionbib.com/bibliography/match607ic1.html#TT118880},
}

@article{bb122777,
  author    = {Shao, Z. and Han, J.G. and Debattista, K. and Pang, Y.W.},
  title     = {DCMSTRD: End-to-end Dense Captioning via Multi-Scale Transformer Decoding},
  journal   = MultMed,
  volume    = {26},
  year      = {2024},
  pages     = {7581-7593},
  bibsource = {http://www.visionbib.com/bibliography/match607ic1.html#TT118881},
}

@article{bb122778,
  author    = {Cornia, M. and Baraldi, L. and Fiameni, G. and Cucchiara, R.},
  title     = {Generating More Pertinent Captions by Leveraging Semantics and Style on Multi-Source Datasets},
  journal   = IJCV,
  volume    = {132},
  year      = {2024},
  number    = {5},
  month     = {May},
  pages     = {1701-1720},
  bibsource = {http://www.visionbib.com/bibliography/match607ic1.html#TT118882},
}

@inproceedings{bb122779,
  author    = {Barraco, M. and Sarto, S. and Cornia, M. and Baraldi, L. and Cucchiara, R.},
  title     = {With a Little Help from your own Past: Prototypical Memory Networks for Image Captioning},
  booktitle = ICCV23,
  year      = {2023},
  pages     = {3009-3019},
  bibsource = {http://www.visionbib.com/bibliography/match607ic1.html#TT118883},
}

% NOTE(review): booktitle below is a literal string, whereas the other
% inproceedings entries in this file use bare macro names (e.g. CVPR19).
% Presumably no ICPR22 macro is defined -- confirm before converting it.
@inproceedings{bb122780,
  author    = {Barraco, M. and Stefanini, M. and Cornia, M. and Cascianelli, S. and Baraldi, L. and Cucchiara, R.},
  title     = {CaMEL: Mean Teacher Learning for Image Captioning},
  booktitle = {ICPR22},
  year      = {2022},
  pages     = {4087-4094},
  bibsource = {http://www.visionbib.com/bibliography/match607ic1.html#TT118884},
}

% Conference paper on controllable and grounded caption generation.
% PAGES is an inclusive range written with "--", the BibTeX en-dash range notation.
@inproceedings{bb122781,
        AUTHOR = "Cornia, M. and Baraldi, L. and Cucchiara, R.",
        TITLE = "Show, Control and Tell: A Framework for Generating Controllable and
Grounded Captions",
        BOOKTITLE = CVPR19,
        YEAR = "2019",
        PAGES = "8299--8308",
        BIBSOURCE = "http://www.visionbib.com/bibliography/match607ic1.html#TT118885"}

% Journal article on stylized image captioning.
% The braces around TridentCap keep its camel-case spelling under sentence-casing styles;
% MONTH is the built-in "may" macro so the style decides how the month is rendered.
@article{bb122782,
        AUTHOR = "Wang, L.X. and Qiu, H.Q. and Qiu, B. and Meng, F.M. and Wu, Q.B. and Li, H.L.",
        TITLE = "{TridentCap}: Image-Fact-Style Trident Semantic Framework for Stylized
Image Captioning",
        JOURNAL = CirSysVideo,
        VOLUME = "34",
        YEAR = "2024",
        NUMBER = "5",
        MONTH = may,
        PAGES = "3563--3575",
        BIBSOURCE = "http://www.visionbib.com/bibliography/match607ic1.html#TT118886"}

% Journal article on a spatial pyramid transformer for image captioning.
% The braces around SPT keep the acronym upper-case under sentence-casing styles;
% MONTH is the built-in "jun" macro so the style decides how the month is rendered.
@article{bb122783,
        AUTHOR = "Zhang, H. and Zeng, P.P. and Gao, L. and Lyu, X.Y. and Song, J.K. and Shen, H.T.",
        TITLE = "{SPT}: Spatial Pyramid Transformer for Image Captioning",
        JOURNAL = CirSysVideo,
        VOLUME = "34",
        YEAR = "2024",
        NUMBER = "6",
        MONTH = jun,
        PAGES = "4829--4842",
        BIBSOURCE = "http://www.visionbib.com/bibliography/match607ic1.html#TT118887"}

% Journal article on a BERT-based image captioning model.
% The braces around ragBERT and BERT keep their capitalization under sentence-casing styles.
% PAGES holds a single article number, not a range, so it carries no dash.
@article{bb122784,
        AUTHOR = "Wang, H.Y. and Song, K. and Jiang, X. and He, Z.Q.",
        TITLE = "{ragBERT}: Relationship-aligned and grammar-wise {BERT} model for image
captioning",
        JOURNAL = IVC,
        VOLUME = "148",
        YEAR = "2024",
        PAGES = "105105",
        BIBSOURCE = "http://www.visionbib.com/bibliography/match607ic1.html#TT118888"}

% Journal article on a cascade semantic prompt alignment network for image captioning.
% MONTH is the built-in "jul" macro so the bibliography style decides how the month is rendered.
@article{bb122785,
        AUTHOR = "Li, J.Y. and Zhang, L. and Zhang, K. and Hu, B. and Xie, H.T. and Mao, Z.D.",
        TITLE = "Cascade Semantic Prompt Alignment Network for Image Captioning",
        JOURNAL = CirSysVideo,
        VOLUME = "34",
        YEAR = "2024",
        NUMBER = "7",
        MONTH = jul,
        PAGES = "5266--5281",
        BIBSOURCE = "http://www.visionbib.com/bibliography/match607ic1.html#TT118889"}

% Conference paper on cross-modal sarcasm generation from images.
% PAGES is an inclusive range written with "--", the BibTeX en-dash range notation.
@inproceedings{bb122786,
        AUTHOR = "Ruan, J. and Wu, Y. and Wan, X.J. and Zhu, Y.S.",
        TITLE = "Describe Images in a Boring Way:
Towards Cross-Modal Sarcasm Generation",
        BOOKTITLE = WACV24,
        YEAR = "2024",
        PAGES = "5689--5698",
        BIBSOURCE = "http://www.visionbib.com/bibliography/match607ic1.html#TT118890"}

% Conference paper on controlled-length image descriptions.
% The braces around CLID keep the acronym upper-case under sentence-casing styles.
@inproceedings{bb122787,
        AUTHOR = "Hirsch, E. and Tal, A.",
        TITLE = "{CLID}: Controlled-Length Image Descriptions with Limited Data",
        BOOKTITLE = WACV24,
        YEAR = "2024",
        PAGES = "5519--5529",
        BIBSOURCE = "http://www.visionbib.com/bibliography/match607ic1.html#TT118891"}

% Conference paper on enriching image captions with large language models.
% The braces around FuseCap keep its camel-case spelling under sentence-casing styles.
@inproceedings{bb122788,
        AUTHOR = "Rotstein, N. and Bensaid, D. and Brody, S. and Ganz, R. and Kimmel, R.",
        TITLE = "{FuseCap}: Leveraging Large Language Models for Enriched Fused Image
Captions",
        BOOKTITLE = WACV24,
        YEAR = "2024",
        PAGES = "5677--5688",
        BIBSOURCE = "http://www.visionbib.com/bibliography/match607ic1.html#TT118892"}

% Conference paper on token-level confidence for caption correctness.
% PAGES is an inclusive range written with "--", the BibTeX en-dash range notation.
@inproceedings{bb122789,
        AUTHOR = "Petryk, S. and Whitehead, S. and Gonzalez, J.E. and Darrell, T.J. and Rohrbach, A. and Rohrbach, M.",
        TITLE = "Simple Token-Level Confidence Improves Caption Correctness",
        BOOKTITLE = WACV24,
        YEAR = "2024",
        PAGES = "5730--5740",
        BIBSOURCE = "http://www.visionbib.com/bibliography/match607ic1.html#TT118893"}

% Conference paper on word-to-sentence visual semantic similarity for caption generation.
% PAGES is an inclusive range written with "--", the BibTeX en-dash range notation.
@inproceedings{bb122790,
        AUTHOR = "Sabir, A.",
        TITLE = "Word to Sentence Visual Semantic Similarity for Caption Generation:
Lessons Learned",
        BOOKTITLE = MVA23,
        YEAR = "2023",
        PAGES = "1--5",
        BIBSOURCE = "http://www.visionbib.com/bibliography/match607ic1.html#TT118894"}

% Conference paper on image captioning with reinforcement learning.
% PAGES is an inclusive range written with "--", the BibTeX en-dash range notation.
@inproceedings{bb122791,
        AUTHOR = "Verma, A. and Agarwal, S. and Arya, K.V. and Petrlik, I. and Esparza, R. and Rodriguez, C.",
        TITLE = "Image Captioning with Reinforcement Learning",
        BOOKTITLE = ICCVMI23,
        YEAR = "2023",
        PAGES = "1--7",
        BIBSOURCE = "http://www.visionbib.com/bibliography/match607ic1.html#TT118895"}

% Conference paper on remote sensing image captioning.
% The braces around Hire-MLP keep the model name's capitalization under sentence-casing styles.
@inproceedings{bb122792,
        AUTHOR = "Wei, Y.C. and Li, L. and Geng, S.L.",
        TITLE = "Remote Sensing Image Captioning Using {Hire-MLP}",
        BOOKTITLE = CVIDL23,
        YEAR = "2023",
        PAGES = "109--112",
        BIBSOURCE = "http://www.visionbib.com/bibliography/match607ic1.html#TT118896"}

% Conference paper on relative contrastive alignment for novel object captioning.
% The braces around RCA-NOC keep the acronym upper-case under sentence-casing styles.
@inproceedings{bb122793,
        AUTHOR = "Fan, J. and Liang, Y. and Liu, L. and Huang, S. and Zhang, L.",
        TITLE = "{RCA-NOC}: Relative Contrastive Alignment for Novel Object Captioning",
        BOOKTITLE = ICCV23,
        YEAR = "2023",
        PAGES = "15464--15474",
        BIBSOURCE = "http://www.visionbib.com/bibliography/match607ic1.html#TT118897"}

% Conference paper on generating humorous captions from images.
% The braces around OxfordTVG-HIC keep the name's capitalization under sentence-casing styles.
@inproceedings{bb122794,
        AUTHOR = "Li, R. and Sun, S.Y. and Elhoseiny, M. and Torr, P.",
        TITLE = "{OxfordTVG-HIC}: Can Machine Make Humorous Captions from Images?",
        BOOKTITLE = ICCV23,
        YEAR = "2023",
        PAGES = "20236--20246",
        BIBSOURCE = "http://www.visionbib.com/bibliography/match607ic1.html#TT118898"}

% Conference paper on embodied visual captioning.
% The braces around 3D stop sentence-casing styles from rendering it as "3d".
@inproceedings{bb122795,
        AUTHOR = "Hu, A. and Chen, S.Z. and Zhang, L. and Jin, Q.",
        TITLE = "Explore and Tell: Embodied Visual Captioning in {3D} Environments",
        BOOKTITLE = ICCV23,
        YEAR = "2023",
        PAGES = "2482--2491",
        BIBSOURCE = "http://www.visionbib.com/bibliography/match607ic1.html#TT118899"}

% Conference paper on noise-aware learning from web-crawled image-text data.
% PAGES is an inclusive range written with "--", the BibTeX en-dash range notation.
@inproceedings{bb122796,
        AUTHOR = "Kang, W. and Mun, J. and Lee, S.J. and Roh, B.",
        TITLE = "Noise-aware Learning from Web-crawled Image-Text Data for Image
Captioning",
        BOOKTITLE = ICCV23,
        YEAR = "2023",
        PAGES = "2930--2940",
        BIBSOURCE = "http://www.visionbib.com/bibliography/match607ic1.html#TT118900"}

% Conference paper on zero-shot image captioning with visual entities.
% PAGES is an inclusive range written with "--", the BibTeX en-dash range notation.
@inproceedings{bb122797,
        AUTHOR = "Fei, J.J. and Wang, T. and Zhang, J. and He, Z.Y. and Wang, C.J. and Zheng, F.",
        TITLE = "Transferable Decoding with Visual Entities for Zero-Shot Image
Captioning",
        BOOKTITLE = ICCV23,
        YEAR = "2023",
        PAGES = "3113--3123",
        BIBSOURCE = "http://www.visionbib.com/bibliography/match607ic1.html#TT118901"}

% Conference paper on guiding captioning models toward more specific captions.
% PAGES is an inclusive range written with "--", the BibTeX en-dash range notation.
@inproceedings{bb122798,
        AUTHOR = "Kornblith, S. and Li, L. and Wang, Z. and Nguyen, T.",
        TITLE = "Guiding image captioning models toward more specific captions",
        BOOKTITLE = ICCV23,
        YEAR = "2023",
        PAGES = "15213--15223",
        BIBSOURCE = "http://www.visionbib.com/bibliography/match607ic1.html#TT118902"}

% Conference paper on mitigating dataset bias in image captioning.
% CLIP is written as an acronym and braced so sentence-casing styles keep it upper-case.
% NOTE(review): the export spelled it "Clip"; confirm the capitalization against the published title.
@inproceedings{bb122799,
        AUTHOR = "Kim, Y. and Kim, J. and Lee, B.K. and Shin, S. and Ro, Y.M.",
        TITLE = "Mitigating Dataset Bias in Image Captioning Through {CLIP}
Confounder-Free Captioning Network",
        BOOKTITLE = ICIP23,
        YEAR = "2023",
        PAGES = "1720--1724",
        BIBSOURCE = "http://www.visionbib.com/bibliography/match607ic1.html#TT118903"}

Last update: Jul 18, 2024 at 20:50:34