@article{bb133600,
  author    = {Cao, S. and An, G. and Zheng, Z.X. and Wang, Z.Y.},
  title     = {Vision-Enhanced and Consensus-Aware Transformer for Image Captioning},
  journal   = CirSysVideo,
  volume    = {32},
  number    = {10},
  pages     = {7005--7018},
  month     = oct,
  year      = {2022},
  bibsource = {http://www.visionbib.com/bibliography/match607tic2.html#TT129635},
}

@article{bb133601,
  author    = {Jiang, W.T. and Zhou, W. and Hu, H.F.},
  title     = {Double-Stream Position Learning Transformer Network for Image Captioning},
  journal   = CirSysVideo,
  volume    = {32},
  number    = {11},
  pages     = {7706--7718},
  month     = nov,
  year      = {2022},
  bibsource = {http://www.visionbib.com/bibliography/match607tic2.html#TT129636},
}

@article{bb133602,
  author    = {Li, J.C. and Zhou, W. and Wang, K. and Hu, H.F.},
  title     = {Triple-Stream Commonsense Circulation Transformer Network for Image Captioning},
  journal   = CVIU,
  volume    = {249},
  pages     = {104165},
  year      = {2024},
  bibsource = {http://www.visionbib.com/bibliography/match607tic2.html#TT129637},
}

@article{bb133603,
  author    = {Hu, J.T. and Yang, Y. and Yao, L. and An, Y.Z. and Pan, L.},
  title     = {Position-guided transformer for image captioning},
  journal   = IVC,
  volume    = {128},
  pages     = {104575},
  year      = {2022},
  bibsource = {http://www.visionbib.com/bibliography/match607tic2.html#TT129638},
}

@article{bb133604,
  author    = {Wang, Z.G. and Shi, S. and Zhai, Z.R. and Wu, Y. and Yang, R.},
  title     = {{ArCo}: Attention-reinforced transformer with contrastive learning for image captioning},
  journal   = IVC,
  volume    = {128},
  pages     = {104570},
  year      = {2022},
  bibsource = {http://www.visionbib.com/bibliography/match607tic2.html#TT129639},
}

@article{bb133605,
  author    = {Li, Z.X. and Wei, J.H. and Huang, F.C. and Ma, H.F.},
  title     = {Modeling graph-structured contexts for image captioning},
  journal   = IVC,
  volume    = {129},
  pages     = {104591},
  year      = {2023},
  bibsource = {http://www.visionbib.com/bibliography/match607tic2.html#TT129640},
}

@article{bb133606,
  author    = {Zhang, J. and Xie, Y.S. and Ding, W.C. and Wang, Z.},
  title     = {Cross on Cross Attention: Deep Fusion Transformer for Image Captioning},
  journal   = CirSysVideo,
  volume    = {33},
  number    = {8},
  pages     = {4257--4268},
  month     = aug,
  year      = {2023},
  bibsource = {http://www.visionbib.com/bibliography/match607tic2.html#TT129641},
}

@article{bb133607,
  author    = {Lim, J.H. and Chan, C.S.},
  title     = {Mask-guided network for image captioning},
  journal   = PRL,
  volume    = {173},
  pages     = {79--86},
  year      = {2023},
  bibsource = {http://www.visionbib.com/bibliography/match607tic2.html#TT129642},
}

@article{bb133608,
  author    = {Li, Z.X. and Su, Q. and Chen, T.Y.},
  title     = {External knowledge-assisted Transformer for image captioning},
  journal   = IVC,
  volume    = {140},
  pages     = {104864},
  year      = {2023},
  bibsource = {http://www.visionbib.com/bibliography/match607tic2.html#TT129643},
}

@article{bb133609,
  author    = {Chen, J.Q.},
  title     = {Transform, contrast and tell: Coherent entity-aware multi-image captioning},
  journal   = CVIU,
  volume    = {238},
  pages     = {103878},
  year      = {2024},
  bibsource = {http://www.visionbib.com/bibliography/match607tic2.html#TT129644},
}

@article{bb133610,
  author    = {Yang, X.B. and Tian, X. and Wu, J.S. and Yang, X.C. and Ma, S. and Qi, X. and Hou, Z.Q.},
  title     = {{LLAFN-Generator}: Learnable linear-attention with fast-normalization for large-scale image captioning},
  journal   = CVIU,
  volume    = {248},
  pages     = {104088},
  year      = {2024},
  bibsource = {http://www.visionbib.com/bibliography/match607tic2.html#TT129645},
}

@article{bb133611,
  author    = {Yi, Y.H. and Liang, Y.K. and Kong, D.Z. and Tang, Z.W. and Peng, J.B.},
  title     = {Tag-inferring and tag-guided Transformer for image captioning},
  journal   = IET-CV,
  volume    = {18},
  number    = {6},
  pages     = {801--812},
  year      = {2024},
  bibsource = {http://www.visionbib.com/bibliography/match607tic2.html#TT129646},
}

@article{bb133612,
  author    = {Caffagni, D. and Cornia, M. and Baraldi, L. and Cucchiara, R.},
  title     = {Augmenting and mixing Transformers with synthetic data for image captioning},
  journal   = IVC,
  volume    = {162},
  pages     = {105661},
  year      = {2025},
  bibsource = {http://www.visionbib.com/bibliography/match607tic2.html#TT129647},
}

@inproceedings{bb133613,
  author    = {Caffagni, D. and Barraco, M. and Cornia, M. and Baraldi, L. and Cucchiara, R.},
  title     = {Synthcap: Augmenting Transformers with Synthetic Data for Image Captioning},
  booktitle = CIAP23,
  pages     = {I:112--123},
  year      = {2023},
  bibsource = {http://www.visionbib.com/bibliography/match607tic2.html#TT129648},
}

@inproceedings{bb133614,
  author    = {Song, J.Y. and Pan, R.J. and Zhou, J. and Yang, H.},
  title     = {M-rat: a Multi-grained Retrieval Augmentation Transformer for Image Captioning},
  booktitle = ACCV24,
  pages     = {III: 185--203},
  year      = {2024},
  bibsource = {http://www.visionbib.com/bibliography/match607tic2.html#TT129649},
}

% NOTE(review): booktitle is a string literal here, whereas other entries in
% this file reference unquoted venue macros (e.g. ICPR16). Confirm whether an
% ICPR22 macro is defined before switching to it.
@inproceedings{bb133615,
  author    = {Lou, L.S. and Lu, K. and Xue, J.},
  title     = {Improved Transformer with Parallel Encoders for Image Captioning},
  booktitle = {ICPR22},
  pages     = {4072--4075},
  year      = {2022},
  bibsource = {http://www.visionbib.com/bibliography/match607tic2.html#TT129650},
}

% NOTE(review): booktitle is a string literal here, whereas other entries in
% this file reference unquoted venue macros (e.g. ICPR16). Confirm whether an
% ICPR22 macro is defined before switching to it.
@inproceedings{bb133616,
  author    = {Wang, Y.H. and Shang, L.},
  title     = {Generating Spatial-aware Captions for {TextCaps}},
  booktitle = {ICPR22},
  pages     = {379--385},
  year      = {2022},
  bibsource = {http://www.visionbib.com/bibliography/match607tic2.html#TT129651},
}

@inproceedings{bb133617,
  author    = {Feng, Y. and Maeda, K. and Ogawa, T. and Haseyama, M.},
  title     = {Human-Centric Image Retrieval with Gaze-Based Image Captioning},
  booktitle = ICIP22,
  pages     = {3828--3832},
  year      = {2022},
  bibsource = {http://www.visionbib.com/bibliography/match607tic2.html#TT129652},
}

@inproceedings{bb133618,
  author    = {Yang, X. and Wang, Y. and Chen, H. and Li, J.},
  title     = {{CSTNET}: Enhancing Global-To-Local Interactions for Image Captioning},
  booktitle = ICIP22,
  pages     = {1861--1865},
  year      = {2022},
  bibsource = {http://www.visionbib.com/bibliography/match607tic2.html#TT129653},
}

@inproceedings{bb133619,
  author    = {Nguyen, V.Q. and Suganuma, M. and Okatani, T.},
  title     = {{GRIT}: Faster and Better Image Captioning Transformer Using Dual Visual Features},
  booktitle = ECCV22,
  pages     = {XXXVI:167--184},
  year      = {2022},
  bibsource = {http://www.visionbib.com/bibliography/match607tic2.html#TT129654},
}

@inproceedings{bb133620,
  author    = {Vo, D.M. and Chen, H. and Sugimoto, A. and Nakayama, H.},
  title     = {{NOC-REK}: Novel Object Captioning with Retrieved Vocabulary from External Knowledge},
  booktitle = CVPR22,
  pages     = {17979--17987},
  year      = {2022},
  bibsource = {http://www.visionbib.com/bibliography/match607tic2.html#TT129655},
}

@inproceedings{bb133621,
  author    = {Yuan, Z.H. and Yan, X. and Liao, Y.H. and Guo, Y. and Li, G.B. and Cui, S.G. and Li, Z.},
  title     = {{X-Trans2Cap}: Cross-Modal Knowledge Transfer using Transformer for {3D} Dense Captioning},
  booktitle = CVPR22,
  pages     = {8553--8563},
  year      = {2022},
  bibsource = {http://www.visionbib.com/bibliography/match607tic2.html#TT129656},
}

@inproceedings{bb133622,
  author    = {Liu, B. and Wang, D. and Yang, X. and Zhou, Y. and Yao, R. and Shao, Z.W. and Zhao, J.Q.},
  title     = {Show, Deconfound and Tell: Image Captioning with Causal Inference},
  booktitle = CVPR22,
  pages     = {18020--18029},
  year      = {2022},
  bibsource = {http://www.visionbib.com/bibliography/match607tic2.html#TT129657},
}

@inproceedings{bb133623,
  author    = {Fang, Z.Y. and Wang, J.F. and Hu, X.W. and Liang, L. and Gan, Z. and Wang, L.J. and Yang, Y.Z. and Liu, Z.C.},
  title     = {Injecting Semantic Concepts into End-to-End Image Captioning},
  booktitle = CVPR22,
  pages     = {17988--17998},
  year      = {2022},
  bibsource = {http://www.visionbib.com/bibliography/match607tic2.html#TT129658},
}

@inproceedings{bb133624,
  author    = {Li, Y. and Pan, Y.W. and Yao, T. and Mei, T.},
  title     = {Comprehending and Ordering Semantics for Image Captioning},
  booktitle = CVPR22,
  pages     = {17969--17978},
  year      = {2022},
  bibsource = {http://www.visionbib.com/bibliography/match607tic2.html#TT129659},
}

@inproceedings{bb133625,
  author    = {Fei, Z.C. and Yan, X. and Wang, S.H. and Tian, Q.},
  title     = {{DeeCap}: Dynamic Early Exiting for Efficient Image Captioning},
  booktitle = CVPR22,
  pages     = {12206--12216},
  year      = {2022},
  bibsource = {http://www.visionbib.com/bibliography/match607tic2.html#TT129660},
}

@inproceedings{bb133626,
  author    = {Wu, M.R. and Zhang, X.Y. and Sun, X.S. and Zhou, Y. and Chen, C. and Gu, J.X. and Sun, X. and Ji, R.R.},
  title     = {{DIFNet}: Boosting Visual Information Flow for Image Captioning},
  booktitle = CVPR22,
  pages     = {17999--18008},
  year      = {2022},
  bibsource = {http://www.visionbib.com/bibliography/match607tic2.html#TT129661},
}

@inproceedings{bb133627,
  author    = {Rio Torto, I. and Cardoso, J.S. and Teixeira, L.F.},
  title     = {From Captions to Explanations: A Multimodal Transformer-based Architecture for Natural Language Explanation Generation},
  booktitle = IbPRIA22,
  pages     = {54--65},
  year      = {2022},
  bibsource = {http://www.visionbib.com/bibliography/match607tic2.html#TT129662},
}

@inproceedings{bb133628,
  author    = {Chen, H.S. and Wang, Y. and Yang, X. and Li, J.},
  title     = {Captioning Transformer With Scene Graph Guiding},
  booktitle = ICIP21,
  pages     = {2538--2542},
  year      = {2021},
  bibsource = {http://www.visionbib.com/bibliography/match607tic2.html#TT129663},
}

@inproceedings{bb133629,
  author    = {Zhang, X.Y. and Sun, X.S. and Luo, Y.P. and Ji, J.Y. and Zhou, Y. and Wu, Y.J. and Huang, F.Y. and Ji, R.R.},
  title     = {{RSTNet}: Captioning with Adaptive Attention on Visual and Non-Visual Words},
  booktitle = CVPR21,
  pages     = {15460--15469},
  year      = {2021},
  bibsource = {http://www.visionbib.com/bibliography/match607tic2.html#TT129664},
}

@inproceedings{bb133630,
  author    = {He, S. and Liao, W.T. and Tavakoli, H.R. and Yang, M. and Rosenhahn, B. and Pugeault, N.},
  title     = {Image Captioning Through Image Transformer},
  booktitle = ACCV20,
  pages     = {IV:153--169},
  year      = {2020},
  bibsource = {http://www.visionbib.com/bibliography/match607tic2.html#TT129665},
}

@inproceedings{bb133631,
  author    = {Cornia, M. and Stefanini, M. and Baraldi, L. and Cucchiara, R.},
  title     = {Meshed-Memory Transformer for Image Captioning},
  booktitle = CVPR20,
  pages     = {10575--10584},
  year      = {2020},
  bibsource = {http://www.visionbib.com/bibliography/match607tic2.html#TT129666},
}

@inproceedings{bb133632,
  author    = {Tran, A. and Mathews, A. and Xie, L.},
  title     = {Transform and Tell: Entity-Aware News Image Captioning},
  booktitle = CVPR20,
  pages     = {13032--13042},
  year      = {2020},
  bibsource = {http://www.visionbib.com/bibliography/match607tic2.html#TT129667},
}

@inproceedings{bb133633,
  author    = {Li, G. and Zhu, L. and Liu, P. and Yang, Y.},
  title     = {Entangled Transformer for Image Captioning},
  booktitle = ICCV19,
  pages     = {8927--8936},
  year      = {2019},
  bibsource = {http://www.visionbib.com/bibliography/match607tic2.html#TT129668},
}

@article{bb133634,
  author    = {Sharma, D. and Chattopadhyay, C.},
  title     = {High-level feature aggregation for fine-grained architectural floor plan retrieval},
  journal   = IET-CV,
  volume    = {12},
  number    = {5},
  pages     = {702--709},
  month     = aug,
  year      = {2018},
  bibsource = {http://www.visionbib.com/bibliography/match607seco3.html#TT129669},
}

@inproceedings{bb133635,
  author    = {Sharma, D. and Chattopadhyay, C. and Harit, G.},
  title     = {A unified framework for semantic matching of architectural floorplans},
  booktitle = ICPR16,
  pages     = {2422--2427},
  year      = {2016},
  bibsource = {http://www.visionbib.com/bibliography/match607seco3.html#TT129670},
}

@article{bb133636,
  author    = {Ham, B. and Cho, M.S. and Schmid, C. and Ponce, J.},
  title     = {Proposal Flow: Semantic Correspondences from Object Proposals},
  journal   = PAMI,
  volume    = {40},
  number    = {7},
  pages     = {1711--1725},
  month     = jul,
  year      = {2018},
  bibsource = {http://www.visionbib.com/bibliography/match607seco3.html#TT129671},
}

@inproceedings{bb133637,
  author    = {Ham, B. and Cho, M.S. and Schmid, C. and Ponce, J.},
  title     = {Proposal Flow},
  booktitle = CVPR16,
  pages     = {3475--3484},
  year      = {2016},
  bibsource = {http://www.visionbib.com/bibliography/match607seco3.html#TT129672},
}

@article{bb133638,
  author    = {Xiao, T.H. and Liu, S.F. and de Mello, S. and Yu, Z.D. and Kautz, J. and Yang, M.H.},
  title     = {Learning Contrastive Representation for Semantic Correspondence},
  journal   = IJCV,
  volume    = {130},
  number    = {5},
  pages     = {1293--1309},
  month     = may,
  year      = {2022},
  bibsource = {http://www.visionbib.com/bibliography/match607seco3.html#TT129673},
}

% NOTE(review): this record has the same title and BIBSOURCE anchor (TT129673)
% as bb133638, lists the same authors in reverse order, and covers a single
% page in the following issue. It looks like a correction notice for that
% article rather than a separate paper -- confirm against the journal.
@article{bb133639,
  author    = {Yang, M.H. and Kautz, J. and Yu, Z.D. and de Mello, S. and Liu, S.F. and Xiao, T.H.},
  title     = {Learning Contrastive Representation for Semantic Correspondence},
  journal   = IJCV,
  volume    = {130},
  number    = {6},
  pages     = {1607},
  month     = jun,
  year      = {2022},
  bibsource = {http://www.visionbib.com/bibliography/match607seco3.html#TT129673},
}

@inproceedings{bb133640,
  author    = {Yuan, W.T. and Eckart, B. and Kim, K. and Jampani, V. and Fox, D. and Kautz, J.},
  title     = {{DeepGMR}: Learning Latent {Gaussian} Mixture Models for Registration},
  booktitle = ECCV20,
  pages     = {V:733--750},
  year      = {2020},
  bibsource = {http://www.visionbib.com/bibliography/match607seco3.html#TT129674},
}

@inproceedings{bb133641,
  author    = {Eckart, B. and Kim, K. and Kautz, J.},
  title     = {{HGMR}: Hierarchical {Gaussian} Mixtures for Adaptive {3D} Registration},
  booktitle = ECCV18,
  pages     = {XV: 730--746},
  year      = {2018},
  bibsource = {http://www.visionbib.com/bibliography/match607seco3.html#TT129675},
}

@article{bb133642,
  author    = {He, J.F. and Zhang, T.Z. and Zheng, Y.H. and Xu, M.L. and Zhang, Y.D. and Wu, F.},
  title     = {Consistency Graph Modeling for Semantic Correspondence},
  journal   = IP,
  volume    = {30},
  pages     = {4932--4946},
  year      = {2021},
  bibsource = {http://www.visionbib.com/bibliography/match607seco3.html#TT129676},
}

@article{bb133643,
  author    = {Jeon, S. and Kim, S. and Min, D.B. and Sohn, K.H.},
  title     = {Pyramidal Semantic Correspondence Networks},
  journal   = PAMI,
  volume    = {44},
  number    = {12},
  pages     = {9102--9118},
  month     = dec,
  year      = {2022},
  bibsource = {http://www.visionbib.com/bibliography/match607seco3.html#TT129677},
}

@article{bb133644,
  author    = {Cao, C.Q. and Zhang, Y.N.},
  title     = {Learning to Compare Relation: Semantic Alignment for Few-Shot Learning},
  journal   = IP,
  volume    = {31},
  pages     = {1462--1474},
  year      = {2022},
  bibsource = {http://www.visionbib.com/bibliography/match607seco3.html#TT129678},
}

@article{bb133645,
  author    = {Cheng, J. and Hao, F.S. and Liu, L. and Tao, D.C.},
  title     = {Imposing Semantic Consistency of Local Descriptors for Few-Shot Learning},
  journal   = IP,
  volume    = {31},
  pages     = {1587--1600},
  year      = {2022},
  bibsource = {http://www.visionbib.com/bibliography/match607seco3.html#TT129679},
}

@article{bb133646,
  author    = {Hao, F.S. and He, F.X. and Cheng, J. and Tao, D.C.},
  title     = {Global-Local Interplay in Semantic Alignment for Few-Shot Learning},
  journal   = CirSysVideo,
  volume    = {32},
  number    = {7},
  pages     = {4351--4363},
  month     = jul,
  year      = {2022},
  bibsource = {http://www.visionbib.com/bibliography/match607seco3.html#TT129680},
}

@inproceedings{bb133647,
  author    = {Hao, F.S. and He, F.X. and Cheng, J. and Wang, L. and Cao, J. and Tao, D.C.},
  title     = {Collect and Select: Semantic Alignment Metric Learning for Few-Shot Learning},
  booktitle = ICCV19,
  pages     = {8459--8468},
  year      = {2019},
  bibsource = {http://www.visionbib.com/bibliography/match607seco3.html#TT129681},
}

@article{bb133648,
  author    = {Liu, H. and Wang, T. and Li, Y.D. and Lang, C.Y. and Jin, Y. and Ling, H.B.},
  title     = {Joint Graph Learning and Matching for Semantic Feature Correspondence},
  journal   = PR,
  volume    = {134},
  pages     = {109059},
  year      = {2023},
  bibsource = {http://www.visionbib.com/bibliography/match607seco3.html#TT129682},
}

@article{bb133649,
  author    = {Sachdeva, R. and Cordeiro, F.R. and Belagiannis, V. and Reid, I.D. and Carneiro, G.},
  title     = {{ScanMix}: Learning from Severe Label Noise via Semantic Clustering and Semi-Supervised Learning},
  journal   = PR,
  volume    = {134},
  pages     = {109121},
  year      = {2023},
  bibsource = {http://www.visionbib.com/bibliography/match607seco3.html#TT129683},
}

@article{bb133650,
  author    = {Xu, X. and Xu, X. and Shen, F.M. and Li, Y.J.},
  title     = {Semantic-Aligned Attention With Refining Feature Embedding for Few-Shot Image Classification},
  journal   = ITS,
  volume    = {23},
  number    = {12},
  pages     = {25458--25468},
  month     = dec,
  year      = {2022},
  bibsource = {http://www.visionbib.com/bibliography/match607seco3.html#TT129684},
}

@article{bb133651,
  author    = {Yang, Z.Q. and Zhang, Y.Q. and Du, Y.X. and Tong, C.},
  title     = {Semantic-aligned reinforced attention model for zero-shot learning},
  journal   = IVC,
  volume    = {128},
  pages     = {104586},
  year      = {2022},
  bibsource = {http://www.visionbib.com/bibliography/match607seco3.html#TT129685},
}

@article{bb133652,
  author    = {Wang, J. and Zhang, Z.Q. and Shi, Z.H. and Cai, J.Y. and Ji, S.W. and Wu, F.},
  title     = {Duality-Induced Regularizer for Semantic Matching Knowledge Graph Embeddings},
  journal   = PAMI,
  volume    = {45},
  number    = {2},
  pages     = {1652--1667},
  month     = feb,
  year      = {2023},
  bibsource = {http://www.visionbib.com/bibliography/match607seco3.html#TT129686},
}

@article{bb133653,
  author    = {Liu, W.X. and Zhong, X. and Jia, X.M. and Jiang, K. and Lin, C.W.},
  title     = {Actor-Aware Alignment Network for Action Recognition},
  journal   = SPLetters,
  volume    = {29},
  pages     = {2597--2601},
  year      = {2022},
  bibsource = {http://www.visionbib.com/bibliography/match607seco3.html#TT129687},
}

@article{bb133654,
  author    = {Wang, Z. and Fu, Z.H. and Guo, Y.L. and Li, Z. and Yu, Q.F.},
  title     = {Local-to-Global Cost Aggregation for Semantic Correspondence},
  journal   = CirSysVideo,
  volume    = {33},
  number    = {3},
  pages     = {1209--1222},
  month     = mar,
  year      = {2023},
  bibsource = {http://www.visionbib.com/bibliography/match607seco3.html#TT129688},
}

@article{bb133655,
  author    = {Xu, W.J. and Wang, J.N. and Wei, Z.W. and Peng, M. and Wu, Y.R.},
  title     = {Deep Semantic-Visual Alignment for zero-shot remote sensing image scene classification},
  journal   = PandRS,
  volume    = {198},
  pages     = {140--152},
  year      = {2023},
  bibsource = {http://www.visionbib.com/bibliography/match607seco3.html#TT129689},
}

@article{bb133656,
  author    = {Yang, J.Q. and Shen, Q. and Xie, C.},
  title     = {Generation-based contrastive model with semantic alignment for generalized zero-shot learning},
  journal   = IVC,
  volume    = {137},
  pages     = {104758},
  year      = {2023},
  bibsource = {http://www.visionbib.com/bibliography/match607seco3.html#TT129690},
}

@article{bb133657,
  author    = {Duan, Z.H. and Ma, Z. and Zhu, F.Q.},
  title     = {Unified Architecture Adaptation for Compressed Domain Semantic Inference},
  journal   = CirSysVideo,
  volume    = {33},
  number    = {8},
  pages     = {4108--4121},
  month     = aug,
  year      = {2023},
  bibsource = {http://www.visionbib.com/bibliography/match607seco3.html#TT129691},
}

@article{bb133658,
  author    = {Xu, H.Y. and Liao, J. and Liu, H.P. and Sun, Y.X.},
  title     = {Learning Semantic Alignment Using Global Features and Multi-Scale Confidence},
  journal   = CirSysVideo,
  volume    = {34},
  number    = {2},
  pages     = {897--910},
  month     = feb,
  year      = {2024},
  bibsource = {http://www.visionbib.com/bibliography/match607seco3.html#TT129692},
}

@article{bb133659,
  author    = {Liu, J. and Xie, J.L. and Zhou, F.Y. and He, S.F.},
  title     = {Triadic temporal-semantic alignment for weakly-supervised video moment retrieval},
  journal   = PR,
  volume    = {156},
  pages     = {110819},
  year      = {2024},
  bibsource = {http://www.visionbib.com/bibliography/match607seco3.html#TT129693},
}

@article{bb133660,
  author    = {Zhang, T. and Fang, H. and Zhang, H. and Gao, J.L. and Lu, X. and Nie, X. and Yin, Y.L.},
  title     = {Learning Feature Semantic Matching for Spatio-Temporal Video Grounding},
  journal   = MultMed,
  volume    = {26},
  pages     = {9268--9279},
  year      = {2024},
  bibsource = {http://www.visionbib.com/bibliography/match607seco3.html#TT129694},
}

@article{bb133661,
  author    = {Wu, R.J. and Guo, W. and Liu, Y. and Sun, C.H.},
  title     = {High-Precision Heterogeneous Satellite Image Manipulation Localization: Feature Point Rules and Semantic Similarity Measurement},
  journal   = RS,
  volume    = {16},
  number    = {19},
  pages     = {3719},
  year      = {2024},
  bibsource = {http://www.visionbib.com/bibliography/match607seco3.html#TT129695},
}

@article{bb133662,
  author    = {Giang, K.T. and Song, S. and Jo, S.},
  title     = {{TopicFM+}: Boosting Accuracy and Efficiency of Topic-Assisted Feature Matching},
  journal   = IP,
  volume    = {33},
  pages     = {6016--6028},
  year      = {2024},
  bibsource = {http://www.visionbib.com/bibliography/match607seco3.html#TT129696},
}

@article{bb133663,
  author    = {Liao, G. and Zhou, K. and Bao, Z.Y. and Liu, K.L. and Li, Q.},
  title     = {{OV-NeRF}: Open-Vocabulary Neural Radiance Fields With Vision and Language Foundation Models for {3D} Semantic Understanding},
  journal   = CirSysVideo,
  volume    = {34},
  number    = {12},
  pages     = {12923--12936},
  month     = dec,
  year      = {2024},
  bibsource = {http://www.visionbib.com/bibliography/match607seco3.html#TT129697},
}

@article{bb133664,
  author    = {Shi, W. and Zhu, R.H. and Li, S.},
  title     = {Unsupervised Class-Imbalanced Domain Adaptation With Pairwise Adversarial Training and Semantic Alignment},
  journal   = CirSysVideo,
  volume    = {34},
  number    = {12},
  pages     = {12411--12424},
  month     = dec,
  year      = {2024},
  bibsource = {http://www.visionbib.com/bibliography/match607seco3.html#TT129698},
}

@article{bb133665,
  author    = {Zhang, H. and Xu, L.M. and Lai, S.Q. and Shao, W.Q. and Zheng, N.N. and Luo, P. and Qiao, Y. and Zhang, K.P.},
  title     = {Open-Vocabulary Animal Keypoint Detection with Semantic-Feature Matching},
  journal   = IJCV,
  volume    = {132},
  number    = {12},
  pages     = {5741--5758},
  month     = dec,
  year      = {2024},
  bibsource = {http://www.visionbib.com/bibliography/match607seco3.html#TT129699},
}

@article{bb133666,
  author    = {Xu, L.M. and Li, H.Q. and Zheng, B. and Li, W.S. and Lv, J.C.},
  title     = {Deep Lifelong Cross-Modal Hashing},
  journal   = CirSysVideo,
  volume    = {34},
  number    = {12},
  pages     = {13478--13493},
  month     = dec,
  year      = {2024},
  bibsource = {http://www.visionbib.com/bibliography/match607seco3.html#TT129700},
}

@article{bb133667,
  author    = {Dong, M.P. and Li, F. and Li, Z.B. and Liu, X.},
  title     = {{PRSN}: Prototype resynthesis network with cross-image semantic alignment for few-shot image classification},
  journal   = PR,
  volume    = {159},
  pages     = {111122},
  year      = {2025},
  bibsource = {http://www.visionbib.com/bibliography/match607seco3.html#TT129701},
}

@article{bb133668,
  author    = {Gonzalez, L.H.R. and Florez, S.L. and Gonzalez Briones, A. and de la Prieta, F.},
  title     = {Semantic scene understanding through advanced object context analysis in image},
  journal   = CVIU,
  volume    = {252},
  pages     = {104299},
  year      = {2025},
  bibsource = {http://www.visionbib.com/bibliography/match607seco3.html#TT129702},
}

@article{bb133669,
  author    = {Shi, Y. and Li, R.X. and Gan, L. and Zhan, D.C. and Ye, H.J.},
  title     = {Generalized Conditional Similarity Learning via Semantic Matching},
  journal   = PAMI,
  volume    = {47},
  number    = {5},
  pages     = {3847--3862},
  month     = may,
  year      = {2025},
  bibsource = {http://www.visionbib.com/bibliography/match607seco3.html#TT129703},
}

@article{bb133670,
  author    = {Dong, S.H. and Xie, W.Y. and Yang, D. and Li, Y.S. and Zhang, J.Q. and Tian, J.Y. and Lei, J.},
  title     = {{SeaDATE}: Remedy Dual-Attention Transformer With Semantic Alignment via Contrast Learning for Multimodal Object Detection},
  journal   = CirSysVideo,
  volume    = {35},
  number    = {5},
  pages     = {4713--4726},
  month     = may,
  year      = {2025},
  bibsource = {http://www.visionbib.com/bibliography/match607seco3.html#TT129704},
}

@article{bb133671,
  author    = {Tan, Y.B. and Wang, H. and Cai, R.F. and Gao, L.L. and Yu, Z.H. and Li, X.},
  title     = {Spatial Proximity Relations-Driven Semantic Representation for Geospatial Entity Categories},
  journal   = IJGI,
  volume    = {14},
  number    = {6},
  pages     = {233},
  year      = {2025},
  bibsource = {http://www.visionbib.com/bibliography/match607seco3.html#TT129705},
}

@article{bb133672,
  author    = {Wei, Z. and Hou, Z.Y. and Zhou, X.Z.},
  title     = {Eliminating Non-Overlapping Semantic Misalignment for Cross-Modal Medical Retrieval},
  journal   = SPLetters,
  volume    = {32},
  pages     = {3510--3514},
  year      = {2025},
  bibsource = {http://www.visionbib.com/bibliography/match607seco3.html#TT129706},
}

@article{bb133673,
  author    = {Wang, Z.H. and Du, S.L. and Yan, Y.P. and Xiao, G. and Lu, X.B.},
  title     = {{Tex2Sem}: Learning From Textures to Semantics for Robust Semantic Correspondence},
  journal   = CirSysVideo,
  volume    = {35},
  number    = {11},
  pages     = {10875--10890},
  month     = nov,
  year      = {2025},
  bibsource = {http://www.visionbib.com/bibliography/match607seco3.html#TT129707},
}

@inproceedings{bb133674,
  author    = {Wang, S. and Lin, W. and Huang, H. and Wang, H.T. and Cai, S. and Han, W. and Jin, T. and Chen, J.Y. and Sun, J.C. and Zhu, J. and Zhao, Z.},
  title     = {Towards Transformer-Based Aligned Generation with Self-Coherence Guidance},
  booktitle = CVPR25,
  pages     = {18455--18464},
  year      = {2025},
  bibsource = {http://www.visionbib.com/bibliography/match607seco3.html#TT129708},
}

@inproceedings{bb133675,
  author    = {Jose, C. and Moutakanni, T. and Kang, D. and Baldassarre, F. and Darcet, T. and Xu, H. and Li, D. and Szafraniec, M. and Ramamonjisoa, M. and Oquab, M. and Simeoni, O. and Vo, H.V. and Labatut, P. and Bojanowski, P.},
  title     = {{DINOv2} Meets Text: A Unified Framework for Image- and Pixel-Level Vision-Language Alignment},
  booktitle = CVPR25,
  pages     = {24905--24916},
  year      = {2025},
  bibsource = {http://www.visionbib.com/bibliography/match607seco3.html#TT129709},
}

@inproceedings{bb133676,
  author    = {Tang, Y.T. and Guo, Y.X. and Li, D. and Peng, C.},
  title     = {{SPARS3R}: Semantic Prior Alignment and Regularization for Sparse {3D} Reconstruction},
  booktitle = CVPR25,
  pages     = {26810--26821},
  year      = {2025},
  bibsource = {http://www.visionbib.com/bibliography/match607seco3.html#TT129710},
}

@inproceedings{bb133677,
  author    = {Ding, Z.H. and Chen, G. and Zhang, Q. and Wu, H. and Qin, J.},
  title     = {{CSC-PA}: Cross-image Semantic Correlation via Prototype Attentions for Single-network Semi-supervised Breast Tumor Segmentation},
  booktitle = CVPR25,
  pages     = {15632--15641},
  year      = {2025},
  bibsource = {http://www.visionbib.com/bibliography/match607seco3.html#TT129711},
}

@inproceedings{bb133678,
  author    = {Huang, J. and Liu, T. and Wu, Y.H. and Qu, X. and Liu, L.Q. and Hu, X.L.},
  title     = {{MTADiffusion}: Mask Text Alignment Diffusion Model for Object Inpainting},
  booktitle = CVPR25,
  pages     = {18325--18334},
  year      = {2025},
  bibsource = {http://www.visionbib.com/bibliography/match607seco3.html#TT129712},
}

@inproceedings{bb133679,
  author    = {Qian, Q. and Chen, H.S. and Tomizuka, M. and Keutzer, K. and Wang, Q.Q. and Xu, C.F.},
  title     = {Bridging Viewpoint Gaps: Geometric Reasoning Boosts Semantic Correspondence},
  booktitle = CVPR25,
  pages     = {11579--11589},
  year      = {2025},
  bibsource = {http://www.visionbib.com/bibliography/match607seco3.html#TT129713},
}

@inproceedings{bb133680,
  author    = {Zhang, Z.X. and Wang, Y.X. and Cheng, L. and Zhong, Z. and Guo, D. and Wang, M.},
  title     = {{ASAP}: Advancing Semantic Alignment Promotes Multi-Modal Manipulation Detecting and Grounding},
  booktitle = CVPR25,
  pages     = {4005--4014},
  year      = {2025},
  bibsource = {http://www.visionbib.com/bibliography/match607seco3.html#TT129714},
}

% NOTE(review): the source record read "Redefining  in Dictionary" with an
% empty gap, consistent with an angle-bracketed token having been stripped.
% The token is restored here as <Creative>, as in the published title --
% confirm against the proceedings.
@inproceedings{bb133681,
  author    = {Feng, F. and Xie, Y.C. and Yang, X. and Wang, J. and Geng, X.},
  title     = {Redefining {{\textless}Creative{\textgreater}} in Dictionary: Towards an Enhanced Semantic Understanding of Creative Generation},
  booktitle = CVPR25,
  pages     = {18444--18454},
  year      = {2025},
  bibsource = {http://www.visionbib.com/bibliography/match607seco3.html#TT129715},
}

@inproceedings{bb133682,
  author    = {Wandel, K. and Wang, H.S.},
  title     = {SemAlign3D: Semantic Correspondence between RGB-Images through
Aligning 3D Object-Class Representations},
  booktitle = CVPR25,
  year      = {2025},
  pages     = {1138-1147},
  bibsource = {http://www.visionbib.com/bibliography/match607seco3.html#TT129716},
}

@inproceedings{bb133683,
  author    = {Fundel, F. and Schusterbauer, J. and Hu, V.T. and Ommer, B.},
  title     = {Distillation of Diffusion Features for Semantic Correspondence},
  booktitle = WACV25,
  year      = {2025},
  pages     = {6762-6774},
  bibsource = {http://www.visionbib.com/bibliography/match607seco3.html#TT129717},
}

@inproceedings{bb133684,
        AUTHOR = "Ju, Y.C. and Hu, K.Z. and Zhang, G. and Zhang, G. and Jiang, M. and Xu, H.Z.",
        TITLE = "Robo-ABC: Affordance Generalization Beyond Categories via Semantic
Correspondence for Robot Manipulation",
        BOOKTITLE = ECCV24,
        YEAR = "2024",
        PAGES = "XLI: 222-239",
        BIBSOURCE = "http://www.visionbib.com/bibliography/match607seco3.html#TT129718"}

@inproceedings{bb133685,
  author    = {Wang, P.Y. and Ikeda, T. and Lee, R. and Nishiwaki, K.},
  title     = {GS-Pose: Category-level Object Pose Estimation via Geometric and
Semantic Correspondence},
  booktitle = ECCV24,
  year      = {2024},
  pages     = {XXVII: 108-126},
  bibsource = {http://www.visionbib.com/bibliography/match607seco3.html#TT129719},
}

@inproceedings{bb133686,
  author    = {Park, C. and Kim, S. and Park, J. and Cho, M.},
  title     = {Learning SO(3)-Invariant Semantic Correspondence via Local Shape
Transform},
  booktitle = CVPR24,
  year      = {2024},
  pages     = {22978-22987},
  bibsource = {http://www.visionbib.com/bibliography/match607seco3.html#TT129720},
}

@inproceedings{bb133687,
        AUTHOR = "Mariotti, O. and Mac Aodha, O. and Bilen, H.",
        TITLE = "Improving Semantic Correspondence with Viewpoint-Guided Spherical
Maps",
        BOOKTITLE = CVPR24,
        YEAR = "2024",
        PAGES = "19521-19530",
        BIBSOURCE = "http://www.visionbib.com/bibliography/match607seco3.html#TT129721"}

@inproceedings{bb133688,
  author    = {Sun, Y.X. and Yin, Z.Y. and Wang, H.B. and Wang, Y. and Qiu, X.P. and Ge, W.F. and Zhang, W.Q.},
  title     = {Pixel-Level Semantic Correspondence Through Layout-Aware
Representation Learning and Multi-Scale Matching Integration},
  booktitle = CVPR24,
  year      = {2024},
  pages     = {17047-17056},
  bibsource = {http://www.visionbib.com/bibliography/match607seco3.html#TT129722},
}

@inproceedings{bb133689,
  author    = {Park, J.H. and Lee, G. and Park, S. and Cho, S.I.},
  title     = {Not All Classes Stand on Same Embeddings:
Calibrating a Semantic Distance with Metric Tensor},
  booktitle = CVPR24,
  year      = {2024},
  pages     = {17722-17731},
  bibsource = {http://www.visionbib.com/bibliography/match607seco3.html#TT129723},
}

@inproceedings{bb133690,
  author    = {Gu, Y.C. and Zhou, Y.P. and Wu, B. and Yu, L.C. and Liu, J.W. and Zhao, R. and Wu, J.Z.J. and Zhang, D.J.H. and Shou, M.Z. and Tang, K.},
  title     = {VideoSwap: Customized Video Subject Swapping with Interactive
Semantic Point Correspondence},
  booktitle = CVPR24,
  year      = {2024},
  pages     = {7621-7630},
  bibsource = {http://www.visionbib.com/bibliography/match607seco3.html#TT129724},
}

@inproceedings{bb133691,
  author    = {Kim, S. and Min, J. and Cho, M.},
  title     = {Efficient Semantic Matching with Hypercolumn Correlation},
  booktitle = WACV24,
  year      = {2024},
  pages     = {138-147},
  bibsource = {http://www.visionbib.com/bibliography/match607seco3.html#TT129725},
}

@inproceedings{bb133692,
        AUTHOR = "Xie, X.J. and Liu, F. and Gai, S. and Huang, Z. and Hu, M.H. and Wang, A.",
        TITLE = "HSS: A Hierarchical Semantic Similarity Hard Negative Sampling Method
for Dense Retrievers",
        BOOKTITLE = MMMod23,
        YEAR = "2023",
        PAGES = "II: 301-312",
        BIBSOURCE = "http://www.visionbib.com/bibliography/match607seco3.html#TT129726"}

@inproceedings{bb133693,
  author    = {Cai, R. and Tung, J. and Wang, Q.Q. and Averbuch Elor, H. and Hariharan, B. and Snavely, N.},
  title     = {Doppelgangers: Learning to Disambiguate Images of Similar Structures},
  booktitle = ICCV23,
  year      = {2023},
  pages     = {34-44},
  bibsource = {http://www.visionbib.com/bibliography/match607seco3.html#TT129727},
}

@inproceedings{bb133694,
  author    = {Huang, Y.W. and Sun, Y.X. and Lai, C.H. and Xu, Q. and Wang, X.M. and Shen, X.L. and Ge, W.F.},
  title     = {Weakly Supervised Learning of Semantic Correspondence through
Cascaded Online Correspondence Refinement},
  booktitle = ICCV23,
  year      = {2023},
  pages     = {16208-16217},
  bibsource = {http://www.visionbib.com/bibliography/match607seco3.html#TT129728},
}

@inproceedings{bb133695,
        AUTHOR = "Shtedritski, A. and Vedaldi, A. and Rupprecht, C.",
        TITLE = "Learning Universal Semantic Correspondences with No Supervision and
Automatic Data Curation",
        BOOKTITLE = LIMIT23,
        YEAR = "2023",
        PAGES = "933-943",
        BIBSOURCE = "http://www.visionbib.com/bibliography/match607seco3.html#TT129729"}

@inproceedings{bb133696,
  author    = {Tang, C.F. and Xie, L.X. and Zhang, X.P. and Hu, X.L. and Tian, Q.},
  title     = {Visual Recognition by Request},
  booktitle = CVPR23,
  year      = {2023},
  pages     = {15265-15274},
  bibsource = {http://www.visionbib.com/bibliography/match607seco3.html#TT129730},
}

@inproceedings{bb133697,
  author    = {Sun, Y.X. and Huang, Y.W. and Guo, H.J. and Zhao, Y.Z. and Wu, R.M. and Yu, Y.Z. and Ge, W.F. and Zhang, W.Q.},
  title     = {MISC210K: A Large-Scale Dataset for Multi-Instance Semantic
Correspondence},
  booktitle = CVPR23,
  year      = {2023},
  pages     = {7121-7130},
  bibsource = {http://www.visionbib.com/bibliography/match607seco3.html#TT129731},
}

@inproceedings{bb133698,
  author    = {Sabir, A. and Moreno Noguer, F. and Padro, L.},
  title     = {Visual Semantic Relatedness Dataset for Image Captioning},
  booktitle = ODRUM23,
  year      = {2023},
  pages     = {5598-5606},
  bibsource = {http://www.visionbib.com/bibliography/match607seco3.html#TT129732},
}

@inproceedings{bb133699,
  author    = {Zeng, Z.Q. and Zhang, H. and Lu, R.Y. and Wang, D.S. and Chen, B. and Wang, Z.J.},
  title     = {ConZIC: Controllable Zero-shot Image Captioning by Sampling-Based
Polishing},
  booktitle = CVPR23,
  year      = {2023},
  pages     = {23465-23476},
  bibsource = {http://www.visionbib.com/bibliography/match607seco3.html#TT129733},
}

Last update: Nov 10, 2025 at 14:27:42