@article{bb250600,
AUTHOR = "Peng, Y. and Chi, J.",
TITLE = "Unsupervised Cross-Media Retrieval Using Domain Adaptation With Scene
Graph",
JOURNAL = CirSysVideo,
VOLUME = "30",
YEAR = "2020",
NUMBER = "11",
MONTH = nov,
PAGES = "4368--4379",
BIBSOURCE = "http://www.visionbib.com/bibliography/applicat830cm1.html#TT245435"}
@article{bb250601,
AUTHOR = "Zhu, L. and Song, J.Y. and Zhu, X.F. and Zhang, C.Y. and Zhang, S.C. and Yuan, X.P.",
TITLE = "Adversarial Learning-Based Semantic Correlation Representation for
Cross-Modal Retrieval",
JOURNAL = MultMedMag,
VOLUME = "27",
YEAR = "2020",
NUMBER = "4",
MONTH = oct,
PAGES = "79--90",
BIBSOURCE = "http://www.visionbib.com/bibliography/applicat830cm1.html#TT245436"}
@article{bb250602,
AUTHOR = "Zhu, L. and Zhang, C.Y. and Song, J.Y. and Zhang, S.C. and Tian, C.W. and Zhu, X.H.",
TITLE = "Deep Multigraph Hierarchical Enhanced Semantic Representation for
Cross-Modal Retrieval",
JOURNAL = MultMedMag,
VOLUME = "29",
YEAR = "2022",
NUMBER = "3",
MONTH = jul,
PAGES = "17--26",
BIBSOURCE = "http://www.visionbib.com/bibliography/applicat830cm1.html#TT245437"}
@article{bb250603,
AUTHOR = "Chaudhuri, U. and Banerjee, B. and Bhattacharya, A. and Datcu, M.",
TITLE = "{CrossATNet}: A novel cross-attention based framework for sketch-based
image retrieval",
JOURNAL = IVC,
VOLUME = "104",
YEAR = "2020",
PAGES = "104003",
BIBSOURCE = "http://www.visionbib.com/bibliography/applicat830cm1.html#TT245438"}
@article{bb250604,
AUTHOR = "Zhang, Y. and Zhou, W. and Wang, M. and Tian, Q. and Li, H.",
TITLE = "Deep Relation Embedding for Cross-Modal Retrieval",
JOURNAL = IP,
VOLUME = "30",
YEAR = "2021",
PAGES = "617--627",
BIBSOURCE = "http://www.visionbib.com/bibliography/applicat830cm1.html#TT245439"}
@article{bb250605,
AUTHOR = "Zhang, L. and Chen, L.T. and Ou, W.H. and Zhou, C.",
TITLE = "Semi-supervised cross-modal representation learning with {GAN}-based
Asymmetric Transfer Network",
JOURNAL = JVCIR,
VOLUME = "73",
YEAR = "2020",
PAGES = "102899",
BIBSOURCE = "http://www.visionbib.com/bibliography/applicat830cm1.html#TT245440"}
@article{bb250606,
AUTHOR = "Matsubara, T.",
TITLE = "Target-Oriented Deformation of Visual-Semantic Embedding Space",
JOURNAL = IEICE,
VOLUME = "E104-D",
YEAR = "2021",
NUMBER = "1",
MONTH = jan,
PAGES = "24--33",
BIBSOURCE = "http://www.visionbib.com/bibliography/applicat830cm1.html#TT245441"}
@article{bb250607,
AUTHOR = "Wu, Y. and Wang, S. and Song, G. and Huang, Q.",
TITLE = "Augmented Adversarial Training for Cross-Modal Retrieval",
JOURNAL = MultMed,
VOLUME = "23",
YEAR = "2021",
PAGES = "559--571",
BIBSOURCE = "http://www.visionbib.com/bibliography/applicat830cm1.html#TT245442"}
@article{bb250608,
AUTHOR = "Qi, M. and Qin, J. and Yang, Y. and Wang, Y. and Luo, J.",
TITLE = "Semantics-Aware Spatial-Temporal Binaries for Cross-Modal Video
Retrieval",
JOURNAL = IP,
VOLUME = "30",
YEAR = "2021",
PAGES = "2989--3004",
BIBSOURCE = "http://www.visionbib.com/bibliography/applicat830cm1.html#TT245443"}
@article{bb250609,
  author    = {Wu, J.L. and Xie, X.X. and Nie, L.Q. and Lin, Z.C. and Zha, H.B.},
  title     = {Reconstruction regularized low-rank subspace learning for cross-modal retrieval},
  journal   = PR,
  volume    = {113},
  year      = {2021},
  pages     = {107813},
  bibsource = {http://www.visionbib.com/bibliography/applicat830cm1.html#TT245444},
}
@article{bb250610,
  author    = {Shu, X. and Zhao, G.Y.},
  title     = {Scalable multi-label canonical correlation analysis for cross-modal retrieval},
  journal   = PR,
  volume    = {115},
  year      = {2021},
  pages     = {107905},
  bibsource = {http://www.visionbib.com/bibliography/applicat830cm1.html#TT245445},
}
@article{bb250611,
AUTHOR = "Song, G. and Tan, X.Y.",
TITLE = "Real-world Cross-modal Retrieval via Sequential Learning",
JOURNAL = MultMed,
VOLUME = "23",
YEAR = "2021",
PAGES = "1708--1721",
BIBSOURCE = "http://www.visionbib.com/bibliography/applicat830cm1.html#TT245446"}
@inproceedings{bb250612,
AUTHOR = "Song, G. and Tan, X.Y.",
TITLE = "Sequential Learning for Cross-Modal Retrieval",
BOOKTITLE = CroMoL19,
YEAR = "2019",
PAGES = "4531--4539",
BIBSOURCE = "http://www.visionbib.com/bibliography/applicat830cm1.html#TT245447"}
@article{bb250613,
  author    = {Chen, W. and Liu, Y. and Bakker, E.M. and Lew, M.S.},
  title     = {Integrating information theory and adversarial learning for cross-modal retrieval},
  journal   = PR,
  volume    = {117},
  year      = {2021},
  pages     = {107983},
  bibsource = {http://www.visionbib.com/bibliography/applicat830cm1.html#TT245448},
}
@article{bb250614,
AUTHOR = "Huang, Z.Y. and Zhou, J.T.Y. and Zhu, H.Y. and Zhang, C.Q. and Lv, J.C. and Peng, X.",
TITLE = "Deep Spectral Representation Learning from Multi-View Data",
JOURNAL = IP,
VOLUME = "30",
YEAR = "2021",
PAGES = "5352--5362",
BIBSOURCE = "http://www.visionbib.com/bibliography/applicat830cm1.html#TT245449"}
@article{bb250615,
AUTHOR = "Wen, X. and Han, Z.Z. and Liu, Y.S.",
TITLE = "{CMPD}: Using Cross Memory Network With Pair Discrimination for
Image-Text Retrieval",
JOURNAL = CirSysVideo,
VOLUME = "31",
YEAR = "2021",
NUMBER = "6",
MONTH = jun,
PAGES = "2427--2437",
BIBSOURCE = "http://www.visionbib.com/bibliography/applicat830cm1.html#TT245450"}
@article{bb250616,
AUTHOR = "Liu, J.H. and Yang, M. and Li, C.M. and Xu, R.F.",
TITLE = "Improving Cross-Modal Image-Text Retrieval With Teacher-Student
Learning",
JOURNAL = CirSysVideo,
VOLUME = "31",
YEAR = "2021",
NUMBER = "8",
MONTH = aug,
PAGES = "3242--3253",
BIBSOURCE = "http://www.visionbib.com/bibliography/applicat830cm1.html#TT245451"}
@article{bb250617,
  author    = {Zhang, L. and Wu, X.Q.},
  title     = {Multi-task framework based on feature separation and reconstruction for cross-modal retrieval},
  journal   = PR,
  volume    = {122},
  year      = {2022},
  pages     = {108217},
  bibsource = {http://www.visionbib.com/bibliography/applicat830cm1.html#TT245452},
}
@article{bb250618,
AUTHOR = "Liu, F. and Gao, C.Q. and Sun, Y.Q. and Zhao, Y. and Yang, F. and Qin, A. and Meng, D.Y.",
TITLE = "Infrared and Visible Cross-Modal Image Retrieval Through Shared
Features",
JOURNAL = CirSysVideo,
VOLUME = "31",
YEAR = "2021",
NUMBER = "11",
MONTH = nov,
PAGES = "4485--4496",
BIBSOURCE = "http://www.visionbib.com/bibliography/applicat830cm1.html#TT245453"}
@article{bb250619,
AUTHOR = "Wang, C.Y. and Li, L. and Yan, C.G. and Wang, Z. and Sun, Y.Q. and Zhang, J.Y.",
TITLE = "Cross-modal semantic correlation learning by {Bi-CNN} network",
JOURNAL = IET-IPR,
VOLUME = "15",
YEAR = "2021",
NUMBER = "14",
PAGES = "3674--3684",
BIBSOURCE = "http://www.visionbib.com/bibliography/applicat830cm1.html#TT245454"}
@inproceedings{bb250620,
AUTHOR = "Chakraborty, B. and Wang, P. and Wang, L.",
TITLE = "Inter-Modality Fusion Based Attention for Zero-Shot Cross-Modal
Retrieval",
BOOKTITLE = ICIP21,
YEAR = "2021",
PAGES = "2648--2652",
BIBSOURCE = "http://www.visionbib.com/bibliography/applicat830cm1.html#TT245455"}
@article{bb250621,
AUTHOR = "Shin, A. and Ishii, M. and Narihira, T.",
TITLE = "Perspectives and Prospects on Transformer Architecture for Cross-Modal
Tasks with Language and Vision",
JOURNAL = IJCV,
VOLUME = "130",
YEAR = "2022",
NUMBER = "2",
MONTH = feb,
PAGES = "435--454",
BIBSOURCE = "http://www.visionbib.com/bibliography/applicat830cm1.html#TT245456"}
@article{bb250622,
AUTHOR = "Ji, Z. and Wang, H.R. and Han, J.G. and Pang, Y.W.",
TITLE = "{SMAN}: Stacked Multimodal Attention Network for Cross-Modal Image-Text
Retrieval",
JOURNAL = Cyber,
VOLUME = "52",
YEAR = "2022",
NUMBER = "2",
MONTH = feb,
PAGES = "1086--1097",
BIBSOURCE = "http://www.visionbib.com/bibliography/applicat830cm1.html#TT245457"}
@comment{bb250623: the source carried the placeholder page range xx-yy, which would print literally. PAGES is omitted until the real article number is confirmed.}
@article{bb250623,
AUTHOR = "Ma, J.J. and Shi, D. and Tang, X. and Zhang, X.R. and Jiao, L.C.",
TITLE = "Dual Modality Collaborative Learning for Cross-Source Remote Sensing
Retrieval",
JOURNAL = RS,
VOLUME = "14",
YEAR = "2022",
NUMBER = "6",
BIBSOURCE = "http://www.visionbib.com/bibliography/applicat830cm1.html#TT245458"}
@article{bb250624,
AUTHOR = "Huang, Y. and Wang, J.D. and Wang, L.",
TITLE = "Few-Shot Image and Sentence Matching via Aligned Cross-Modal Memory",
JOURNAL = PAMI,
VOLUME = "44",
YEAR = "2022",
NUMBER = "6",
MONTH = jun,
PAGES = "2968--2983",
BIBSOURCE = "http://www.visionbib.com/bibliography/applicat830cm1.html#TT245459"}
@inproceedings{bb250625,
AUTHOR = "Huang, Y. and Wang, L.",
TITLE = "{ACMM}: Aligned Cross-Modal Memory for Few-Shot Image and Sentence
Matching",
BOOKTITLE = ICCV19,
YEAR = "2019",
PAGES = "5773--5782",
BIBSOURCE = "http://www.visionbib.com/bibliography/applicat830cm1.html#TT245460"}
@article{bb250626,
AUTHOR = "Xu, X. and Lin, K.Y. and Yang, Y. and Hanjalic, A. and Shen, H.T.",
TITLE = "Joint Feature Synthesis and Embedding:
Adversarial Cross-Modal Retrieval Revisited",
JOURNAL = PAMI,
VOLUME = "44",
YEAR = "2022",
NUMBER = "6",
MONTH = jun,
PAGES = "3030--3047",
BIBSOURCE = "http://www.visionbib.com/bibliography/applicat830cm1.html#TT245461"}
@article{bb250627,
AUTHOR = "Hamroun, M. and Tamine, K. and Crespin, B.",
TITLE = "Multimodal Video Indexing ({MVI}): A New Method Based on Machine Learning
and Semi-Automatic Annotation on Large Video Collections",
JOURNAL = IJIG,
VOLUME = "22",
YEAR = "2022",
NUMBER = "2",
MONTH = apr,
PAGES = "2250022",
BIBSOURCE = "http://www.visionbib.com/bibliography/applicat830cm1.html#TT245462"}
@article{bb250628,
  author    = {Parida, K.K. and Sharma, G.},
  title     = {Discriminative semantic transitive consistency for cross-modal learning},
  journal   = CVIU,
  volume    = {219},
  year      = {2022},
  pages     = {103404},
  bibsource = {http://www.visionbib.com/bibliography/applicat830cm1.html#TT245463},
}
@article{bb250629,
AUTHOR = "Song, X. and Chen, J.J. and Wu, Z.X. and Jiang, Y.G.",
TITLE = "Spatial-Temporal Graphs for Cross-Modal {Text2Video} Retrieval",
JOURNAL = MultMed,
VOLUME = "24",
YEAR = "2022",
PAGES = "2914--2923",
BIBSOURCE = "http://www.visionbib.com/bibliography/applicat830cm1.html#TT245464"}
@article{bb250630,
AUTHOR = "Ma, X.H. and Yang, X.S. and Gao, J.Y. and Xu, C.S.",
TITLE = "The Model May Fit You: User-Generalized Cross-Modal Retrieval",
JOURNAL = MultMed,
VOLUME = "24",
YEAR = "2022",
PAGES = "2998--3012",
BIBSOURCE = "http://www.visionbib.com/bibliography/applicat830cm1.html#TT245465"}
@article{bb250631,
  author    = {Shan, W. and Huang, D. and Wang, J.T. and Zou, F. and Li, S.},
  title     = {Self-Attention based fine-grained cross-media hybrid network},
  journal   = PR,
  volume    = {130},
  year      = {2022},
  pages     = {108748},
  bibsource = {http://www.visionbib.com/bibliography/applicat830cm1.html#TT245466},
}
@article{bb250632,
AUTHOR = "Qian, S.S. and Xue, D.Z. and Fang, Q. and Xu, C.S.",
TITLE = "Adaptive Label-Aware Graph Convolutional Networks for Cross-Modal
Retrieval",
JOURNAL = MultMed,
VOLUME = "24",
YEAR = "2022",
PAGES = "3520--3532",
BIBSOURCE = "http://www.visionbib.com/bibliography/applicat830cm1.html#TT245467"}
@article{bb250633,
AUTHOR = "Wang, Y. and Peng, Y.X.",
TITLE = "{MARS}: Learning Modality-Agnostic Representation for Scalable
Cross-Media Retrieval",
JOURNAL = CirSysVideo,
VOLUME = "32",
YEAR = "2022",
NUMBER = "7",
MONTH = jul,
PAGES = "4765--4777",
BIBSOURCE = "http://www.visionbib.com/bibliography/applicat830cm1.html#TT245468"}
@article{bb250634,
  author    = {Liu, G.H. and Li, Z.Y. and Yang, J.Y. and Zhang, D.},
  title     = {Exploiting sublimated deep features for image retrieval},
  journal   = PR,
  volume    = {147},
  year      = {2024},
  pages     = {110076},
  bibsource = {http://www.visionbib.com/bibliography/applicat830cm1.html#TT245469},
}
@article{bb250635,
AUTHOR = "Liu, G.H. and Li, Z.Y. and Zhang, D.",
TITLE = "Exploiting {Hu} invariant moments and deep features for image retrieval",
JOURNAL = PR,
VOLUME = "173",
YEAR = "2026",
PAGES = "112801",
BIBSOURCE = "http://www.visionbib.com/bibliography/applicat830cm1.html#TT245470"}
@article{bb250636,
AUTHOR = "Liu, Z. and Zhao, F.Y. and Zhang, M.M.",
TITLE = "An Efficient Multimodal Aggregation Network for Video-Text Retrieval",
JOURNAL = IEICE,
VOLUME = "E105-D",
YEAR = "2022",
NUMBER = "10",
MONTH = oct,
PAGES = "1825--1828",
BIBSOURCE = "http://www.visionbib.com/bibliography/applicat830cm1.html#TT245471"}
@article{bb250637,
AUTHOR = "Guo, D.J. and Su, X.M. and Lian, Y. and Liu, L.M. and Wang, H.B.",
TITLE = "Two-stage partial image-text clustering ({TPIT-C})",
JOURNAL = IET-CV,
VOLUME = "16",
YEAR = "2022",
NUMBER = "8",
PAGES = "694--708",
BIBSOURCE = "http://www.visionbib.com/bibliography/applicat830cm1.html#TT245472"}
@article{bb250638,
AUTHOR = "Jin, M. and Zhang, H.X. and Zhu, L. and Sun, J.D. and Liu, L.",
TITLE = "Video Sampled Frame Category Aggregation and Consistent
Representation for Cross-Modal Retrieval",
JOURNAL = CirSysVideo,
VOLUME = "33",
YEAR = "2023",
NUMBER = "2",
MONTH = feb,
PAGES = "909--919",
BIBSOURCE = "http://www.visionbib.com/bibliography/applicat830cm1.html#TT245473"}
@article{bb250639,
AUTHOR = "Liao, L. and Yang, M. and Zhang, B.",
TITLE = "Deep Supervised Dual Cycle Adversarial Network for Cross-Modal
Retrieval",
JOURNAL = CirSysVideo,
VOLUME = "33",
YEAR = "2023",
NUMBER = "2",
MONTH = feb,
PAGES = "920--934",
BIBSOURCE = "http://www.visionbib.com/bibliography/applicat830cm1.html#TT245474"}
@article{bb250640,
  author    = {Gong, Y. and Cosma, G.},
  title     = {Improving visual-semantic embeddings by learning semantically-enhanced hard negatives for cross-modal information retrieval},
  journal   = PR,
  volume    = {137},
  year      = {2023},
  pages     = {109272},
  bibsource = {http://www.visionbib.com/bibliography/applicat830cm1.html#TT245475},
}
@article{bb250641,
AUTHOR = "Li, W.H. and Wang, Y. and Su, Y.T. and Li, X.Y. and Liu, A.A. and Zhang, Y.D.",
TITLE = "Multi-Scale Fine-Grained Alignments for Image and Sentence Matching",
JOURNAL = MultMed,
VOLUME = "25",
YEAR = "2023",
PAGES = "543--556",
BIBSOURCE = "http://www.visionbib.com/bibliography/applicat830cm1.html#TT245476"}
@article{bb250642,
AUTHOR = "Hu, P. and Huang, Z.Y. and Peng, D.Z. and Wang, X. and Peng, X.",
TITLE = "Cross-Modal Retrieval With Partially Mismatched Pairs",
JOURNAL = PAMI,
VOLUME = "45",
YEAR = "2023",
NUMBER = "8",
MONTH = aug,
PAGES = "9595--9610",
BIBSOURCE = "http://www.visionbib.com/bibliography/applicat830cm1.html#TT245477"}
@article{bb250643,
AUTHOR = "Liu, Y.X. and Wu, J.L. and Qu, L. and Gan, T. and Yin, J.H. and Nie, L.Q.",
TITLE = "Self-Supervised Correlation Learning for Cross-Modal Retrieval",
JOURNAL = MultMed,
VOLUME = "25",
YEAR = "2023",
PAGES = "2851--2863",
BIBSOURCE = "http://www.visionbib.com/bibliography/applicat830cm1.html#TT245478"}
@article{bb250644,
  author    = {Sun, C. and Zhang, H.X. and Liu, L. and Liu, D.M. and Wang, L.},
  title     = {Multi-Label Adversarial Fine-Grained Cross-Modal Retrieval},
  journal   = SP:IC,
  volume    = {117},
  year      = {2023},
  pages     = {117018},
  bibsource = {http://www.visionbib.com/bibliography/applicat830cm1.html#TT245479},
}
@article{bb250645,
  author    = {Guo, S.T. and Zhang, H.X. and Liu, L. and Liu, D.M. and Lu, X. and Li, L.J.},
  title     = {Hypergraph clustering based multi-label cross-modal retrieval},
  journal   = JVCIR,
  volume    = {103},
  year      = {2024},
  pages     = {104258},
  bibsource = {http://www.visionbib.com/bibliography/applicat830cm1.html#TT245480},
}
@article{bb250646,
AUTHOR = "Song, D. and Ling, Y.T. and Li, T. and Wang, T. and Li, X.Y.",
TITLE = "Hierarchical deep semantic alignment for cross-domain {3D} model
retrieval",
JOURNAL = JVCIR,
VOLUME = "95",
YEAR = "2023",
PAGES = "103895",
BIBSOURCE = "http://www.visionbib.com/bibliography/applicat830cm1.html#TT245481"}
@article{bb250647,
AUTHOR = "Li, T.B. and Liu, A.A. and Song, D. and Li, W.H. and Li, X.Y. and Su, Y.T.",
TITLE = "Focus on Hard Samples: Hierarchical Unbiased Constraints for
Cross-Domain {3D} Model Retrieval",
JOURNAL = CirSysVideo,
VOLUME = "33",
YEAR = "2023",
NUMBER = "11",
MONTH = nov,
PAGES = "7036--7049",
BIBSOURCE = "http://www.visionbib.com/bibliography/applicat830cm1.html#TT245482"}
@article{bb250648,
AUTHOR = "Dong, X. and Zhan, X.L. and Wei, Y.C. and Wei, X.Y. and Wang, Y.W. and Lu, M.L. and Cao, X.C. and Liang, X.D.",
TITLE = "Entity-Graph Enhanced Cross-Modal Pretraining for Instance-Level
Product Retrieval",
JOURNAL = PAMI,
VOLUME = "45",
YEAR = "2023",
NUMBER = "11",
MONTH = nov,
PAGES = "13117--13133",
BIBSOURCE = "http://www.visionbib.com/bibliography/applicat830cm1.html#TT245483"}
@inproceedings{bb250649,
AUTHOR = "Zhan, X.L. and Wu, Y.X. and Dong, X. and Wei, Y.C. and Lu, M.L. and Zhang, Y.C. and Xu, H. and Liang, X.D.",
TITLE = "{Product1M}: Towards Weakly Supervised Instance-Level Product Retrieval
via Cross-Modal Pretraining",
BOOKTITLE = ICCV21,
YEAR = "2021",
PAGES = "11762--11771",
BIBSOURCE = "http://www.visionbib.com/bibliography/applicat830cm1.html#TT245484"}
@article{bb250650,
  author    = {Zhang, X. and Li, W.P. and Wang, X. and Wang, L. and Zheng, F.Z. and Wang, L. and Zhang, H.},
  title     = {A Fusion Encoder with Multi-Task Guidance for Cross-Modal Text-Image Retrieval in Remote Sensing},
  journal   = RS,
  volume    = {15},
  number    = {18},
  year      = {2023},
  pages     = {4637},
  bibsource = {http://www.visionbib.com/bibliography/applicat830cm1.html#TT245485},
}
@article{bb250651,
  author    = {Xu, L.X. and Wang, L. and Zhang, J.Z. and Ha, D. and Zhang, H.},
  title     = {A Review of Cross-Modal Image-Text Retrieval in Remote Sensing},
  journal   = RS,
  volume    = {17},
  number    = {24},
  year      = {2025},
  pages     = {3995},
  bibsource = {http://www.visionbib.com/bibliography/applicat830cm1.html#TT245486},
}
@article{bb250652,
  author    = {Ye, Z.S. and Yao, L. and Zhang, Y. and Gustin, S.},
  title     = {Self-supervised cross-modal visual retrieval from brain activities},
  journal   = PR,
  volume    = {145},
  year      = {2024},
  pages     = {109915},
  bibsource = {http://www.visionbib.com/bibliography/applicat830cm1.html#TT245487},
}
@article{bb250653,
AUTHOR = "Chen, Z.J. and Zhang, Y. and Mi, S.",
TITLE = "Assisting Multimodal Named Entity Recognition by cross-modal
auxiliary tasks",
JOURNAL = PRL,
VOLUME = "175",
YEAR = "2023",
PAGES = "52--58",
BIBSOURCE = "http://www.visionbib.com/bibliography/applicat830cm1.html#TT245488"}
@comment{bb250654: the source carried the placeholder page range xx-yy, which would print literally. PAGES is omitted until the real article number is confirmed.}
@article{bb250654,
AUTHOR = "Li, Z.X. and Zhao, W.Z. and Du, X.Y. and Zhou, G.Y. and Zhang, S.L.",
TITLE = "Cross-Modal Retrieval and Semantic Refinement for Remote Sensing
Image Captioning",
JOURNAL = RS,
VOLUME = "16",
YEAR = "2024",
NUMBER = "1",
BIBSOURCE = "http://www.visionbib.com/bibliography/applicat830cm1.html#TT245489"}
@article{bb250655,
AUTHOR = "Xu, R.Q. and Mayer, W. and Chu, H.L. and Zhang, Y. and Zhang, H.Y. and Wang, Y.L. and Liu, Y. and Feng, Z.",
TITLE = "Automatic semantic modeling of structured data sources with
cross-modal retrieval",
JOURNAL = PRL,
VOLUME = "177",
YEAR = "2024",
PAGES = "7--14",
BIBSOURCE = "http://www.visionbib.com/bibliography/applicat830cm1.html#TT245490"}
@article{bb250656,
AUTHOR = "Okamura, D. and Harakawa, R. and Iwahashi, M.",
TITLE = "{LCNME}: Label Correction Using Network Prediction Based on
Memorization Effects for Cross-Modal Retrieval With Noisy Labels",
JOURNAL = CirSysVideo,
VOLUME = "34",
YEAR = "2024",
NUMBER = "1",
MONTH = jan,
PAGES = "590--602",
BIBSOURCE = "http://www.visionbib.com/bibliography/applicat830cm1.html#TT245491"}
@article{bb250657,
AUTHOR = "Zhang, L. and Chen, L. and Zhou, C. and Li, X. and Yang, F. and Yi, Z.",
TITLE = "Weighted Graph-Structured Semantics Constraint Network for
Cross-Modal Retrieval",
JOURNAL = MultMed,
VOLUME = "26",
YEAR = "2024",
PAGES = "1551--1564",
BIBSOURCE = "http://www.visionbib.com/bibliography/applicat830cm1.html#TT245492"}
@article{bb250658,
AUTHOR = "Wang, Y.B. and Wang, S.H. and Luo, H. and Dong, J.F. and Wang, F. and Han, M. and Wang, X. and Wang, M.",
TITLE = "Dual-View Curricular Optimal Transport for Cross-Lingual Cross-Modal
Retrieval",
JOURNAL = IP,
VOLUME = "33",
YEAR = "2024",
PAGES = "1522--1533",
BIBSOURCE = "http://www.visionbib.com/bibliography/applicat830cm1.html#TT245493"}
@article{bb250659,
AUTHOR = "Zhang, H. and Li, Y.D. and Li, X.L.",
TITLE = "Constrained Bipartite Graph Learning for Imbalanced Multi-Modal
Retrieval",
JOURNAL = MultMed,
VOLUME = "26",
YEAR = "2024",
PAGES = "4502--4514",
BIBSOURCE = "http://www.visionbib.com/bibliography/applicat830cm1.html#TT245494"}
@article{bb250660,
AUTHOR = "Wang, Z. and Xu, X. and Wei, J. and Xie, N. and Yang, Y. and Shen, H.T.",
TITLE = "Semantics Disentangling for Cross-Modal Retrieval",
JOURNAL = IP,
VOLUME = "33",
YEAR = "2024",
PAGES = "2226--2237",
BIBSOURCE = "http://www.visionbib.com/bibliography/applicat830cm1.html#TT245495"}
@article{bb250661,
AUTHOR = "Ma, X.R. and Yang, M.X. and Li, Y.F. and Hu, P. and Lv, J.C. and Peng, X.",
TITLE = "Cross-Modal Retrieval With Noisy Correspondence via Consistency
Refining and Mining",
JOURNAL = IP,
VOLUME = "33",
YEAR = "2024",
PAGES = "2587--2598",
BIBSOURCE = "http://www.visionbib.com/bibliography/applicat830cm1.html#TT245496"}
@inproceedings{bb250662,
AUTHOR = "Feng, Y.L. and Zhu, H.Y. and Peng, D.Z. and Peng, X. and Hu, P.",
TITLE = "{RONO}: Robust Discriminative Learning with Noisy Labels for {2D-3D}
Cross-Modal Retrieval",
BOOKTITLE = CVPR23,
YEAR = "2023",
PAGES = "11610--11619",
BIBSOURCE = "http://www.visionbib.com/bibliography/applicat830cm1.html#TT245497"}
@inproceedings{bb250663,
AUTHOR = "Hu, P. and Peng, X. and Zhu, H.Y. and Zhen, L.L. and Lin, J.",
TITLE = "Learning Cross-Modal Retrieval with Noisy Labels",
BOOKTITLE = CVPR21,
YEAR = "2021",
PAGES = "5399--5409",
BIBSOURCE = "http://www.visionbib.com/bibliography/applicat830cm1.html#TT245498"}
@article{bb250664,
  author    = {Ji, Z. and Lin, Z.G. and Wang, H.R. and Pang, Y.W. and Li, X.L.},
  title     = {Multi-task hierarchical convolutional network for visual-semantic cross-modal retrieval},
  journal   = PR,
  volume    = {151},
  year      = {2024},
  pages     = {110398},
  bibsource = {http://www.visionbib.com/bibliography/applicat830cm1.html#TT245499},
}
@article{bb250665,
AUTHOR = "Ji, Z. and Li, Z.H. and Zhang, Y. and Pang, Y.W. and Li, X.L.",
TITLE = "Visual Semantic Contextualization Network for Multi-Query Image
Retrieval",
JOURNAL = MultMed,
VOLUME = "27",
YEAR = "2025",
PAGES = "7067--7080",
BIBSOURCE = "http://www.visionbib.com/bibliography/applicat830cm1.html#TT245500"}
@article{bb250666,
AUTHOR = "Pang, S.M. and Zeng, Y.Y. and Zhao, J.W. and Xue, J.R.",
TITLE = "A Mutually Textual and Visual Refinement Network for Image-Text
Matching",
JOURNAL = MultMed,
VOLUME = "26",
YEAR = "2024",
PAGES = "7555--7566",
BIBSOURCE = "http://www.visionbib.com/bibliography/applicat830cm1.html#TT245501"}
@article{bb250667,
AUTHOR = "Yang, D.K. and Kuang, H.P. and Yang, K. and Li, M.C. and Zhang, L.H.",
TITLE = "Towards Asynchronous Multimodal Signal Interaction and Fusion via
Tailored Transformers",
JOURNAL = SPLetters,
VOLUME = "31",
YEAR = "2024",
PAGES = "1550--1554",
BIBSOURCE = "http://www.visionbib.com/bibliography/applicat830cm1.html#TT245502"}
@article{bb250668,
AUTHOR = "Hou, Y.L. and Zhong, X.J. and Cao, H. and Zhu, Z. and Zhou, Y.F. and Zhang, J.",
TITLE = "A shared-private sentiment analysis approach based on cross-modal
information interaction",
JOURNAL = PRL,
VOLUME = "183",
YEAR = "2024",
PAGES = "140--146",
BIBSOURCE = "http://www.visionbib.com/bibliography/applicat830cm1.html#TT245503"}
@article{bb250669,
AUTHOR = "Chen, S.W. and Liu, S. and Liu, J.",
TITLE = "Type-Specific Modality Alignment for Multi-Modal Information
Extraction",
JOURNAL = SPLetters,
VOLUME = "31",
YEAR = "2024",
PAGES = "1525--1529",
BIBSOURCE = "http://www.visionbib.com/bibliography/applicat830cm1.html#TT245504"}
@article{bb250670,
AUTHOR = "Zheng, Z.Q. and Ren, H. and Wu, Y. and Zhang, W.C. and Lu, H. and Yang, Y. and Shen, H.T.",
TITLE = "Fully Unsupervised Domain-Agnostic Image Retrieval",
JOURNAL = CirSysVideo,
VOLUME = "34",
YEAR = "2024",
NUMBER = "6",
MONTH = jun,
PAGES = "5077--5090",
BIBSOURCE = "http://www.visionbib.com/bibliography/applicat830cm1.html#TT245505"}
@article{bb250671,
  author    = {Zhang, J.Z. and Wang, L. and Zheng, F.Z. and Wang, X. and Zhang, H.},
  title     = {An Enhanced Feature Extraction Framework for Cross-Modal Image-Text Retrieval},
  journal   = RS,
  volume    = {16},
  number    = {12},
  year      = {2024},
  pages     = {2201},
  bibsource = {http://www.visionbib.com/bibliography/applicat830cm1.html#TT245506},
}
@article{bb250672,
AUTHOR = "Cheng, Q.R. and Tan, Z.S. and Wen, K.Y. and Chen, C. and Gu, X.D.",
TITLE = "Semantic Pre-Alignment and Ranking Learning With Unified Framework
for Cross-Modal Retrieval",
JOURNAL = CirSysVideo,
VOLUME = "34",
YEAR = "2024",
NUMBER = "7",
MONTH = jul,
PAGES = "6503--6516",
BIBSOURCE = "http://www.visionbib.com/bibliography/applicat830cm1.html#TT245507"}
@article{bb250673,
  author    = {Xue, P. and Niu, S.},
  title     = {A novel active contour model based on features for image segmentation},
  journal   = PR,
  volume    = {155},
  year      = {2024},
  pages     = {110673},
  bibsource = {http://www.visionbib.com/bibliography/applicat830cm1.html#TT245508},
}
@article{bb250674,
AUTHOR = "Yan, J. and Deng, C. and Huang, H. and Liu, W.",
TITLE = "Causality-Invariant Interactive Mining for Cross-Modal Similarity
Learning",
JOURNAL = PAMI,
VOLUME = "46",
YEAR = "2024",
NUMBER = "9",
MONTH = sep,
PAGES = "6216--6230",
BIBSOURCE = "http://www.visionbib.com/bibliography/applicat830cm1.html#TT245509"}
@article{bb250675,
  author    = {Wu, W.J. and Zhao, Y.Z. and Li, Z. and Li, J.H. and Zhou, H. and Shou, M.Z. and Bai, X.},
  title     = {A large cross-modal video retrieval dataset with reading comprehension},
  journal   = PR,
  volume    = {157},
  year      = {2025},
  pages     = {110818},
  bibsource = {http://www.visionbib.com/bibliography/applicat830cm1.html#TT245510},
}
@article{bb250676,
AUTHOR = "Yuan, Z. and Wu, D. and Zhou, L.",
TITLE = "Achieving the Optimum Rate for Cross-Modal Source Coding",
JOURNAL = MultMed,
VOLUME = "26",
YEAR = "2024",
PAGES = "9722--9735",
BIBSOURCE = "http://www.visionbib.com/bibliography/applicat830cm1.html#TT245511"}
@article{bb250677,
AUTHOR = "Chen, R. and Tan, J.P. and Yang, Z.J. and Yang, X.J. and Dai, Q.Y. and Cheng, Y.Q. and Lin, L.",
TITLE = "{DPHANet}: Discriminative Parallel and Hierarchical Attention Network
for Natural Language Video Localization",
JOURNAL = MultMed,
VOLUME = "26",
YEAR = "2024",
PAGES = "9575--9590",
BIBSOURCE = "http://www.visionbib.com/bibliography/applicat830cm1.html#TT245512"}
@article{bb250678,
AUTHOR = "Zheng, A. and Yuan, F. and Zhang, H.C. and Wang, J.X. and Tang, C. and Li, C.L.",
TITLE = "Public-Private Attributes-Based Variational Adversarial Network for
Audio-Visual Cross-Modal Matching",
JOURNAL = CirSysVideo,
VOLUME = "34",
YEAR = "2024",
NUMBER = "9",
MONTH = sep,
PAGES = "8698--8709",
BIBSOURCE = "http://www.visionbib.com/bibliography/applicat830cm1.html#TT245513"}
@article{bb250679,
AUTHOR = "Li, D. and Du, S.L.",
TITLE = "{ContextMatcher}: Detector-Free Feature Matching With Cross-Modality
Context",
JOURNAL = CirSysVideo,
VOLUME = "34",
YEAR = "2024",
NUMBER = "9",
MONTH = sep,
PAGES = "7922--7934",
BIBSOURCE = "http://www.visionbib.com/bibliography/applicat830cm1.html#TT245514"}
@article{bb250680,
AUTHOR = "Zhang, F. and Zhou, H. and Hua, X.S. and Chen, C. and Luo, X.",
TITLE = "{HOPE}: A Hierarchical Perspective for Semi-Supervised {2D-3D}
Cross-Modal Retrieval",
JOURNAL = PAMI,
VOLUME = "46",
YEAR = "2024",
NUMBER = "12",
MONTH = dec,
PAGES = "8976--8993",
BIBSOURCE = "http://www.visionbib.com/bibliography/applicat830cm1.html#TT245515"}
@article{bb250681,
AUTHOR = "Zhu, Y. and Wu, Y. and Sebe, N. and Yan, Y.",
TITLE = "Vision + {X}: A Survey on Multimodal Learning in the Light of Data",
JOURNAL = PAMI,
VOLUME = "46",
YEAR = "2024",
NUMBER = "12",
MONTH = dec,
PAGES = "9102--9122",
BIBSOURCE = "http://www.visionbib.com/bibliography/applicat830cm1.html#TT245516"}
@article{bb250682,
  author    = {Li, Z. and Guo, C. and Wang, X. and Zhang, H. and Hu, L.},
  title     = {Multi-View Visual Semantic Embedding for Cross-Modal Image-Text Retrieval},
  journal   = PR,
  volume    = {159},
  year      = {2025},
  pages     = {111088},
  bibsource = {http://www.visionbib.com/bibliography/applicat830cm1.html#TT245517},
}
@article{bb250683,
AUTHOR = "Jin, M. and Hu, W.B. and Zhu, L. and Wang, X. and Hong, R.C.",
TITLE = "Based on Spatial and Temporal Implicit Semantic Relational Inference
for Cross-Modal Retrieval",
JOURNAL = CirSysVideo,
VOLUME = "34",
YEAR = "2024",
NUMBER = "11",
MONTH = nov,
PAGES = "11286--11298",
BIBSOURCE = "http://www.visionbib.com/bibliography/applicat830cm1.html#TT245518"}
@article{bb250684,
AUTHOR = "Croitoru, I. and Bogolin, S.V. and Leordeanu, M. and Jin, H.L. and Zisserman, A. and Liu, Y. and Albanie, S.",
TITLE = "{TeachText}: {CrossModal} text-video retrieval through generalized
distillation",
JOURNAL = AI,
VOLUME = "338",
YEAR = "2025",
PAGES = "104235",
BIBSOURCE = "http://www.visionbib.com/bibliography/applicat830cm1.html#TT245519"}
@inproceedings{bb250685,
AUTHOR = "Croitoru, I. and Bogolin, S.V. and Leordeanu, M. and Jin, H.L. and Zisserman, A. and Albanie, S. and Liu, Y.",
TITLE = "{TeachText}:
{CrossModal} Generalized Distillation for Text-Video Retrieval",
BOOKTITLE = ICCV21,
YEAR = "2021",
PAGES = "11563--11573",
BIBSOURCE = "http://www.visionbib.com/bibliography/applicat830cm1.html#TT245520"}
@article{bb250686,
AUTHOR = "Wang, T.S. and Li, F.L. and Zhu, L. and Li, J.J. and Zhang, Z. and Shen, H.T.",
TITLE = "Cross-Modal Retrieval: A Systematic Review of Methods and Future
Directions",
JOURNAL = PIEEE,
VOLUME = "112",
YEAR = "2024",
NUMBER = "11",
MONTH = nov,
PAGES = "1716--1754",
BIBSOURCE = "http://www.visionbib.com/bibliography/applicat830cm1.html#TT245521"}
@article{bb250687,
AUTHOR = "Luo, J.Y. and Zhao, Y.S. and Luo, X. and Xiao, Z.P. and Ju, W. and Shen, L. and Tao, D.C. and Zhang, M.",
TITLE = "Cross-Domain Diffusion With Progressive Alignment for Efficient
Adaptive Retrieval",
JOURNAL = IP,
VOLUME = "34",
YEAR = "2025",
PAGES = "1820--1834",
BIBSOURCE = "http://www.visionbib.com/bibliography/applicat830cm1.html#TT245522"}
@article{bb250688,
AUTHOR = "Zhang, H.W. and Yang, Y. and Qi, F. and Qian, S.S. and Xu, C.S.",
TITLE = "Active Supervised Cross-Modal Retrieval",
JOURNAL = PAMI,
VOLUME = "47",
YEAR = "2025",
NUMBER = "6",
MONTH = jun,
PAGES = "5112--5126",
BIBSOURCE = "http://www.visionbib.com/bibliography/applicat830cm1.html#TT245523"}
@article{bb250689,
AUTHOR = "Dang, Z.H. and Luo, M. and Wang, J.H. and Jia, C.Y. and Han, H.C. and Wan, H. and Dai, G. and Chang, X.J. and Wang, J.D.",
TITLE = "Disentangled Noisy Correspondence Learning",
JOURNAL = IP,
VOLUME = "34",
YEAR = "2025",
PAGES = "2602--2615",
BIBSOURCE = "http://www.visionbib.com/bibliography/applicat830cm1.html#TT245524"}
@article{bb250690,
  author    = {Si, L. and Guo, C. and Li, Z. and Yang, Y.},
  title     = {A unified framework of data augmentation using large language models for text-based cross-modal retrieval},
  journal   = PR,
  volume    = {167},
  year      = {2025},
  pages     = {111755},
  bibsource = {http://www.visionbib.com/bibliography/applicat830cm1.html#TT245525},
}
@article{bb250691,
AUTHOR = "Jin, M. and Hu, W.B. and Hong, R.C. and Zhu, L.",
TITLE = "Revealing Security Flaws in Cross-Modal Retrieval Models Through
Video Poisoning",
JOURNAL = CirSysVideo,
VOLUME = "35",
YEAR = "2025",
NUMBER = "6",
MONTH = jun,
PAGES = "6184--6194",
BIBSOURCE = "http://www.visionbib.com/bibliography/applicat830cm1.html#TT245526"}
@article{bb250692,
  author    = {Li, Y. and Deng, S. and Guan, C.M. and Gao, J.},
  title     = {Complementary two-branch Transformer for multi-label image retrieval},
  journal   = PR,
  volume    = {168},
  year      = {2025},
  pages     = {111806},
  bibsource = {http://www.visionbib.com/bibliography/applicat830cm1.html#TT245527},
}
@article{bb250693,
AUTHOR = "Zheng, C.Y. and Li, X. and Liang, X.Y. and Huang, L. and Du, S. and Nie, J. and Dong, J.Y.",
TITLE = "Cross-Modal Progressive Perspective Matching Network for Remote
Sensing Image-Text Retrieval",
JOURNAL = MultMed,
VOLUME = "27",
YEAR = "2025",
PAGES = "3966--3978",
BIBSOURCE = "http://www.visionbib.com/bibliography/applicat830cm1.html#TT245528"}
@article{bb250694,
AUTHOR = "Pu, R. and Qin, Y. and Peng, D.Z. and Song, X.M. and Zheng, H.M.",
TITLE = "Deep Reversible Consistency Learning for Cross-Modal Retrieval",
JOURNAL = MultMed,
VOLUME = "27",
YEAR = "2025",
PAGES = "4095--4106",
BIBSOURCE = "http://www.visionbib.com/bibliography/applicat830cm1.html#TT245529"}
@article{bb250695,
AUTHOR = "Xu, Y. and Feng, Y.F. and Zhong, X. and Gao, Y. and Wu, Z.Z.",
TITLE = "Hypergraph-Based Remaining Prototype Alignment for Open-Set
Cross-Domain Image Retrieval",
JOURNAL = MultMed,
VOLUME = "27",
YEAR = "2025",
PAGES = "4627--4642",
BIBSOURCE = "http://www.visionbib.com/bibliography/applicat830cm1.html#TT245530"}
@article{bb250696,
  author    = {Jiang, C. and Wang, Y.P. and Xiong, B.P.},
  title     = {Dual similarity enhanced hybrid orthogonal fusion for multimodal named entity recognition},
  journal   = PR,
  volume    = {169},
  year      = {2026},
  pages     = {111940},
  bibsource = {http://www.visionbib.com/bibliography/applicat830cm1.html#TT245531},
}
@article{bb250697,
AUTHOR = "Wang, Z. and Zhu, X.Z. and Yang, X. and Luo, G. and Li, H. and Tian, C.Y. and Dou, W.H. and Ge, J.Q. and Lu, L.W. and Qiao, Y. and Dai, J.F.",
TITLE = "Parameter-Inverted Image Pyramid Networks for Visual Perception and
Multimodal Understanding",
JOURNAL = PAMI,
VOLUME = "47",
YEAR = "2025",
NUMBER = "11",
MONTH = nov,
PAGES = "10142--10159",
BIBSOURCE = "http://www.visionbib.com/bibliography/applicat830cm1.html#TT245532"}
@article{bb250698,
AUTHOR = "Jin, M. and Zhu, L. and Hong, R.C.",
TITLE = "{BiSeR-LMA}: A Bidirectional Semantic Reasoning and Large Model
Enhancement Approach for Text-Video Cross-Modal Retrieval",
JOURNAL = CirSysVideo,
VOLUME = "35",
YEAR = "2025",
NUMBER = "11",
MONTH = nov,
PAGES = "11655--11666",
BIBSOURCE = "http://www.visionbib.com/bibliography/applicat830cm1.html#TT245533"}
@article{bb250699,
  author    = {Jin, M. and Zhang, H.X. and Zhu, L. and Sun, J. and Liu, L.},
  title     = {Video and text semantic center alignment for text-video cross-modal retrieval},
  journal   = SP:IC,
  volume    = {140},
  year      = {2026},
  pages     = {117413},
  bibsource = {http://www.visionbib.com/bibliography/applicat830cm1.html#TT245534},
}
Last update: Mar 28, 2026 at 17:09:41