% Journal article bb114000; PAGES holds a single number rather than a range.
@article{bb114000,
        author = {Saidi, S. and Idbraim, S. and Karmoude, Y. and Masse, A. and Arbelo, M.},
        title = {Deep-Learning for Change Detection Using Multi-Modal Fusion of Remote Sensing Images: A Review},
        journal = RS,
        year = {2024},
        volume = {16},
        number = {20},
        pages = {3852},
        bibsource = {http://www.visionbib.com/bibliography/match-pl502mmf1.html#TT110632}}

@article{bb114001,
        AUTHOR = "Liu, Y. Y. and He, W. and Zhang, H. Y.",
        TITLE = "{GRiD}: Guided Refinement for Detector-Free Multimodal Image Matching",
        JOURNAL = IP,
        VOLUME = "33",
        YEAR = "2024",
        PAGES = "5892--5906",
        BIBSOURCE = "http://www.visionbib.com/bibliography/match-pl502mmf1.html#TT110633"}

@article{bb114002,
        AUTHOR = "Wang, J. P. and Su, N. and Zhao, C. H. and Yan, Y. M. and Feng, S.",
        TITLE = "Multi-Modal Object Detection Method Based on Dual-Branch Asymmetric
Attention Backbone and Feature Fusion Pyramid Network",
        JOURNAL = RS,
        VOLUME = "16",
        YEAR = "2024",
        NUMBER = "20",
        PAGES = "3904",
        BIBSOURCE = "http://www.visionbib.com/bibliography/match-pl502mmf1.html#TT110634"}

@article{bb114003,
        AUTHOR = "Liu, Y. and Liu, F. and Jiao, L. C. and Bao, Q. Y. and Sun, L. and Li, S. and Li, L. L. and Liu, X.",
        TITLE = "Multi-Grained Gradual Inference Model for Multimedia Event Extraction",
        JOURNAL = CirSysVideo,
        VOLUME = "34",
        YEAR = "2024",
        NUMBER = "10",
        MONTH = oct,
        PAGES = "10507--10520",
        BIBSOURCE = "http://www.visionbib.com/bibliography/match-pl502mmf1.html#TT110635"}

@article{bb114004,
        AUTHOR = "Wang, X. X. and Fang, L. X. and Zhao, J. L. and Pan, Z. K. and Li, H. and Li, Y.",
        TITLE = "{MMAE}: A universal image fusion method via mask attention mechanism",
        JOURNAL = PR,
        VOLUME = "158",
        YEAR = "2025",
        PAGES = "111041",
        BIBSOURCE = "http://www.visionbib.com/bibliography/match-pl502mmf1.html#TT110636"}

@article{bb114005,
        AUTHOR = "Zhang, D. and Bashar, M. A. and Nayak, R.",
        TITLE = "A novel multi-modal fusion method based on uncertainty-guided
meta-learning",
        JOURNAL = PR,
        VOLUME = "158",
        YEAR = "2025",
        PAGES = "110993",
        BIBSOURCE = "http://www.visionbib.com/bibliography/match-pl502mmf1.html#TT110637"}

@article{bb114006,
        AUTHOR = "Lv, T. and Ji, C. M. and Jiang, H. and Liu, Y.",
        TITLE = "{HF2TNet}: A Hierarchical Fusion Two-Stage Training Network for
Infrared and Visible Image Fusion",
        JOURNAL = SPLetters,
        VOLUME = "31",
        YEAR = "2024",
        PAGES = "3164--3168",
        BIBSOURCE = "http://www.visionbib.com/bibliography/match-pl502mmf1.html#TT110638"}

@article{bb114007,
        AUTHOR = "Meng, X. C. and Chen, C. Q. and Liu, Q. and Shao, F.",
        TITLE = "Multi-domain pseudo-reference quality evaluation for infrared and
visible image fusion",
        JOURNAL = IET-IPR,
        VOLUME = "18",
        YEAR = "2024",
        NUMBER = "13",
        PAGES = "4095--4113",
        BIBSOURCE = "http://www.visionbib.com/bibliography/match-pl502mmf1.html#TT110639"}

@article{bb114008,
        AUTHOR = "Bai, Y. and Gao, M. and Li, S. Y. and Wang, P. and Guan, N. and Yin, H. Z. and Yan, Y. H.",
        TITLE = "{IBFusion}: An Infrared and Visible Image Fusion Method Based on
Infrared Target Mask and Bimodal Feature Extraction Strategy",
        JOURNAL = MultMed,
        VOLUME = "26",
        YEAR = "2024",
        PAGES = "10610--10622",
        BIBSOURCE = "http://www.visionbib.com/bibliography/match-pl502mmf1.html#TT110640"}

@article{bb114009,
        AUTHOR = "Wang, X. X. and Fang, L. X. and Zhao, J. L. and Pan, Z. K. and Li, H. and Li, Y.",
        TITLE = "{UUD-Fusion}: An unsupervised universal image fusion approach via
generative diffusion model",
        JOURNAL = CVIU,
        VOLUME = "249",
        YEAR = "2024",
        PAGES = "104218",
        BIBSOURCE = "http://www.visionbib.com/bibliography/match-pl502mmf1.html#TT110641"}

@article{bb114010,
        AUTHOR = "Dong, A. and Wang, L. and Liu, J. and Xu, J. Y. and Zhao, G. X. and Zhai, Y. and Lv, G. H. and Cheng, J.",
        TITLE = "Co-Enhancement of Multi-Modality Image Fusion and Object Detection
via Feature Adaptation",
        JOURNAL = CirSysVideo,
        VOLUME = "34",
        YEAR = "2024",
        NUMBER = "12",
        MONTH = dec,
        PAGES = "12624--12637",
        BIBSOURCE = "http://www.visionbib.com/bibliography/match-pl502mmf1.html#TT110642"}

@article{bb114011,
        AUTHOR = "Wu, X. and Cao, Z. H. and Huang, T. Z. and Deng, L. J. and Chanussot, J. and Vivone, G.",
        TITLE = "Fully-Connected Transformer for Multi-Source Image Fusion",
        JOURNAL = PAMI,
        VOLUME = "47",
        YEAR = "2025",
        NUMBER = "3",
        MONTH = mar,
        PAGES = "2071--2088",
        BIBSOURCE = "http://www.visionbib.com/bibliography/match-pl502mmf1.html#TT110643"}

@article{bb114012,
        AUTHOR = "Cao, Z. H. and Liang, Y. J. and Deng, L. J. and Vivone, G.",
        TITLE = "An Efficient Image Fusion Network Exploiting Unifying Language and
Mask Guidance",
        JOURNAL = PAMI,
        VOLUME = "47",
        YEAR = "2025",
        NUMBER = "11",
        MONTH = nov,
        PAGES = "9845--9862",
        BIBSOURCE = "http://www.visionbib.com/bibliography/match-pl502mmf1.html#TT110644"}

@article{bb114013,
        AUTHOR = "Hussain, I. and Tan, S. Q. and Huang, J. W.",
        TITLE = "Few-Shot Based Learning Recaptured Image Detection with Multi-Scale
Feature Fusion and Attention",
        JOURNAL = PR,
        VOLUME = "161",
        YEAR = "2025",
        PAGES = "111248",
        BIBSOURCE = "http://www.visionbib.com/bibliography/match-pl502mmf1.html#TT110645"}

@article{bb114014,
        AUTHOR = "Tang, H. and Liu, D. W. and Shen, C. C.",
        TITLE = "Data-efficient multi-scale fusion vision transformer",
        JOURNAL = PR,
        VOLUME = "161",
        YEAR = "2025",
        PAGES = "111305",
        BIBSOURCE = "http://www.visionbib.com/bibliography/match-pl502mmf1.html#TT110646"}

@article{bb114015,
        AUTHOR = "Liu, T. F. and Zhang, M. Y. and Gong, M. and Zhang, Q. F. and Jiang, F. L. and Zheng, H. H. and Lu, D.",
        TITLE = "Commonality Feature Representation Learning for Unsupervised
Multimodal Change Detection",
        JOURNAL = IP,
        VOLUME = "34",
        YEAR = "2025",
        PAGES = "1219--1233",
        BIBSOURCE = "http://www.visionbib.com/bibliography/match-pl502mmf1.html#TT110647"}

@article{bb114016,
        AUTHOR = "Xu, J. J. and Liu, T. F. and Lei, T. and Chen, H. R. X. and Yokoya, N. and Lv, Z. Y. and Gong, M.",
        TITLE = "{CGSL}: Commonality graph structure learning for unsupervised
multimodal change detection",
        JOURNAL = PandRS,
        VOLUME = "229",
        YEAR = "2025",
        PAGES = "92--106",
        BIBSOURCE = "http://www.visionbib.com/bibliography/match-pl502mmf1.html#TT110648"}

@article{bb114017,
        AUTHOR = "Liu, Z. W. and Cheng, J. and Fan, J. and Lin, S. and Wang, Y. and Zhao, X. M.",
        TITLE = "Multi-Modal Fusion Based on Depth Adaptive Mechanism for {3D} Object
Detection",
        JOURNAL = MultMed,
        VOLUME = "27",
        YEAR = "2025",
        PAGES = "707--717",
        BIBSOURCE = "http://www.visionbib.com/bibliography/match-pl502mmf1.html#TT110649"}

@article{bb114018,
        AUTHOR = "Dong, C. and Wang, L. Z. and Zhang, F. and Hua, Q.",
        TITLE = "Multi-modal Few-shot Image Recognition with enhanced semantic and
visual integration",
        JOURNAL = IVC,
        VOLUME = "157",
        YEAR = "2025",
        PAGES = "105490",
        BIBSOURCE = "http://www.visionbib.com/bibliography/match-pl502mmf1.html#TT110650"}

@article{bb114019,
        AUTHOR = "Tang, L. and Liu, Y. and Tian, Y. J. and Pardalos, P. M.",
        TITLE = "Complementary label learning with multi-view data and a
semi-supervised labeling mechanism",
        JOURNAL = PR,
        VOLUME = "165",
        YEAR = "2025",
        PAGES = "111651",
        BIBSOURCE = "http://www.visionbib.com/bibliography/match-pl502mmf1.html#TT110651"}

@article{bb114020,
        AUTHOR = "Zhou, M. and Huang, J. and Yan, K. Y. and Hong, D. F. and Jia, X. P. and Chanussot, J. and Li, C. Y.",
        TITLE = "A General Spatial-Frequency Learning Framework for Multimodal Image
Fusion",
        JOURNAL = PAMI,
        VOLUME = "47",
        YEAR = "2025",
        NUMBER = "7",
        MONTH = jul,
        PAGES = "5281--5298",
        BIBSOURCE = "http://www.visionbib.com/bibliography/match-pl502mmf1.html#TT110652"}

@article{bb114021,
        AUTHOR = "Wang, Z. and Zhao, L. and Zhang, J. Z. and Song, R. and Song, H. Y. and Meng, J. and Wang, S. D.",
        TITLE = "Multi-Text Guidance Is Important: Multi-Modality Image Fusion via Large
Generative Vision-Language Model",
        JOURNAL = IJCV,
        VOLUME = "133",
        YEAR = "2025",
        NUMBER = "7",
        MONTH = jul,
        PAGES = "4646--4668",
        BIBSOURCE = "http://www.visionbib.com/bibliography/match-pl502mmf1.html#TT110653"}

@article{bb114022,
        AUTHOR = "Liu, Y. and Li, C. X. and Xu, S. K. and Han, J. G.",
        TITLE = "Part-Whole Relational Fusion Towards Multi-Modal Scene Understanding",
        JOURNAL = IJCV,
        VOLUME = "133",
        YEAR = "2025",
        NUMBER = "7",
        MONTH = jul,
        PAGES = "4483--4503",
        BIBSOURCE = "http://www.visionbib.com/bibliography/match-pl502mmf1.html#TT110654"}

@article{bb114023,
        AUTHOR = "Ravi, J. and Narmadha, R.",
        TITLE = "A Systematic Literature Review on Multimodal Image Fusion Models with
Challenges and Future Research Trends",
        JOURNAL = IJIG,
        VOLUME = "25",
        YEAR = "2025",
        NUMBER = "4",
        MONTH = jul,
        PAGES = "2550039",
        BIBSOURCE = "http://www.visionbib.com/bibliography/match-pl502mmf1.html#TT110655"}

@article{bb114024,
        AUTHOR = "Liu, Y. P. and Sun, Z. C. and Yu, B. S. and Zhao, Y. T. and Du, B. and Xu, Y. C. and Cheng, J.",
        TITLE = "{MIFNet}: Learning Modality-Invariant Features for Generalizable
Multimodal Image Matching",
        JOURNAL = IP,
        VOLUME = "34",
        YEAR = "2025",
        PAGES = "3593--3608",
        BIBSOURCE = "http://www.visionbib.com/bibliography/match-pl502mmf1.html#TT110656"}

@article{bb114025,
        AUTHOR = "Yang, Z. and Song, N. and Li, W. and Zhu, X. T. and Zhang, L. and Torr, P. H. S.",
        TITLE = "{DeepInteraction++}: Multi-Modality Interaction for Autonomous Driving",
        JOURNAL = PAMI,
        VOLUME = "47",
        YEAR = "2025",
        NUMBER = "8",
        MONTH = aug,
        PAGES = "6749--6763",
        BIBSOURCE = "http://www.visionbib.com/bibliography/match-pl502mmf1.html#TT110657"}

@article{bb114026,
        AUTHOR = "Lu, M. and Jiang, M. and Tao, X. F. and Kong, J.",
        TITLE = "{AU-Net}: Adaptive Unified Network for Joint Multi-Modal Image
Registration and Fusion",
        JOURNAL = IP,
        VOLUME = "34",
        YEAR = "2025",
        PAGES = "4721--4735",
        BIBSOURCE = "http://www.visionbib.com/bibliography/match-pl502mmf1.html#TT110658"}

@article{bb114027,
        AUTHOR = "Wang, Q. H. and Li, Z. W. and Zhang, S. Q. and Chi, N. and Dai, Q. H.",
        TITLE = "{WaveFusion}: A Novel Wavelet Vision Transformer With Saliency-Guided
Enhancement for Multimodal Image Fusion",
        JOURNAL = CirSysVideo,
        VOLUME = "35",
        YEAR = "2025",
        NUMBER = "8",
        MONTH = aug,
        PAGES = "7526--7542",
        BIBSOURCE = "http://www.visionbib.com/bibliography/match-pl502mmf1.html#TT110659"}

@article{bb114028,
        AUTHOR = "Liang, P. W. and Jiang, J. J. and Ma, Q. and Wang, C. Y. and Liu, X. M. and Ma, J. Y.",
        TITLE = "{FusionINV}: A Diffusion-Based Approach for Multimodal Image Fusion",
        JOURNAL = IP,
        VOLUME = "34",
        YEAR = "2025",
        PAGES = "5355--5368",
        BIBSOURCE = "http://www.visionbib.com/bibliography/match-pl502mmf1.html#TT110660"}

@article{bb114029,
        AUTHOR = "Shi, L. T. and Zhong, B. and Liang, Q. H. and Hu, X. T. and Mo, Z. Y. and Song, S. X.",
        TITLE = "Mamba Adapter: Efficient Multi-Modal Fusion for Vision-Language
Tracking",
        JOURNAL = CirSysVideo,
        VOLUME = "35",
        YEAR = "2025",
        NUMBER = "9",
        MONTH = sep,
        PAGES = "9300--9311",
        BIBSOURCE = "http://www.visionbib.com/bibliography/match-pl502mmf1.html#TT110661"}

@article{bb114030,
        AUTHOR = "Liu, X. Y. and Ming, R. and Du, S. L. and He, L. H. and Luo, H. B. and Xiao, G.",
        TITLE = "{HSENet}: Hierarchical Semantic-Enriched Network for Multi-Modal Image
Fusion",
        JOURNAL = PR,
        VOLUME = "170",
        YEAR = "2026",
        PAGES = "112043",
        BIBSOURCE = "http://www.visionbib.com/bibliography/match-pl502mmf1.html#TT110662"}

@article{bb114031,
        AUTHOR = "Zavras, A. and Michail, D. and Demir, B. and Papoutsis, I.",
        TITLE = "Mind the modality gap: Towards a remote sensing vision-language model
via cross-modal alignment",
        JOURNAL = PandRS,
        VOLUME = "228",
        YEAR = "2025",
        PAGES = "270--287",
        BIBSOURCE = "http://www.visionbib.com/bibliography/match-pl502mmf1.html#TT110663"}

@article{bb114032,
        AUTHOR = "Cheng, T. and Chen, H. and Zhang, X. H. and Gao, X. W. and Yin, L. and Jiao, J. B.",
        TITLE = "Multi-Channel Spatio-Temporal Data Fusion of `Big' and `Small'
Network Data Using Transformer Networks",
        JOURNAL = IJGI,
        VOLUME = "14",
        YEAR = "2025",
        NUMBER = "8",
        PAGES = "286",
        BIBSOURCE = "http://www.visionbib.com/bibliography/match-pl502mmf1.html#TT110664"}

@article{bb114033,
        AUTHOR = "Hu, J. J. and Fan, C. and Ozay, M. and Gao, Q. and Guo, Y. L. and Lam, T. L.",
        TITLE = "Robust Depth Estimation Under Sensor Degradations:
A Multi-Sensor Fusion Perspective",
        JOURNAL = PAMI,
        VOLUME = "47",
        YEAR = "2025",
        NUMBER = "10",
        MONTH = oct,
        PAGES = "8691--8707",
        BIBSOURCE = "http://www.visionbib.com/bibliography/match-pl502mmf1.html#TT110665"}

@article{bb114034,
        AUTHOR = "Xin, J. W. and Shi, B. and Wang, N. N. and Li, J. and Gao, X. B.",
        TITLE = "{MVFusion}: Generative Representation Learning With Masked Variational
Autoencoders for Multi-Modality Image Fusion",
        JOURNAL = IP,
        VOLUME = "34",
        YEAR = "2025",
        PAGES = "6418--6431",
        BIBSOURCE = "http://www.visionbib.com/bibliography/match-pl502mmf1.html#TT110666"}

@article{bb114035,
        AUTHOR = "Zheng, T. H. and Dong, G. L. and Zhang, P. P. and He, X. and Ren, C.",
        TITLE = "Plug-and-Play General Image Registration for Misaligned Multi-Modal
Image Fusion",
        JOURNAL = CirSysVideo,
        VOLUME = "35",
        YEAR = "2025",
        NUMBER = "10",
        MONTH = oct,
        PAGES = "10017--10031",
        BIBSOURCE = "http://www.visionbib.com/bibliography/match-pl502mmf1.html#TT110667"}

@article{bb114036,
        AUTHOR = "Jiao, S. C. and Long, L. and Kuang, L. Q. and Xiong, F. G. and Han, X.",
        TITLE = "Multi-modal semantic embedding network for {3D} shape recognition and
retrieval",
        JOURNAL = JVCIR,
        VOLUME = "112",
        YEAR = "2025",
        PAGES = "104559",
        BIBSOURCE = "http://www.visionbib.com/bibliography/match-pl502mmf1.html#TT110668"}

@inproceedings{bb114037,
        AUTHOR = "Xue, F. and Elflein, S. and Leal Taixe, L. and Zhou, Q.",
        TITLE = "{MATCHA}: Towards Matching Anything",
        BOOKTITLE = CVPR25,
        YEAR = "2025",
        PAGES = "27081--27091",
        BIBSOURCE = "http://www.visionbib.com/bibliography/match-pl502mmf1.html#TT110669"}

@inproceedings{bb114038,
        AUTHOR = "Shrivastava, A. and Owens, A.",
        TITLE = "Self-Supervised Spatial Correspondence Across Modalities",
        BOOKTITLE = CVPR25,
        YEAR = "2025",
        PAGES = "6383--6393",
        BIBSOURCE = "http://www.visionbib.com/bibliography/match-pl502mmf1.html#TT110670"}

@inproceedings{bb114039,
        AUTHOR = "Zhou, B. and Li, L. and Wang, Y. J. and Liu, H. F. and Yao, Y. Z. and Wang, W. G.",
        TITLE = "{UniAlign}: Scaling Multimodal Alignment within One Unified Model",
        BOOKTITLE = CVPR25,
        YEAR = "2025",
        PAGES = "29644--29655",
        BIBSOURCE = "http://www.visionbib.com/bibliography/match-pl502mmf1.html#TT110671"}

@inproceedings{bb114040,
        AUTHOR = "Hou, J. M. and Chen, X. Y. and Ran, R. and Cong, X. F. and Liu, X. Y. and You, J. W. and Deng, L. J.",
        TITLE = "Binarized Neural Network for Multi-spectral Image Fusion",
        BOOKTITLE = CVPR25,
        YEAR = "2025",
        PAGES = "2236--2245",
        BIBSOURCE = "http://www.visionbib.com/bibliography/match-pl502mmf1.html#TT110672"}

@inproceedings{bb114041,
        AUTHOR = "Li, Y. and Xing, Y. F. and Lan, X. Y. and Li, X. and Chen, H. F. and Jiang, D. M.",
        TITLE = "{AlignMamba}: Enhancing Multimodal {Mamba} with Local and Global
Cross-Modal Alignment",
        BOOKTITLE = CVPR25,
        YEAR = "2025",
        PAGES = "24774--24784",
        BIBSOURCE = "http://www.visionbib.com/bibliography/match-pl502mmf1.html#TT110673"}

@inproceedings{bb114042,
        AUTHOR = "Maniparambil, M. and Akshulakov, R. and Djilali, Y. A. D. and Narayan, S. and Singh, A. and O'Connor, N. E.",
        TITLE = "Harnessing Frozen Unimodal Encoders for Flexible Multimodal Alignment",
        BOOKTITLE = CVPR25,
        YEAR = "2025",
        PAGES = "29847--29857",
        BIBSOURCE = "http://www.visionbib.com/bibliography/match-pl502mmf1.html#TT110674"}

@inproceedings{bb114043,
        AUTHOR = "Li, H. and Hou, Y. N. and Xing, X. H. and Ma, Y. X. and Sun, X. and Zhang, Y.",
        TITLE = "{OccMamba}: Semantic Occupancy Prediction with State Space Models",
        BOOKTITLE = CVPR25,
        YEAR = "2025",
        PAGES = "11949--11959",
        BIBSOURCE = "http://www.visionbib.com/bibliography/match-pl502mmf1.html#TT110675"}

@inproceedings{bb114044,
        AUTHOR = "Chen, L. and Wang, J. and Mortlock, T. and Khargonekar, P. and Faruque, M. A. A.",
        TITLE = "Hyperdimensional Uncertainty Quantification for Multimodal
Uncertainty Fusion in Autonomous Vehicles Perception",
        BOOKTITLE = CVPR25,
        YEAR = "2025",
        PAGES = "22306--22316",
        BIBSOURCE = "http://www.visionbib.com/bibliography/match-pl502mmf1.html#TT110676"}

@inproceedings{bb114045,
        AUTHOR = "Wu, G. Y. and Liu, H. Y. and Fu, H. M. and Peng, Y. C. and Liu, J. Y. and Fan, X. and Liu, R. S.",
        TITLE = "Every {SAM} Drop Counts: Embracing Semantic Priors for Multi-Modality
Image Fusion and Beyond",
        BOOKTITLE = CVPR25,
        YEAR = "2025",
        PAGES = "17882--17891",
        BIBSOURCE = "http://www.visionbib.com/bibliography/match-pl502mmf1.html#TT110677"}

% NOTE(review): the "L:" prefix in PAGES looks like a proceedings part number in Roman numerals -- confirm before moving it to a VOLUME field.
@inproceedings{bb114046,
        AUTHOR = "Mei, S. B. and Ni, B. B. and Wang, H. and Zhao, C. L. and Hu, F. and Pi, Z. M. and Ke, B.",
        TITLE = "Object-Oriented Anchoring and Modal Alignment in Multimodal Learning",
        BOOKTITLE = ECCV24,
        YEAR = "2024",
        PAGES = "L: 179--196",
        BIBSOURCE = "http://www.visionbib.com/bibliography/match-pl502mmf1.html#TT110678"}

% NOTE(review): the "L:" prefix in PAGES looks like a proceedings part number in Roman numerals -- confirm before moving it to a VOLUME field.
@inproceedings{bb114047,
        AUTHOR = "Tran, Q. H. and Ahmed, M. and Popattia, M. and Ahmed, M. H. and Konin, A. and Zia, M. Z.",
        TITLE = "Learning by Aligning {2D} Skeleton Sequences and Multi-Modality Fusion",
        BOOKTITLE = ECCV24,
        YEAR = "2024",
        PAGES = "L: 141--161",
        BIBSOURCE = "http://www.visionbib.com/bibliography/match-pl502mmf1.html#TT110679"}

% NOTE(review): the "IV:" prefix in PAGES looks like a proceedings part number in Roman numerals -- confirm before moving it to a VOLUME field.
@inproceedings{bb114048,
        AUTHOR = "Li, C. X. and Liu, X. Y. and Wang, C. and Liu, Y. F. and Yu, W. H. and Shao, J. and Yuan, Y. X.",
        TITLE = "{GTP-4O}: Modality-prompted Heterogeneous Graph Learning for Omni-modal
Biomedical Representation",
        BOOKTITLE = ECCV24,
        YEAR = "2024",
        PAGES = "IV: 168--187",
        BIBSOURCE = "http://www.visionbib.com/bibliography/match-pl502mmf1.html#TT110680"}

@inproceedings{bb114049,
        AUTHOR = "Song, Z. Q. and Wang, L. F.",
        TITLE = "Dual Multi-Modal Feature Fusion Network for the Evaluation of
Osteosarcoma",
        BOOKTITLE = ICIP24,
        YEAR = "2024",
        PAGES = "2937--2943",
        BIBSOURCE = "http://www.visionbib.com/bibliography/match-pl502mmf1.html#TT110681"}

@inproceedings{bb114050,
        AUTHOR = "Bahaduri, B. and Ming, Z. H. and Feng, F. C. and Mokraoui, A.",
        TITLE = "Multimodal Transformer Using Cross-Channel Attention for Object
Detection in Remote Sensing Images",
        BOOKTITLE = ICIP24,
        YEAR = "2024",
        PAGES = "2620--2626",
        BIBSOURCE = "http://www.visionbib.com/bibliography/match-pl502mmf1.html#TT110682"}

@inproceedings{bb114051,
        AUTHOR = "Gao, Z. X. and Jiang, X. and Xu, X. and Shen, F. M. and Li, Y. J. and Shen, H. T.",
        TITLE = "Embracing Unimodal Aleatoric Uncertainty for Robust Multimodal Fusion",
        BOOKTITLE = CVPR24,
        YEAR = "2024",
        PAGES = "26866--26875",
        BIBSOURCE = "http://www.visionbib.com/bibliography/match-pl502mmf1.html#TT110683"}

@inproceedings{bb114052,
        AUTHOR = "Jiang, H. and Karpur, A. and Cao, B. and Huang, Q. X. and Araujo, A.",
        TITLE = "{OmniGlue}: Generalizable Feature Matching with Foundation Model
Guidance",
        BOOKTITLE = CVPR24,
        YEAR = "2024",
        PAGES = "19865--19875",
        BIBSOURCE = "http://www.visionbib.com/bibliography/match-pl502mmf1.html#TT110684"}

@inproceedings{bb114053,
        AUTHOR = "Yi, X. P. and Xu, H. and Zhang, H. and Tang, L. F. and Ma, J. Y.",
        TITLE = "{Text-IF}: Leveraging Semantic Text Guidance for Degradation-Aware and
Interactive Image Fusion",
        BOOKTITLE = CVPR24,
        YEAR = "2024",
        PAGES = "27016--27025",
        BIBSOURCE = "http://www.visionbib.com/bibliography/match-pl502mmf1.html#TT110685"}

@inproceedings{bb114054,
        AUTHOR = "Vouitsis, N. and Liu, Z. Y. and Gorti, S. K. and Villecroze, V. and Cresswell, J. C. and Yu, G. and Loaiza Ganem, G. and Volkovs, M.",
        TITLE = "Data-Efficient Multimodal Fusion on a Single {GPU}",
        BOOKTITLE = CVPR24,
        YEAR = "2024",
        PAGES = "27229--27241",
        BIBSOURCE = "http://www.visionbib.com/bibliography/match-pl502mmf1.html#TT110686"}

@inproceedings{bb114055,
        AUTHOR = "Zhao, Z. X. and Bai, H. W. and Zhang, J. S. and Zhang, Y. and Zhang, K. and Xu, S. and Chen, D. D. and Timofte, R. and Van Gool, L. J.",
        TITLE = "Equivariant Multi-Modality Image Fusion",
        BOOKTITLE = CVPR24,
        YEAR = "2024",
        PAGES = "25912--25921",
        BIBSOURCE = "http://www.visionbib.com/bibliography/match-pl502mmf1.html#TT110687"}

@inproceedings{bb114056,
        AUTHOR = "Li, X. and Li, X. S. and Ye, T. and Cheng, X. Q. and Liu, W. Y. and Tan, H.",
        TITLE = "Bridging the Gap between Multi-focus and Multi-modal: A Focused
Integration Framework for Multi-modal Image Fusion",
        BOOKTITLE = WACV24,
        YEAR = "2024",
        PAGES = "1617--1626",
        BIBSOURCE = "http://www.visionbib.com/bibliography/match-pl502mmf1.html#TT110688"}

@inproceedings{bb114057,
        AUTHOR = "Han, K. Y. and Cao, F. Z. and Shi, T. X. and Wang, P.",
        TITLE = "A Dual Attention Network for Multimodal Remote Sensing Image Matching",
        BOOKTITLE = CVIDL23,
        YEAR = "2023",
        PAGES = "128--134",
        BIBSOURCE = "http://www.visionbib.com/bibliography/match-pl502mmf1.html#TT110689"}

@inproceedings{bb114058,
        AUTHOR = "Liu, B. and Xu, Z. Q. and Bao, X. L. and Zhong, Z.",
        TITLE = "{MUNformer}: A strong encoder that uses multi-level features extracted
by different feature extractors for fusion",
        BOOKTITLE = CVIDL23,
        YEAR = "2023",
        PAGES = "291--295",
        BIBSOURCE = "http://www.visionbib.com/bibliography/match-pl502mmf1.html#TT110690"}

@inproceedings{bb114059,
        AUTHOR = "He, C. M. and Li, K. and Xu, G. X. and Zhang, Y. and Hu, R. Z. and Guo, Z. H. and Li, X.",
        TITLE = "Degradation-Resistant Unfolding Network for Heterogeneous Image
Fusion",
        BOOKTITLE = ICCV23,
        YEAR = "2023",
        PAGES = "12577--12587",
        BIBSOURCE = "http://www.visionbib.com/bibliography/match-pl502mmf1.html#TT110691"}

@inproceedings{bb114060,
        AUTHOR = "Liu, J. Y. and Liu, Z. and Wu, G. Y. and Ma, L. and Liu, R. S. and Zhong, W. and Luo, Z. X. and Fan, X.",
        TITLE = "Multi-interactive Feature Learning and a Full-time Multi-modality
Benchmark for Image Fusion and Segmentation",
        BOOKTITLE = ICCV23,
        YEAR = "2023",
        PAGES = "8081--8090",
        BIBSOURCE = "http://www.visionbib.com/bibliography/match-pl502mmf1.html#TT110692"}

@inproceedings{bb114061,
        AUTHOR = "Sippel, F. and Seiler, J. and Kaup, A.",
        TITLE = "Cross Spectral Image Reconstruction Using a Deep Guided Neural
Network",
        BOOKTITLE = ICIP23,
        YEAR = "2023",
        PAGES = "226--230",
        BIBSOURCE = "http://www.visionbib.com/bibliography/match-pl502mmf1.html#TT110693"}

@inproceedings{bb114062,
        AUTHOR = "Myers, A. and Kvinge, H. and Emerson, T.",
        TITLE = "{TopFusion}: Using Topological Feature Space for Fusion and Imputation
in Multi-Modal Data",
        BOOKTITLE = TAG-PRA23,
        YEAR = "2023",
        PAGES = "600--609",
        BIBSOURCE = "http://www.visionbib.com/bibliography/match-pl502mmf1.html#TT110694"}

@inproceedings{bb114063,
        AUTHOR = "Xue, Z. and Marculescu, R.",
        TITLE = "Dynamic Multimodal Fusion",
        BOOKTITLE = MULA23,
        YEAR = "2023",
        PAGES = "2575--2584",
        BIBSOURCE = "http://www.visionbib.com/bibliography/match-pl502mmf1.html#TT110695"}

@inproceedings{bb114064,
        AUTHOR = "Li, X. and Ma, T. and Hou, Y. N. and Shi, B. and Yang, Y. C. and Liu, Y. and Wu, X. J. and Chen, Q. and Li, Y. K. and Qiao, Y. and He, L.",
        TITLE = "{LoGoNet}: Towards Accurate {3D} Object Detection with Local-to-Global
Cross-Modal Fusion",
        BOOKTITLE = CVPR23,
        YEAR = "2023",
        PAGES = "17524--17534",
        BIBSOURCE = "http://www.visionbib.com/bibliography/match-pl502mmf1.html#TT110696"}

@inproceedings{bb114065,
        AUTHOR = "Kong, L. K. and Qi, X. S. and Shen, Q. J. and Wang, J. C. and Zhang, J. Y. and Hu, Y. and Zhou, Q. C.",
        TITLE = "Indescribable Multi-Modal Spatial Evaluator",
        BOOKTITLE = CVPR23,
        YEAR = "2023",
        PAGES = "9853--9862",
        BIBSOURCE = "http://www.visionbib.com/bibliography/match-pl502mmf1.html#TT110697"}

@inproceedings{bb114066,
        AUTHOR = "Zhao, Z. X. and Bai, H. W. and Zhang, J. S. and Zhang, Y. and Xu, S. and Lin, Z. and Timofte, R. and Van Gool, L. J.",
        TITLE = "{CDDFuse}: Correlation-Driven Dual-Branch Feature Decomposition for
Multi-Modality Image Fusion",
        BOOKTITLE = CVPR23,
        YEAR = "2023",
        PAGES = "5906--5916",
        BIBSOURCE = "http://www.visionbib.com/bibliography/match-pl502mmf1.html#TT110698"}

@inproceedings{bb114067,
        AUTHOR = "Li, Y. W. and Quan, R. J. and Zhu, L. C. and Yang, Y.",
        TITLE = "Efficient Multimodal Fusion via Interactive Prompting",
        BOOKTITLE = CVPR23,
        YEAR = "2023",
        PAGES = "2604--2613",
        BIBSOURCE = "http://www.visionbib.com/bibliography/match-pl502mmf1.html#TT110699"}

@inproceedings{bb114068,
        AUTHOR = "Wetzer, E. and Lindblad, J. and Sladoje, N.",
        TITLE = "Can Representation Learning for Multimodal Image Registration be
Improved by Supervision of Intermediate Layers?",
        BOOKTITLE = IbPRIA23,
        YEAR = "2023",
        PAGES = "261--275",
        BIBSOURCE = "http://www.visionbib.com/bibliography/match-pl502mmf1.html#TT110700"}

% NOTE(review): the "XVIII:" prefix in PAGES looks like a proceedings part number in Roman numerals -- confirm before moving it to a VOLUME field.
@inproceedings{bb114069,
        AUTHOR = "Huang, Z. B. and Liu, J. Y. and Fan, X. and Liu, R. S. and Zhong, W. and Luo, Z. X.",
        TITLE = "{ReCoNet}: Recurrent Correction Network for Fast and Efficient
Multi-modality Image Fusion",
        BOOKTITLE = ECCV22,
        YEAR = "2022",
        PAGES = "XVIII:539--555",
        BIBSOURCE = "http://www.visionbib.com/bibliography/match-pl502mmf1.html#TT110701"}

@inproceedings{bb114070,
        AUTHOR = "Duan, J. L. and Chen, L. Q. and Tran, S. and Yang, J. Y. and Xu, Y. and Zeng, B. and Chilimbi, T.",
        TITLE = "Multi-modal Alignment using Representation Codebook",
        BOOKTITLE = CVPR22,
        YEAR = "2022",
        PAGES = "15630--15639",
        BIBSOURCE = "http://www.visionbib.com/bibliography/match-pl502mmf1.html#TT110702"}

@inproceedings{bb114071,
        AUTHOR = "Xue, Z. H. and Ren, S. C. and Gao, Z. Q. and Zhao, H.",
        TITLE = "Multimodal Knowledge Expansion",
        BOOKTITLE = ICCV21,
        YEAR = "2021",
        PAGES = "834--843",
        BIBSOURCE = "http://www.visionbib.com/bibliography/match-pl502mmf1.html#TT110703"}

@inproceedings{bb114072,
        AUTHOR = "Zolfaghari, M. and Zhu, Y. and Gehler, P. and Brox, T.",
        TITLE = "{CrossCLR}: Cross-modal Contrastive Learning For Multi-modal Video
Representations",
        BOOKTITLE = ICCV21,
        YEAR = "2021",
        PAGES = "1430--1439",
        BIBSOURCE = "http://www.visionbib.com/bibliography/match-pl502mmf1.html#TT110704"}

@inproceedings{bb114073,
        AUTHOR = "Piergiovanni, A. J. and Casser, V. and Ryoo, M. S. and Angelova, A.",
        TITLE = "{4D-Net} for Learned Multi-Modal Alignment",
        BOOKTITLE = ICCV21,
        YEAR = "2021",
        PAGES = "15415--15425",
        BIBSOURCE = "http://www.visionbib.com/bibliography/match-pl502mmf1.html#TT110705"}

@inproceedings{bb114074,
        AUTHOR = "Yang, J. H. and Huang, Y. and Ma, Z. Y. and Wang, L.",
        TITLE = "{CMF}: Cascaded Multi-Model Fusion for Referring Image Segmentation",
        BOOKTITLE = ICIP21,
        YEAR = "2021",
        PAGES = "2289--2293",
        BIBSOURCE = "http://www.visionbib.com/bibliography/match-pl502mmf1.html#TT110706"}

@inproceedings{bb114075,
        AUTHOR = "Panda, R. and Chen, C. F. R. and Fan, Q. F. and Sun, X. and Saenko, K. and Oliva, A. and Feris, R. S.",
        TITLE = "{AdaMML}: Adaptive Multi-Modal Learning for Efficient Video Recognition",
        BOOKTITLE = ICCV21,
        YEAR = "2021",
        PAGES = "7556--7565",
        BIBSOURCE = "http://www.visionbib.com/bibliography/match-pl502mmf1.html#TT110707"}

@inproceedings{bb114076,
        AUTHOR = "Shi, Z. S. and Liang, J. and Li, Q. Q. and Zheng, H. Y. and Gu, Z. R. and Dong, J. Y. and Zheng, B.",
        TITLE = "Multi-Modal Multi-Action Video Recognition",
        BOOKTITLE = ICCV21,
        YEAR = "2021",
        PAGES = "13658--13667",
        BIBSOURCE = "http://www.visionbib.com/bibliography/match-pl502mmf1.html#TT110708"}

@inproceedings{bb114077,
        AUTHOR = "Huang, S. C. and Shen, L. Y. and Lungren, M. P. and Yeung, S.",
        TITLE = "{GLoRIA}: A Multimodal Global-Local Representation Learning Framework
for Label-efficient Medical Image Recognition",
        BOOKTITLE = ICCV21,
        YEAR = "2021",
        PAGES = "3922--3931",
        BIBSOURCE = "http://www.visionbib.com/bibliography/match-pl502mmf1.html#TT110709"}

@inproceedings{bb114078,
        AUTHOR = "Chen, B. and Rouditchenko, A. and Duarte, K. and Kuehne, H. and Thomas, S. and Boggust, A. and Panda, R. and Kingsbury, B. and Feris, R. S. and Harwath, D. and Glass, J. and Picheny, M. and Chang, S. F.",
        TITLE = "Multimodal Clustering Networks for Self-supervised Learning from
Unlabeled Videos",
        BOOKTITLE = ICCV21,
        YEAR = "2021",
        PAGES = "7992--8001",
        BIBSOURCE = "http://www.visionbib.com/bibliography/match-pl502mmf1.html#TT110710"}

@inproceedings{bb114079,
  author    = {Liang, T. and Lin, G.S. and Feng, L. and Zhang, Y. and Lv, F.M.},
  title     = {Attention is not Enough: Mitigating the Distribution Discrepancy in
Asynchronous Multimodal Sequence Fusion},
  booktitle = ICCV21,
  year      = {2021},
  pages     = {8128-8136},
  bibsource = {http://www.visionbib.com/bibliography/match-pl502mmf1.html#TT110711},
}

% The braces around TupleInfoNCE keep its mixed-case spelling intact when a
% bibliography style converts titles to sentence case.
@inproceedings{bb114080,
        AUTHOR = "Liu, Y.Z. and Fan, Q.N. and Zhang, S.H. and Dong, H. and Funkhouser, T. and Yi, L.",
        TITLE = "Contrastive Multimodal Fusion with {TupleInfoNCE}",
        BOOKTITLE = ICCV21,
        YEAR = "2021",
        PAGES = "734-743",
        BIBSOURCE = "http://www.visionbib.com/bibliography/match-pl502mmf1.html#TT110712"}

@inproceedings{bb114081,
  author    = {Ouerghi, H. and Mourali, O. and Zagrouba, E.},
  title     = {Multi-modal Image Fusion Based on Weight Local Features and Novel
Sum-modified-laplacian in Non-subsampled Shearlet Transform Domain},
  booktitle = ISVC20,
  year      = {2020},
  pages     = {II:166-179},
  bibsource = {http://www.visionbib.com/bibliography/match-pl502mmf1.html#TT110713},
}

% The braces around MFAS keep the acronym in capitals when a bibliography
% style converts titles to sentence case.
@inproceedings{bb114082,
        AUTHOR = "Perez Rua, J.M. and Vielzeuf, V. and Pateux, S. and Baccouche, M. and Jurie, F.",
        TITLE = "{MFAS}: Multimodal Fusion Architecture Search",
        BOOKTITLE = CVPR19,
        YEAR = "2019",
        PAGES = "6959-6968",
        BIBSOURCE = "http://www.visionbib.com/bibliography/match-pl502mmf1.html#TT110714"}

@inproceedings{bb114083,
  author    = {Sun, S.H. and Hu, J. and Yao, M.Q. and Hu, J.R. and Yang, X.D. and Song, Q. and Wu, X.},
  title     = {Robust Multimodal Image Registration Using Deep Recurrent Reinforcement
Learning},
  booktitle = ACCV18,
  year      = {2018},
  pages     = {II:511-526},
  bibsource = {http://www.visionbib.com/bibliography/match-pl502mmf1.html#TT110715},
}

% The braces around CentralNet keep its internal capital N when a
% bibliography style converts titles to sentence case.
@inproceedings{bb114084,
        AUTHOR = "Vielzeuf, V. and Lechervy, A. and Pateux, S. and Jurie, F.",
        TITLE = "{CentralNet}: A Multilayer Approach for Multimodal Fusion",
        BOOKTITLE = MultLearnApp18,
        YEAR = "2018",
        PAGES = "VI:575-589",
        BIBSOURCE = "http://www.visionbib.com/bibliography/match-pl502mmf1.html#TT110716"}

@inproceedings{bb114085,
  author    = {Son, C.H. and Zhang, X.P.},
  title     = {Multimodal fusion via a series of transfers for noise removal},
  booktitle = ICIP17,
  year      = {2017},
  pages     = {530-534},
  bibsource = {http://www.visionbib.com/bibliography/match-pl502mmf1.html#TT110717},
}

@inproceedings{bb114086,
  author    = {Shrivastava, A. and Rastegari, M. and Shekhar, S. and Chellappa, R. and Davis, L.S.},
  title     = {Class consistent multi-modal fusion with binary features},
  booktitle = CVPR15,
  year      = {2015},
  pages     = {2282-2291},
  bibsource = {http://www.visionbib.com/bibliography/match-pl502mmf1.html#TT110718},
}

@inproceedings{bb114087,
  author    = {Kasiri, K. and Fieguth, P.W. and Clausi, D.A.},
  title     = {Self-similarity measure for multi-modal image registration},
  booktitle = ICIP16,
  year      = {2016},
  pages     = {4498-4502},
  bibsource = {http://www.visionbib.com/bibliography/match-pl502mmf1.html#TT110719},
}

@inproceedings{bb114088,
  author    = {Kasiri, K. and Fieguth, P.W. and Clausi, D.A.},
  title     = {Structural Representations for Multi-modal Image Registration Based on
Modified Entropy},
  booktitle = ICIAR15,
  year      = {2015},
  pages     = {82-89},
  bibsource = {http://www.visionbib.com/bibliography/match-pl502mmf1.html#TT110720},
}

@inproceedings{bb114089,
  author    = {Zhang, H. and Chen, L. and Liu, J. and Yuan, J.S.},
  title     = {Hierarchical multi-feature fusion for multimodal data analysis},
  booktitle = ICIP14,
  year      = {2014},
  pages     = {5916-5920},
  bibsource = {http://www.visionbib.com/bibliography/match-pl502mmf1.html#TT110721},
}

% PAGES uses the volume-prefix form without a space after the colon, matching
% the other volume-prefixed page fields in this file (e.g. II:166-179).
@inproceedings{bb114090,
        AUTHOR = "Shen, X.Y. and Xu, L. and Zhang, Q. and Jia, J.Y.",
        TITLE = "Multi-modal and Multi-spectral Registration for Natural Images",
        BOOKTITLE = ECCV14,
        YEAR = "2014",
        PAGES = "IV:309-324",
        BIBSOURCE = "http://www.visionbib.com/bibliography/match-pl502mmf1.html#TT110722"}

% The braces around the proper nouns Tsallis and Renyi's keep their capitals
% when a bibliography style converts titles to sentence case.
@inproceedings{bb114091,
        AUTHOR = "Sahoo, S. and Nanda, P.K. and Samant, S.",
        TITLE = "{Tsallis} and {Renyi's} embedded entropy based mutual information for
multimodal image registration",
        BOOKTITLE = NCVPRIPG13,
        YEAR = "2013",
        PAGES = "1-4",
        BIBSOURCE = "http://www.visionbib.com/bibliography/match-pl502mmf1.html#TT110723"}

@inproceedings{bb114092,
  author    = {Kim, M.J. and Han, D.K. and Ko, H.S.},
  title     = {Multimodal image fusion via sparse representation with local patch
dictionaries},
  booktitle = ICIP13,
  year      = {2013},
  pages     = {1301-1305},
  bibsource = {http://www.visionbib.com/bibliography/match-pl502mmf1.html#TT110724},
}

% The braces around the proper noun Markov keep its capital when a
% bibliography style converts titles to sentence case.
@inproceedings{bb114093,
        AUTHOR = "Glodek, M. and Schels, M. and Palm, G. and Schwenker, F.",
        TITLE = "Multi-modal Fusion based on classifiers using reject options and {Markov}
Fusion Networks",
        BOOKTITLE = ICPR12,
        YEAR = "2012",
        PAGES = "1084-1087",
        BIBSOURCE = "http://www.visionbib.com/bibliography/match-pl502mmf1.html#TT110725"}

@inproceedings{bb114094,
  author    = {Forsberg, D. and Farneback, G. and Knutsson, H. and Westin, C.F.},
  title     = {Multi-modal Image Registration Using Polynomial Expansion and Mutual
Information},
  booktitle = WBIR12,
  year      = {2012},
  pages     = {40-49},
  bibsource = {http://www.visionbib.com/bibliography/match-pl502mmf1.html#TT110726},
}

% NOTE(review): the third author was listed as "Jueng Ling, K.", which looks
% like a wrongly split surname; it is written here as the single surname
% Juengling (ASCII form, u-umlaut as "ue"). Confirm against the ICIP 2010
% proceedings.
@inproceedings{bb114095,
        AUTHOR = "Bodensteiner, C. and Huebner, W. and Juengling, K. and Mueller, J. and Arens, M.",
        TITLE = "Local multi-modal image matching based on self-similarity",
        BOOKTITLE = ICIP10,
        YEAR = "2010",
        PAGES = "937-940",
        BIBSOURCE = "http://www.visionbib.com/bibliography/match-pl502mmf1.html#TT110727"}

@inproceedings{bb114096,
  author    = {Vegh, V. and Yang, Z.Y. and Tieng, Q.M. and Reutens, D.C.},
  title     = {Multimodal image registration using stochastic differential equation
optimization},
  booktitle = ICIP10,
  year      = {2010},
  pages     = {4385-4388},
  bibsource = {http://www.visionbib.com/bibliography/match-pl502mmf1.html#TT110728},
}

@inproceedings{bb114097,
  author    = {Peng, T.Y. and Yigitsoy, M. and Eslami, A. and Bayer, C. and Navab, N.},
  title     = {Deformable Registration of Multi-modal Microscopic Images Using a
Pyramidal Interactive Registration-Learning Methodology},
  booktitle = WBIR14,
  year      = {2014},
  pages     = {144-153},
  bibsource = {http://www.visionbib.com/bibliography/match-pl502mmf1.html#TT110729},
}

% PAGES is omitted on purpose: the source record carried only the placeholder
% "xx-yy", which a bibliography style would print literally as a page range.
% TODO: add the real page numbers once they are known.
@inproceedings{bb114098,
        AUTHOR = "Wachinger, C. and Navab, N.",
        TITLE = "Manifold Learning for Multi-modal Image Registration",
        BOOKTITLE = BMVC10,
        YEAR = "2010",
        BIBSOURCE = "http://www.visionbib.com/bibliography/match-pl502mmf1.html#TT110730"}

@inproceedings{bb114099,
  author    = {Xu, J. and Yuan, J.S. and Wu, Y.},
  title     = {Multimodal Partial Estimates Fusion},
  booktitle = ICCV09,
  year      = {2009},
  pages     = {2177-2184},
  bibsource = {http://www.visionbib.com/bibliography/match-pl502mmf1.html#TT110731},
}

Last update: Nov 26, 2025 at 20:24:09