@article{bb116700,
AUTHOR = "Lu, M. and Jiang, M. and Tao, X. F. and Kong, J.",
TITLE = "{AU-Net}: Adaptive Unified Network for Joint Multi-Modal Image
Registration and Fusion",
JOURNAL = IP,
VOLUME = "34",
YEAR = "2025",
PAGES = "4721--4735",
BIBSOURCE = "http://www.visionbib.com/bibliography/match-pl502mmf1.html#TT113289"}
@article{bb116701,
AUTHOR = "Wang, Q. H. and Li, Z. W. and Zhang, S. Q. and Chi, N. and Dai, Q. H.",
TITLE = "{WaveFusion}: A Novel Wavelet Vision Transformer With Saliency-Guided
Enhancement for Multimodal Image Fusion",
JOURNAL = CirSysVideo,
VOLUME = "35",
YEAR = "2025",
NUMBER = "8",
MONTH = aug,
PAGES = "7526--7542",
BIBSOURCE = "http://www.visionbib.com/bibliography/match-pl502mmf1.html#TT113290"}
@article{bb116702,
AUTHOR = "Liang, P. W. and Jiang, J. J. and Ma, Q. and Wang, C. Y. and Liu, X. M. and Ma, J. Y.",
TITLE = "{FusionINV}: A Diffusion-Based Approach for Multimodal Image Fusion",
JOURNAL = IP,
VOLUME = "34",
YEAR = "2025",
PAGES = "5355--5368",
BIBSOURCE = "http://www.visionbib.com/bibliography/match-pl502mmf1.html#TT113291"}
@article{bb116703,
AUTHOR = "Shi, L. T. and Zhong, B. and Liang, Q. H. and Hu, X. T. and Mo, Z. Y. and Song, S. X.",
TITLE = "{Mamba} Adapter: Efficient Multi-Modal Fusion for Vision-Language
Tracking",
JOURNAL = CirSysVideo,
VOLUME = "35",
YEAR = "2025",
NUMBER = "9",
MONTH = sep,
PAGES = "9300--9311",
BIBSOURCE = "http://www.visionbib.com/bibliography/match-pl502mmf1.html#TT113292"}
@article{bb116704,
AUTHOR = "Liu, X. Y. and Ming, R. and Du, S. L. and He, L. H. and Luo, H. B. and Xiao, G.",
TITLE = "{HSENet}: Hierarchical Semantic-Enriched Network for Multi-Modal Image
Fusion",
JOURNAL = PR,
VOLUME = "170",
YEAR = "2026",
PAGES = "112043",
BIBSOURCE = "http://www.visionbib.com/bibliography/match-pl502mmf1.html#TT113293"}
@article{bb116705,
AUTHOR = "Zavras, A. and Michail, D. and Demir, B. and Papoutsis, I.",
TITLE = "Mind the modality gap: Towards a remote sensing vision-language model
via cross-modal alignment",
JOURNAL = PandRS,
VOLUME = "228",
YEAR = "2025",
PAGES = "270--287",
BIBSOURCE = "http://www.visionbib.com/bibliography/match-pl502mmf1.html#TT113294"}
@article{bb116706,
AUTHOR = "Cheng, T. and Chen, H. and Zhang, X. H. and Gao, X. W. and Yin, L. and Jiao, J. B.",
TITLE = "Multi-Channel Spatio-Temporal Data Fusion of `Big' and `Small'
Network Data Using Transformer Networks",
JOURNAL = IJGI,
VOLUME = "14",
YEAR = "2025",
NUMBER = "8",
PAGES = "286",
BIBSOURCE = "http://www.visionbib.com/bibliography/match-pl502mmf1.html#TT113295"}
@article{bb116707,
AUTHOR = "Hu, J. J. and Fan, C. and Ozay, M. and Gao, Q. and Guo, Y. L. and Lam, T. L.",
TITLE = "Robust Depth Estimation Under Sensor Degradations:
A Multi-Sensor Fusion Perspective",
JOURNAL = PAMI,
VOLUME = "47",
YEAR = "2025",
NUMBER = "10",
MONTH = oct,
PAGES = "8691--8707",
BIBSOURCE = "http://www.visionbib.com/bibliography/match-pl502mmf1.html#TT113296"}
@article{bb116708,
AUTHOR = "Xin, J. W. and Shi, B. and Wang, N. N. and Li, J. and Gao, X. B.",
TITLE = "{MVFusion}: Generative Representation Learning With Masked Variational
Autoencoders for Multi-Modality Image Fusion",
JOURNAL = IP,
VOLUME = "34",
YEAR = "2025",
PAGES = "6418--6431",
BIBSOURCE = "http://www.visionbib.com/bibliography/match-pl502mmf1.html#TT113297"}
@article{bb116709,
AUTHOR = "Zheng, T. H. and Dong, G. L. and Zhang, P. P. and He, X. and Ren, C.",
TITLE = "Plug-and-Play General Image Registration for Misaligned Multi-Modal
Image Fusion",
JOURNAL = CirSysVideo,
VOLUME = "35",
YEAR = "2025",
NUMBER = "10",
MONTH = oct,
PAGES = "10017--10031",
BIBSOURCE = "http://www.visionbib.com/bibliography/match-pl502mmf1.html#TT113298"}
@article{bb116710,
AUTHOR = "Jiao, S. C. and Long, L. and Kuang, L. Q. and Xiong, F. G. and Han, X.",
TITLE = "Multi-modal semantic embedding network for {3D} shape recognition and
retrieval",
JOURNAL = JVCIR,
VOLUME = "112",
YEAR = "2025",
PAGES = "104559",
BIBSOURCE = "http://www.visionbib.com/bibliography/match-pl502mmf1.html#TT113299"}
@article{bb116711,
AUTHOR = "Sun, H. and Lv, L. and Zhang, P. P. and Tang, T. D. and Tian, F. and Sun, W. B. and Lu, H. C.",
TITLE = "Spatial-Frequency Enhanced {Mamba} for Multi-Modal Image Fusion",
JOURNAL = IP,
VOLUME = "34",
YEAR = "2025",
PAGES = "7684--7696",
BIBSOURCE = "http://www.visionbib.com/bibliography/match-pl502mmf1.html#TT113300"}
@article{bb116712,
AUTHOR = "Zhu, Y. X. and Lv, L. and Zhang, P. P. and Liu, X. H. and Tang, T. D. and Tian, F. and Sun, W. B. and Lu, H. C.",
TITLE = "Interactive Spatial-Frequency Fusion {Mamba} for Multi-Modal Image
Fusion",
JOURNAL = IP,
VOLUME = "35",
YEAR = "2026",
PAGES = "2380--2392",
BIBSOURCE = "http://www.visionbib.com/bibliography/match-pl502mmf1.html#TT113301"}
@article{bb116713,
AUTHOR = "Sun, Y. J. and Dong, W. S. and Wang, S. and Wu, P. and Feng, M. T. and Li, X. and Shi, G. M.",
TITLE = "Distilling Hierarchical Knowledge From Multimodal Fusion for Unimodal
Image Segmentation",
JOURNAL = CirSysVideo,
VOLUME = "35",
YEAR = "2025",
NUMBER = "12",
MONTH = dec,
PAGES = "11797--11809",
BIBSOURCE = "http://www.visionbib.com/bibliography/match-pl502mmf1.html#TT113302"}
@article{bb116714,
AUTHOR = "Yu, C. B. and Pei, Z. H. and Wang, X. R. and Zhou, H. B.",
TITLE = "{CrossGlue}: Cross-Modal Image matching via potential message
investigation and visual-gradient message integration",
JOURNAL = JVCIR,
VOLUME = "114",
YEAR = "2026",
PAGES = "104620",
BIBSOURCE = "http://www.visionbib.com/bibliography/match-pl502mmf1.html#TT113303"}
@article{bb116715,
AUTHOR = "Zhou, D. D. and Xu, L. and Wu, K. and Liu, H. Z. and Jiang, M. T.",
TITLE = "{DSEPGAN}: A Dual-Stream Enhanced Pyramid Based on Generative
Adversarial Network for Spatiotemporal Image Fusion",
JOURNAL = RS,
VOLUME = "17",
YEAR = "2025",
NUMBER = "24",
PAGES = "4050",
BIBSOURCE = "http://www.visionbib.com/bibliography/match-pl502mmf1.html#TT113304"}
@article{bb116716,
AUTHOR = "Jiang, J. L. and Hu, G. and Sheng, G. L. and Wei, G.",
TITLE = "{PSG-MCANet}: Multi-order cross-attention modeling for multimodal
fusion based on punning semantic guidance",
JOURNAL = PR,
VOLUME = "172",
YEAR = "2026",
PAGES = "112723",
BIBSOURCE = "http://www.visionbib.com/bibliography/match-pl502mmf1.html#TT113305"}
@article{bb116717,
AUTHOR = "Li, M. Y. and Meng, C. and Fan, X. D.",
TITLE = "Iterative optimal transport for multimodal image registration",
JOURNAL = PR,
VOLUME = "172",
YEAR = "2026",
PAGES = "112736",
BIBSOURCE = "http://www.visionbib.com/bibliography/match-pl502mmf1.html#TT113306"}
@article{bb116718,
AUTHOR = "Wang, Y. X. and Shen, Z. W. and Li, H. and Zhang, Y. N. and Xia, Z. P.",
TITLE = "{SGCNet}: Silhouette Guided Cascaded Network for Multi-Modal Image
Fusion",
JOURNAL = CVIU,
VOLUME = "263",
YEAR = "2026",
PAGES = "104603",
BIBSOURCE = "http://www.visionbib.com/bibliography/match-pl502mmf1.html#TT113307"}
@article{bb116719,
AUTHOR = "He, D. and Wang, G. F. and Li, W. S. and Shu, Y. C. and Li, W. B. and Yang, L. J. and Huang, Y. P. and Li, F. Y.",
TITLE = "Rethinking normalization strategies and convolutional kernels for
multimodal image fusion",
JOURNAL = PR,
VOLUME = "173",
YEAR = "2026",
PAGES = "112903",
BIBSOURCE = "http://www.visionbib.com/bibliography/match-pl502mmf1.html#TT113308"}
@article{bb116720,
AUTHOR = "Li, S. T. and Tang, H.",
TITLE = "Multimodal Alignment and Fusion: A Survey",
JOURNAL = IJCV,
VOLUME = "134",
YEAR = "2026",
NUMBER = "1",
MONTH = jan,
PAGES = "103",
BIBSOURCE = "http://www.visionbib.com/bibliography/match-pl502mmf1.html#TT113309"}
@article{bb116721,
AUTHOR = "Fu, Y. and Ye, X. and Kong, X. Y.",
TITLE = "{KPTFusion}: Knowledge Prior-based Task-Driven Multimodal Image Fusion",
JOURNAL = IVC,
VOLUME = "167",
YEAR = "2026",
PAGES = "105886",
BIBSOURCE = "http://www.visionbib.com/bibliography/match-pl502mmf1.html#TT113310"}
@article{bb116722,
AUTHOR = "Qin, X. R. and Cui, Y. N. and Sun, S. Q. and Chen, R. and Ren, W. Q. and Knoll, A. and Cao, X. C.",
TITLE = "Disentangle to Fuse: Toward Content Preservation and Cross-Modality
Consistency for Multi-Modality Image Fusion",
JOURNAL = IP,
VOLUME = "35",
YEAR = "2026",
PAGES = "1756--1770",
BIBSOURCE = "http://www.visionbib.com/bibliography/match-pl502mmf1.html#TT113311"}
@article{bb116723,
AUTHOR = "Chen, H. and Zhou, H. R. and Zhang, Y. and Lin, Z. and Deng, Y. J.",
TITLE = "Dissecting {RGB-D} Learning for Improved Multi-Modal Fusion",
JOURNAL = IP,
VOLUME = "35",
YEAR = "2026",
PAGES = "1846--1857",
BIBSOURCE = "http://www.visionbib.com/bibliography/match-pl502mmf1.html#TT113312"}
@article{bb116724,
AUTHOR = "Zhang, J. J. and Zhao, F. and Liu, H. Q. and Yu, J.",
TITLE = "Generative Information-Guided Heterogeneous Cross-Fusion Network With
Contrastive Learning for Multimodal Remote Sensing Image
Classification",
JOURNAL = CirSysVideo,
VOLUME = "36",
YEAR = "2026",
NUMBER = "2",
MONTH = feb,
PAGES = "1876--1892",
BIBSOURCE = "http://www.visionbib.com/bibliography/match-pl502mmf1.html#TT113313"}
@article{bb116725,
AUTHOR = "Mutakabbir, A. and Lung, C. H. and Zaman, M. and Upadhyay, D. and Naik, K. and Millard, K. and Ravichandran, T. and Purcell, R.",
TITLE = "{NOAH}: A Multi-Modal and Sensor Fusion Dataset for Generative Modeling
in Remote Sensing",
JOURNAL = RS,
VOLUME = "18",
YEAR = "2026",
NUMBER = "3",
PAGES = "466",
BIBSOURCE = "http://www.visionbib.com/bibliography/match-pl502mmf1.html#TT113314"}
@article{bb116726,
AUTHOR = "Rao, J. H. and Liu, R. and Guan, J. J. and Tian, X.",
TITLE = "{AMS-Former}: Adaptive multi-scale transformer for multi-modal image
matching",
JOURNAL = PandRS,
VOLUME = "232",
YEAR = "2026",
PAGES = "957--973",
BIBSOURCE = "http://www.visionbib.com/bibliography/match-pl502mmf1.html#TT113315"}
@article{bb116727,
AUTHOR = "Cao, J. Z. and Chen, J. S. and Wang, X. X. and Huang, W. M. and Chen, D. S. and Zhao, T. H. and Tu, W. and Li, Q. Q.",
TITLE = "{UrbanMMCL}: Urban region representations via multi-modal and
multi-graph self-supervised contrastive learning",
JOURNAL = PandRS,
VOLUME = "232",
YEAR = "2026",
PAGES = "75--93",
BIBSOURCE = "http://www.visionbib.com/bibliography/match-pl502mmf1.html#TT113316"}
@article{bb116728,
AUTHOR = "Ying, Z. H. and Guo, J. and Li, Y. S. and Gao, Y. and Li, C. Y.",
TITLE = "{Diff-Transformer}: Heterogeneous Feature Fusion Network for
Multisource Remote Sensing Classification",
JOURNAL = CirSysVideo,
VOLUME = "36",
YEAR = "2026",
NUMBER = "2",
MONTH = feb,
PAGES = "1501--1516",
BIBSOURCE = "http://www.visionbib.com/bibliography/match-pl502mmf1.html#TT113317"}
@article{bb116729,
AUTHOR = "Li, J. Y. and Jiang, C. J. and Jiang, J. J. and Liang, P. W. and Ma, J. Y. and Nie, L. Q.",
TITLE = "Towards Unified Semantic and Controllable Image Fusion: A Diffusion
Transformer Approach",
JOURNAL = PAMI,
VOLUME = "48",
YEAR = "2026",
NUMBER = "4",
MONTH = apr,
PAGES = "3970--3987",
BIBSOURCE = "http://www.visionbib.com/bibliography/match-pl502mmf1.html#TT113318"}
@article{bb116730,
AUTHOR = "Panda, G. and Kundu, S. and Bhattacharya, S. and Routray, A.",
TITLE = "{$L_0$}-Regularized Sparse Coding-Based Interpretable Network for
Multi-Modal Image Fusion",
JOURNAL = PAMI,
VOLUME = "48",
YEAR = "2026",
NUMBER = "4",
MONTH = apr,
PAGES = "4081--4097",
BIBSOURCE = "http://www.visionbib.com/bibliography/match-pl502mmf1.html#TT113319"}
@article{bb116731,
AUTHOR = "Kamara, A. A. and He, S. and Fofanah, A. J.",
TITLE = "{FAMAFuse}: Functional-Anatomical Multiscale Attention for Multimodal
Image Fusion",
JOURNAL = CirSysVideo,
VOLUME = "36",
YEAR = "2026",
NUMBER = "3",
MONTH = mar,
PAGES = "3215--3230",
BIBSOURCE = "http://www.visionbib.com/bibliography/match-pl502mmf1.html#TT113320"}
@article{bb116732,
AUTHOR = "Fan, J. and Bocus, M. J. and Shu, S. L.",
TITLE = "Embodied multi-modal data fusion via geometry anchoring for
continuous perception in ground robots",
JOURNAL = PRL,
VOLUME = "203",
YEAR = "2026",
PAGES = "162--169",
BIBSOURCE = "http://www.visionbib.com/bibliography/match-pl502mmf1.html#TT113321"}
@article{bb116733,
AUTHOR = "Zhang, L. and Yang, Y. G. and He, Z. S. and Li, G. L. and Zhao, F. and Hua, W. Q. and Xiao, G. W. and Zhang, J. Y.",
TITLE = "Multimodal Remote Sensing Image Classification Based on Dynamic Group
Convolution and Bidirectional Guided Cross-Attention Fusion",
JOURNAL = RS,
VOLUME = "18",
YEAR = "2026",
NUMBER = "7",
PAGES = "1066",
BIBSOURCE = "http://www.visionbib.com/bibliography/match-pl502mmf1.html#TT113322"}
@article{bb116734,
AUTHOR = "Yu, M. and Lu, X. and Yang, Z. and Gao, D. and Zhong, G. Q.",
TITLE = "{DAMFusion}: Multi-Spectral Image Segmentation via Competitive Query
and Boundary Region Attention",
JOURNAL = RS,
VOLUME = "18",
YEAR = "2026",
NUMBER = "7",
PAGES = "1064",
BIBSOURCE = "http://www.visionbib.com/bibliography/match-pl502mmf1.html#TT113323"}
@article{bb116735,
  author    = {Yang, J. and Chung, H. and Jang, I.},
  title     = {Hierarchical mutual distillation for multi-view fusion: Learning from
               all possible view combinations},
  journal   = PR,
  volume    = {178},
  year      = {2026},
  pages     = {113432},
  bibsource = {http://www.visionbib.com/bibliography/match-pl502mmf1.html#TT113324},
}
@article{bb116736,
AUTHOR = "Pan, Y. J. and Shi, Y. C. and Yu, C. and Kong, X. Z. and Zhang, Y. and Xiao, N.",
TITLE = "Beyond a single perspective: A multi-agent debate framework for
affective computing",
JOURNAL = PR,
VOLUME = "178",
YEAR = "2026",
PAGES = "113445",
BIBSOURCE = "http://www.visionbib.com/bibliography/match-pl502mmf1.html#TT113325"}
@article{bb116737,
AUTHOR = "Yang, A. and Liu, B. Q. and Liu, M. Z. and Ding, H. H. and Mo, P. J. and Zhao, C. Q. and Liu, X. H. and Ye, T.",
TITLE = "{RIF-Fuse}: Invertible Frequency Decomposition with Residual
Enhancement for Robust Multimodal Fusion",
JOURNAL = RS,
VOLUME = "18",
YEAR = "2026",
NUMBER = "10",
PAGES = "1520",
BIBSOURCE = "http://www.visionbib.com/bibliography/match-pl502mmf1.html#TT113326"}
@inproceedings{bb116738,
AUTHOR = "Xue, F. and Elflein, S. and Leal Taixe, L. and Zhou, Q.",
TITLE = "{MATCHA}: Towards Matching Anything",
BOOKTITLE = CVPR25,
YEAR = "2025",
PAGES = "27081--27091",
BIBSOURCE = "http://www.visionbib.com/bibliography/match-pl502mmf1.html#TT113327"}
@inproceedings{bb116739,
AUTHOR = "Zhou, B. and Li, L. and Wang, Y. J. and Liu, H. F. and Yao, Y. Z. and Wang, W. G.",
TITLE = "{UniAlign}: Scaling Multimodal Alignment within One Unified Model",
BOOKTITLE = CVPR25,
YEAR = "2025",
PAGES = "29644--29655",
BIBSOURCE = "http://www.visionbib.com/bibliography/match-pl502mmf1.html#TT113328"}
@inproceedings{bb116740,
AUTHOR = "Hou, J. M. and Chen, X. Y. and Ran, R. and Cong, X. F. and Liu, X. Y. and You, J. W. and Deng, L. J.",
TITLE = "Binarized Neural Network for Multi-spectral Image Fusion",
BOOKTITLE = CVPR25,
YEAR = "2025",
PAGES = "2236--2245",
BIBSOURCE = "http://www.visionbib.com/bibliography/match-pl502mmf1.html#TT113329"}
@inproceedings{bb116741,
AUTHOR = "Li, Y. and Xing, Y. F. and Lan, X. Y. and Li, X. and Chen, H. F. and Jiang, D. M.",
TITLE = "{AlignMamba}: Enhancing Multimodal {Mamba} with Local and Global
Cross-Modal Alignment",
BOOKTITLE = CVPR25,
YEAR = "2025",
PAGES = "24774--24784",
BIBSOURCE = "http://www.visionbib.com/bibliography/match-pl502mmf1.html#TT113330"}
@inproceedings{bb116742,
AUTHOR = "Maniparambil, M. and Akshulakov, R. and Djilali, Y. A. D. and Narayan, S. and Singh, A. and O'Connor, N. E.",
TITLE = "Harnessing Frozen Unimodal Encoders for Flexible Multimodal Alignment",
BOOKTITLE = CVPR25,
YEAR = "2025",
PAGES = "29847--29857",
BIBSOURCE = "http://www.visionbib.com/bibliography/match-pl502mmf1.html#TT113331"}
@inproceedings{bb116743,
AUTHOR = "Li, H. and Hou, Y. N. and Xing, X. H. and Ma, Y. X. and Sun, X. and Zhang, Y.",
TITLE = "{OccMamba}: Semantic Occupancy Prediction with State Space Models",
BOOKTITLE = CVPR25,
YEAR = "2025",
PAGES = "11949--11959",
BIBSOURCE = "http://www.visionbib.com/bibliography/match-pl502mmf1.html#TT113332"}
@inproceedings{bb116744,
AUTHOR = "Wu, G. Y. and Liu, H. Y. and Fu, H. M. and Peng, Y. C. and Liu, J. Y. and Fan, X. and Liu, R. S.",
TITLE = "Every {SAM} Drop Counts: Embracing Semantic Priors for Multi-Modality
Image Fusion and Beyond",
BOOKTITLE = CVPR25,
YEAR = "2025",
PAGES = "17882--17891",
BIBSOURCE = "http://www.visionbib.com/bibliography/match-pl502mmf1.html#TT113333"}
@inproceedings{bb116745,
AUTHOR = "Tran, Q. H. and Ahmed, M. and Popattia, M. and Ahmed, M. H. and Konin, A. and Zia, M. Z.",
TITLE = "Learning by Aligning {2D} Skeleton Sequences and Multi-Modality Fusion",
BOOKTITLE = ECCV24,
VOLUME = "L",
YEAR = "2024",
PAGES = "141--161",
BIBSOURCE = "http://www.visionbib.com/bibliography/match-pl502mmf1.html#TT113334"}
@inproceedings{bb116746,
AUTHOR = "Li, C. X. and Liu, X. Y. and Wang, C. and Liu, Y. F. and Yu, W. H. and Shao, J. and Yuan, Y. X.",
TITLE = "{GTP-4O}: Modality-prompted Heterogeneous Graph Learning for Omni-modal
Biomedical Representation",
BOOKTITLE = ECCV24,
VOLUME = "IV",
YEAR = "2024",
PAGES = "168--187",
BIBSOURCE = "http://www.visionbib.com/bibliography/match-pl502mmf1.html#TT113335"}
@inproceedings{bb116747,
AUTHOR = "Song, Z. Q. and Wang, L. F.",
TITLE = "Dual Multi-Modal Feature Fusion Network for the Evaluation of
Osteosarcoma",
BOOKTITLE = ICIP24,
YEAR = "2024",
PAGES = "2937--2943",
BIBSOURCE = "http://www.visionbib.com/bibliography/match-pl502mmf1.html#TT113336"}
@inproceedings{bb116748,
AUTHOR = "Gao, Z. X. and Jiang, X. and Xu, X. and Shen, F. M. and Li, Y. J. and Shen, H. T.",
TITLE = "Embracing Unimodal Aleatoric Uncertainty for Robust Multimodal Fusion",
BOOKTITLE = CVPR24,
YEAR = "2024",
PAGES = "26866--26875",
BIBSOURCE = "http://www.visionbib.com/bibliography/match-pl502mmf1.html#TT113337"}
@inproceedings{bb116749,
AUTHOR = "Jiang, H. and Karpur, A. and Cao, B. and Huang, Q. X. and Araujo, A.",
TITLE = "{OmniGlue}: Generalizable Feature Matching with Foundation Model
Guidance",
BOOKTITLE = CVPR24,
YEAR = "2024",
PAGES = "19865--19875",
BIBSOURCE = "http://www.visionbib.com/bibliography/match-pl502mmf1.html#TT113338"}
@inproceedings{bb116750,
AUTHOR = "Yi, X. P. and Xu, H. and Zhang, H. and Tang, L. F. and Ma, J. Y.",
TITLE = "{Text-IF}: Leveraging Semantic Text Guidance for Degradation-Aware and
Interactive Image Fusion",
BOOKTITLE = CVPR24,
YEAR = "2024",
PAGES = "27016--27025",
BIBSOURCE = "http://www.visionbib.com/bibliography/match-pl502mmf1.html#TT113339"}
@inproceedings{bb116751,
AUTHOR = "Vouitsis, N. and Liu, Z. Y. and Gorti, S. K. and Villecroze, V. and Cresswell, J. C. and Yu, G. and Loaiza Ganem, G. and Volkovs, M.",
TITLE = "Data-Efficient Multimodal Fusion on a Single {GPU}",
BOOKTITLE = CVPR24,
YEAR = "2024",
PAGES = "27229--27241",
BIBSOURCE = "http://www.visionbib.com/bibliography/match-pl502mmf1.html#TT113340"}
@inproceedings{bb116752,
AUTHOR = "Zhao, Z. X. and Bai, H. W. and Zhang, J. S. and Zhang, Y. and Zhang, K. and Xu, S. and Chen, D. D. and Timofte, R. and Van Gool, L. J.",
TITLE = "Equivariant Multi-Modality Image Fusion",
BOOKTITLE = CVPR24,
YEAR = "2024",
PAGES = "25912--25921",
BIBSOURCE = "http://www.visionbib.com/bibliography/match-pl502mmf1.html#TT113341"}
@inproceedings{bb116753,
AUTHOR = "Han, K. Y. and Cao, F. Z. and Shi, T. X. and Wang, P.",
TITLE = "A Dual Attention Network for Multimodal Remote Sensing Image Matching",
BOOKTITLE = CVIDL23,
YEAR = "2023",
PAGES = "128--134",
BIBSOURCE = "http://www.visionbib.com/bibliography/match-pl502mmf1.html#TT113342"}
@inproceedings{bb116754,
AUTHOR = "Liu, B. and Xu, Z. Q. and Bao, X. L. and Zhong, Z.",
TITLE = "{MUNformer}: A strong encoder that uses multi-level features extracted
by different feature extractors for fusion",
BOOKTITLE = CVIDL23,
YEAR = "2023",
PAGES = "291--295",
BIBSOURCE = "http://www.visionbib.com/bibliography/match-pl502mmf1.html#TT113343"}
@inproceedings{bb116755,
AUTHOR = "He, C. M. and Li, K. and Xu, G. X. and Zhang, Y. and Hu, R. Z. and Guo, Z. H. and Li, X.",
TITLE = "Degradation-Resistant Unfolding Network for Heterogeneous Image
Fusion",
BOOKTITLE = ICCV23,
YEAR = "2023",
PAGES = "12577--12587",
BIBSOURCE = "http://www.visionbib.com/bibliography/match-pl502mmf1.html#TT113344"}
@inproceedings{bb116756,
AUTHOR = "Liu, J. Y. and Liu, Z. and Wu, G. Y. and Ma, L. and Liu, R. S. and Zhong, W. and Luo, Z. X. and Fan, X.",
TITLE = "Multi-interactive Feature Learning and a Full-time Multi-modality
Benchmark for Image Fusion and Segmentation",
BOOKTITLE = ICCV23,
YEAR = "2023",
PAGES = "8081--8090",
BIBSOURCE = "http://www.visionbib.com/bibliography/match-pl502mmf1.html#TT113345"}
@inproceedings{bb116757,
AUTHOR = "Sippel, F. and Seiler, J. and Kaup, A.",
TITLE = "Cross Spectral Image Reconstruction Using a Deep Guided Neural
Network",
BOOKTITLE = ICIP23,
YEAR = "2023",
PAGES = "226--230",
BIBSOURCE = "http://www.visionbib.com/bibliography/match-pl502mmf1.html#TT113346"}
@inproceedings{bb116758,
AUTHOR = "Myers, A. and Kvinge, H. and Emerson, T.",
TITLE = "{TopFusion}: Using Topological Feature Space for Fusion and Imputation
in Multi-Modal Data",
BOOKTITLE = TAG-PRA23,
YEAR = "2023",
PAGES = "600--609",
BIBSOURCE = "http://www.visionbib.com/bibliography/match-pl502mmf1.html#TT113347"}
@inproceedings{bb116759,
AUTHOR = "Xue, Z. and Marculescu, R.",
TITLE = "Dynamic Multimodal Fusion",
BOOKTITLE = MULA23,
YEAR = "2023",
PAGES = "2575--2584",
BIBSOURCE = "http://www.visionbib.com/bibliography/match-pl502mmf1.html#TT113348"}
@inproceedings{bb116760,
AUTHOR = "Kong, L. K. and Qi, X. S. and Shen, Q. J. and Wang, J. C. and Zhang, J. Y. and Hu, Y. and Zhou, Q. C.",
TITLE = "Indescribable Multi-Modal Spatial Evaluator",
BOOKTITLE = CVPR23,
YEAR = "2023",
PAGES = "9853--9862",
BIBSOURCE = "http://www.visionbib.com/bibliography/match-pl502mmf1.html#TT113349"}
@inproceedings{bb116761,
AUTHOR = "Zhao, Z. X. and Bai, H. W. and Zhang, J. S. and Zhang, Y. and Xu, S. and Lin, Z. and Timofte, R. and Van Gool, L. J.",
TITLE = "{CDDFuse}: Correlation-Driven Dual-Branch Feature Decomposition for
Multi-Modality Image Fusion",
BOOKTITLE = CVPR23,
YEAR = "2023",
PAGES = "5906--5916",
BIBSOURCE = "http://www.visionbib.com/bibliography/match-pl502mmf1.html#TT113350"}
@inproceedings{bb116762,
AUTHOR = "Li, Y. W. and Quan, R. J. and Zhu, L. C. and Yang, Y.",
TITLE = "Efficient Multimodal Fusion via Interactive Prompting",
BOOKTITLE = CVPR23,
YEAR = "2023",
PAGES = "2604--2613",
BIBSOURCE = "http://www.visionbib.com/bibliography/match-pl502mmf1.html#TT113351"}
@inproceedings{bb116763,
AUTHOR = "Wetzer, E. and Lindblad, J. and Sladoje, N.",
TITLE = "Can Representation Learning for Multimodal Image Registration be
Improved by Supervision of Intermediate Layers?",
BOOKTITLE = IbPRIA23,
YEAR = "2023",
PAGES = "261--275",
BIBSOURCE = "http://www.visionbib.com/bibliography/match-pl502mmf1.html#TT113352"}
@inproceedings{bb116764,
AUTHOR = "Huang, Z. B. and Liu, J. Y. and Fan, X. and Liu, R. S. and Zhong, W. and Luo, Z. X.",
TITLE = "{ReCoNet}: Recurrent Correction Network for Fast and Efficient
Multi-modality Image Fusion",
BOOKTITLE = ECCV22,
VOLUME = "XVIII",
YEAR = "2022",
PAGES = "539--555",
BIBSOURCE = "http://www.visionbib.com/bibliography/match-pl502mmf1.html#TT113353"}
@inproceedings{bb116765,
AUTHOR = "Duan, J. L. and Chen, L. Q. and Tran, S. and Yang, J. Y. and Xu, Y. and Zeng, B. and Chilimbi, T.",
TITLE = "Multi-modal Alignment using Representation Codebook",
BOOKTITLE = CVPR22,
YEAR = "2022",
PAGES = "15630--15639",
BIBSOURCE = "http://www.visionbib.com/bibliography/match-pl502mmf1.html#TT113354"}
@inproceedings{bb116766,
AUTHOR = "Xue, Z. H. and Ren, S. C. and Gao, Z. Q. and Zhao, H.",
TITLE = "Multimodal Knowledge Expansion",
BOOKTITLE = ICCV21,
YEAR = "2021",
PAGES = "834--843",
BIBSOURCE = "http://www.visionbib.com/bibliography/match-pl502mmf1.html#TT113355"}
@inproceedings{bb116767,
AUTHOR = "Zolfaghari, M. and Zhu, Y. and Gehler, P. and Brox, T.",
TITLE = "{CrossCLR}: Cross-modal Contrastive Learning For Multi-modal Video
Representations",
BOOKTITLE = ICCV21,
YEAR = "2021",
PAGES = "1430--1439",
BIBSOURCE = "http://www.visionbib.com/bibliography/match-pl502mmf1.html#TT113356"}
@inproceedings{bb116768,
AUTHOR = "Yang, J. H. and Huang, Y. and Ma, Z. Y. and Wang, L.",
TITLE = "{CMF}: Cascaded Multi-Model Fusion for Referring Image Segmentation",
BOOKTITLE = ICIP21,
YEAR = "2021",
PAGES = "2289--2293",
BIBSOURCE = "http://www.visionbib.com/bibliography/match-pl502mmf1.html#TT113357"}
@inproceedings{bb116769,
AUTHOR = "Panda, R. and Chen, C. F. R. and Fan, Q. F. and Sun, X. and Saenko, K. and Oliva, A. and Feris, R. S.",
TITLE = "{AdaMML}: Adaptive Multi-Modal Learning for Efficient Video Recognition",
BOOKTITLE = ICCV21,
YEAR = "2021",
PAGES = "7556--7565",
BIBSOURCE = "http://www.visionbib.com/bibliography/match-pl502mmf1.html#TT113358"}
@inproceedings{bb116770,
AUTHOR = "Shi, Z. S. and Liang, J. and Li, Q. Q. and Zheng, H. Y. and Gu, Z. R. and Dong, J. Y. and Zheng, B.",
TITLE = "Multi-Modal Multi-Action Video Recognition",
BOOKTITLE = ICCV21,
YEAR = "2021",
PAGES = "13658--13667",
BIBSOURCE = "http://www.visionbib.com/bibliography/match-pl502mmf1.html#TT113359"}
@inproceedings{bb116771,
AUTHOR = "Huang, S. C. and Shen, L. Y. and Lungren, M. P. and Yeung, S.",
TITLE = "{GLoRIA}: A Multimodal Global-Local Representation Learning Framework
for Label-efficient Medical Image Recognition",
BOOKTITLE = ICCV21,
YEAR = "2021",
PAGES = "3922--3931",
BIBSOURCE = "http://www.visionbib.com/bibliography/match-pl502mmf1.html#TT113360"}
@inproceedings{bb116772,
AUTHOR = "Chen, B. and Rouditchenko, A. and Duarte, K. and Kuehne, H. and Thomas, S. and Boggust, A. and Panda, R. and Kingsbury, B. and Feris, R. S. and Harwath, D. and Glass, J. and Picheny, M. and Chang, S. F.",
TITLE = "Multimodal Clustering Networks for Self-supervised Learning from
Unlabeled Videos",
BOOKTITLE = ICCV21,
YEAR = "2021",
PAGES = "7992--8001",
BIBSOURCE = "http://www.visionbib.com/bibliography/match-pl502mmf1.html#TT113361"}
@inproceedings{bb116773,
AUTHOR = "Liang, T. and Lin, G. S. and Feng, L. and Zhang, Y. and Lv, F. M.",
TITLE = "Attention is not Enough: Mitigating the Distribution Discrepancy in
Asynchronous Multimodal Sequence Fusion",
BOOKTITLE = ICCV21,
YEAR = "2021",
PAGES = "8128--8136",
BIBSOURCE = "http://www.visionbib.com/bibliography/match-pl502mmf1.html#TT113362"}
@inproceedings{bb116774,
AUTHOR = "Liu, Y. Z. and Fan, Q. N. and Zhang, S. H. and Dong, H. and Funkhouser, T. and Yi, L.",
TITLE = "Contrastive Multimodal Fusion with {TupleInfoNCE}",
BOOKTITLE = ICCV21,
YEAR = "2021",
PAGES = "734--743",
BIBSOURCE = "http://www.visionbib.com/bibliography/match-pl502mmf1.html#TT113363"}
@inproceedings{bb116775,
AUTHOR = "Ouerghi, H. and Mourali, O. and Zagrouba, E.",
TITLE = "Multi-modal Image Fusion Based on Weight Local Features and Novel
Sum-modified-laplacian in Non-subsampled Shearlet Transform Domain",
BOOKTITLE = ISVC20,
VOLUME = "II",
YEAR = "2020",
PAGES = "166--179",
BIBSOURCE = "http://www.visionbib.com/bibliography/match-pl502mmf1.html#TT113364"}
@inproceedings{bb116776,
AUTHOR = "Perez Rua, J. M. and Vielzeuf, V. and Pateux, S. and Baccouche, M. and Jurie, F.",
TITLE = "{MFAS}: Multimodal Fusion Architecture Search",
BOOKTITLE = CVPR19,
YEAR = "2019",
PAGES = "6959--6968",
BIBSOURCE = "http://www.visionbib.com/bibliography/match-pl502mmf1.html#TT113365"}
@inproceedings{bb116777,
AUTHOR = "Sun, S. H. and Hu, J. and Yao, M. Q. and Hu, J. R. and Yang, X. D. and Song, Q. and Wu, X.",
TITLE = "Robust Multimodal Image Registration Using Deep Recurrent Reinforcement
Learning",
BOOKTITLE = ACCV18,
VOLUME = "II",
YEAR = "2018",
PAGES = "511--526",
BIBSOURCE = "http://www.visionbib.com/bibliography/match-pl502mmf1.html#TT113366"}
@inproceedings{bb116778,
AUTHOR = "Vielzeuf, V. and Lechervy, A. and Pateux, S. and Jurie, F.",
TITLE = "{CentralNet}: A Multilayer Approach for Multimodal Fusion",
BOOKTITLE = MultLearnApp18,
VOLUME = "VI",
YEAR = "2018",
PAGES = "575--589",
BIBSOURCE = "http://www.visionbib.com/bibliography/match-pl502mmf1.html#TT113367"}
@inproceedings{bb116779,
AUTHOR = "Son, C. H. and Zhang, X. P.",
TITLE = "Multimodal fusion via a series of transfers for noise removal",
BOOKTITLE = ICIP17,
YEAR = "2017",
PAGES = "530--534",
BIBSOURCE = "http://www.visionbib.com/bibliography/match-pl502mmf1.html#TT113368"}
@inproceedings{bb116780,
AUTHOR = "Shrivastava, A. and Rastegari, M. and Shekhar, S. and Chellappa, R. and Davis, L. S.",
TITLE = "Class consistent multi-modal fusion with binary features",
BOOKTITLE = CVPR15,
YEAR = "2015",
PAGES = "2282--2291",
BIBSOURCE = "http://www.visionbib.com/bibliography/match-pl502mmf1.html#TT113369"}
@inproceedings{bb116781,
AUTHOR = "Kasiri, K. and Fieguth, P. W. and Clausi, D. A.",
TITLE = "Self-similarity measure for multi-modal image registration",
BOOKTITLE = ICIP16,
YEAR = "2016",
PAGES = "4498--4502",
BIBSOURCE = "http://www.visionbib.com/bibliography/match-pl502mmf1.html#TT113370"}
@inproceedings{bb116782,
AUTHOR = "Kasiri, K. and Fieguth, P. W. and Clausi, D. A.",
TITLE = "Structural Representations for Multi-modal Image Registration Based on
Modified Entropy",
BOOKTITLE = ICIAR15,
YEAR = "2015",
PAGES = "82--89",
BIBSOURCE = "http://www.visionbib.com/bibliography/match-pl502mmf1.html#TT113371"}
@inproceedings{bb116783,
AUTHOR = "Zhang, H. and Chen, L. and Liu, J. and Yuan, J. S.",
TITLE = "Hierarchical multi-feature fusion for multimodal data analysis",
BOOKTITLE = ICIP14,
YEAR = "2014",
PAGES = "5916--5920",
BIBSOURCE = "http://www.visionbib.com/bibliography/match-pl502mmf1.html#TT113372"}
@inproceedings{bb116784,
AUTHOR = "Shen, X. Y. and Xu, L. and Zhang, Q. and Jia, J. Y.",
TITLE = "Multi-modal and Multi-spectral Registration for Natural Images",
BOOKTITLE = ECCV14,
VOLUME = "IV",
YEAR = "2014",
PAGES = "309--324",
BIBSOURCE = "http://www.visionbib.com/bibliography/match-pl502mmf1.html#TT113373"}
@inproceedings{bb116785,
AUTHOR = "Sahoo, S. and Nanda, P. K. and Samant, S.",
TITLE = "{Tsallis} and {Renyi}'s embedded entropy based mutual information for
multimodal image registration",
BOOKTITLE = NCVPRIPG13,
YEAR = "2013",
PAGES = "1--4",
BIBSOURCE = "http://www.visionbib.com/bibliography/match-pl502mmf1.html#TT113374"}
@inproceedings{bb116786,
AUTHOR = "Kim, M. J. and Han, D. K. and Ko, H. S.",
TITLE = "Multimodal image fusion via sparse representation with local patch
dictionaries",
BOOKTITLE = ICIP13,
YEAR = "2013",
PAGES = "1301--1305",
BIBSOURCE = "http://www.visionbib.com/bibliography/match-pl502mmf1.html#TT113375"}
@inproceedings{bb116787,
AUTHOR = "Glodek, M. and Schels, M. and Palm, G. and Schwenker, F.",
TITLE = "Multi-modal Fusion based on classifiers using reject options and {Markov}
Fusion Networks",
BOOKTITLE = ICPR12,
YEAR = "2012",
PAGES = "1084--1087",
BIBSOURCE = "http://www.visionbib.com/bibliography/match-pl502mmf1.html#TT113376"}
@inproceedings{bb116788,
AUTHOR = "Forsberg, D. and Farneback, G. and Knutsson, H. and Westin, C. F.",
TITLE = "Multi-modal Image Registration Using Polynomial Expansion and Mutual
Information",
BOOKTITLE = WBIR12,
YEAR = "2012",
PAGES = "40--49",
BIBSOURCE = "http://www.visionbib.com/bibliography/match-pl502mmf1.html#TT113377"}
@inproceedings{bb116789,
AUTHOR = "Bodensteiner, C. and Huebner, W. and Jueng Ling, K. and Mueller, J. and Arens, M.",
TITLE = "Local multi-modal image matching based on self-similarity",
BOOKTITLE = ICIP10,
YEAR = "2010",
PAGES = "937--940",
BIBSOURCE = "http://www.visionbib.com/bibliography/match-pl502mmf1.html#TT113378"}
@inproceedings{bb116790,
AUTHOR = "Vegh, V. and Yang, Z. Y. and Tieng, Q. M. and Reutens, D. C.",
TITLE = "Multimodal image registration using stochastic differential equation
optimization",
BOOKTITLE = ICIP10,
YEAR = "2010",
PAGES = "4385--4388",
BIBSOURCE = "http://www.visionbib.com/bibliography/match-pl502mmf1.html#TT113379"}
@inproceedings{bb116791,
AUTHOR = "Peng, T. Y. and Yigitsoy, M. and Eslami, A. and Bayer, C. and Navab, N.",
TITLE = "Deformable Registration of Multi-modal Microscopic Images Using a
Pyramidal Interactive Registration-Learning Methodology",
BOOKTITLE = WBIR14,
YEAR = "2014",
PAGES = "144--153",
BIBSOURCE = "http://www.visionbib.com/bibliography/match-pl502mmf1.html#TT113380"}
% NOTE(review): PAGES held the placeholder "xx-yy", which styles would print
% verbatim; it is omitted here until the real page range is confirmed.
@inproceedings{bb116792,
AUTHOR = "Wachinger, C. and Navab, N.",
TITLE = "Manifold Learning for Multi-modal Image Registration",
BOOKTITLE = BMVC10,
YEAR = "2010",
BIBSOURCE = "http://www.visionbib.com/bibliography/match-pl502mmf1.html#TT113381"}
@inproceedings{bb116793,
AUTHOR = "Xu, J. and Yuan, J. S. and Wu, Y.",
TITLE = "Multimodal Partial Estimates Fusion",
BOOKTITLE = ICCV09,
YEAR = "2009",
PAGES = "2177--2184",
BIBSOURCE = "http://www.visionbib.com/bibliography/match-pl502mmf1.html#TT113382"}
@inproceedings{bb116794,
AUTHOR = "Ma, W. Y. and Li, S. and Yao, Y. F. and Lan, C. and Gao, S. Q. and Tang, H. and Jing, X. Y.",
TITLE = "Multi-Modal Biometrics Pixel Level Fusion and {KPCA-RBF} Feature
Classification for Single Sample Recognition Problem",
BOOKTITLE = CISP09,
YEAR = "2009",
PAGES = "1--5",
BIBSOURCE = "http://www.visionbib.com/bibliography/match-pl502mmf1.html#TT113383"}
@inproceedings{bb116795,
AUTHOR = "Town, C. and Zhu, Z. G.",
TITLE = "Sensor Fusion and Environmental Modelling for Multimodal Sentient
Computing",
BOOKTITLE = MSCSAS07,
YEAR = "2007",
PAGES = "1--2",
BIBSOURCE = "http://www.visionbib.com/bibliography/match-pl502mmf1.html#TT113384"}
@inproceedings{bb116796,
AUTHOR = "Datar, M. and Gopalakrishnan, G. and Ranjan, S. and Mullick, R.",
TITLE = "Anatomically Guided Registration for Multimodal Images",
BOOKTITLE = AIPR06,
YEAR = "2006",
PAGES = "10",
BIBSOURCE = "http://www.visionbib.com/bibliography/match-pl502mmf1.html#TT113385"}
@inproceedings{bb116797,
AUTHOR = "Gopalakrishnan, G. and Kumar, S. V. B. and Narayanan, A. and Mullick, R.",
TITLE = "A fast piecewise deformable method for multi-modality image
registration",
BOOKTITLE = AIPR05,
YEAR = "2005",
PAGES = "114--119",
BIBSOURCE = "http://www.visionbib.com/bibliography/match-pl502mmf1.html#TT113386"}
@inproceedings{bb116798,
AUTHOR = "Kelman, A. and Sofka, M. and Stewart, C. V.",
TITLE = "Keypoint Descriptors for Matching Across Multiple Image Modalities and
Non-linear Intensity Variations",
BOOKTITLE = Fusion07,
YEAR = "2007",
PAGES = "1--7",
BIBSOURCE = "http://www.visionbib.com/bibliography/match-pl502mmf1.html#TT113387"}
@inproceedings{bb116799,
AUTHOR = "Guo, Y. J. and Lu, C. C.",
TITLE = "Multi-modality Image Registration Using Mutual Information Based on
Gradient Vector Flow",
BOOKTITLE = ICPR06,
VOLUME = "III",
YEAR = "2006",
PAGES = "697--700",
BIBSOURCE = "http://www.visionbib.com/bibliography/match-pl502mmf1.html#TT113388"}
Last update: Jun 4, 2026 at 16:38:45