@article{bb115700,
  author    = {Han, W. C. and Dong, X. P. and Zhang, Y. Y. and Crandall, D. and Xu, C. Z. and Shen, J. B.},
  title     = {Asymmetric Convolution: An Efficient and Generalized Method to Fuse Feature Maps in Multiple Vision Tasks},
  journal   = PAMI,
  volume    = {46},
  number    = {11},
  pages     = {7363--7376},
  month     = nov,
  year      = {2024},
  bibsource = {http://www.visionbib.com/bibliography/match-pl502mmf1.html#TT112290}
}

@article{bb115701,
  author    = {Wu, Q. and Yu, Q.},
  title     = {A Fast Sequential Similarity Detection Algorithm for Multi-Source Image Matching},
  journal   = RS,
  volume    = {16},
  number    = {19},
  pages     = {3589},
  year      = {2024},
  bibsource = {http://www.visionbib.com/bibliography/match-pl502mmf1.html#TT112291}
}

@article{bb115702,
  author    = {Saidi, S. and Idbraim, S. and Karmoude, Y. and Masse, A. and Arbelo, M.},
  title     = {Deep-Learning for Change Detection Using Multi-Modal Fusion of Remote Sensing Images: A Review},
  journal   = RS,
  volume    = {16},
  number    = {20},
  pages     = {3852},
  year      = {2024},
  bibsource = {http://www.visionbib.com/bibliography/match-pl502mmf1.html#TT112292}
}

@article{bb115703,
  author    = {Liu, Y. Y. and He, W. and Zhang, H. Y.},
  title     = {{GRiD}: Guided Refinement for Detector-Free Multimodal Image Matching},
  journal   = IP,
  volume    = {33},
  pages     = {5892--5906},
  year      = {2024},
  bibsource = {http://www.visionbib.com/bibliography/match-pl502mmf1.html#TT112293}
}

@article{bb115704,
  author    = {Wang, J. P. and Su, N. and Zhao, C. H. and Yan, Y. M. and Feng, S.},
  title     = {Multi-Modal Object Detection Method Based on Dual-Branch Asymmetric Attention Backbone and Feature Fusion Pyramid Network},
  journal   = RS,
  volume    = {16},
  number    = {20},
  pages     = {3904},
  year      = {2024},
  bibsource = {http://www.visionbib.com/bibliography/match-pl502mmf1.html#TT112294}
}

@article{bb115705,
  author    = {Liu, Y. and Liu, F. and Jiao, L. C. and Bao, Q. Y. and Sun, L. and Li, S. and Li, L. L. and Liu, X.},
  title     = {Multi-Grained Gradual Inference Model for Multimedia Event Extraction},
  journal   = CirSysVideo,
  volume    = {34},
  number    = {10},
  pages     = {10507--10520},
  month     = oct,
  year      = {2024},
  bibsource = {http://www.visionbib.com/bibliography/match-pl502mmf1.html#TT112295}
}

@article{bb115706,
  author    = {Wang, X. X. and Fang, L. X. and Zhao, J. L. and Pan, Z. K. and Li, H. and Li, Y.},
  title     = {{MMAE}: A universal image fusion method via mask attention mechanism},
  journal   = PR,
  volume    = {158},
  pages     = {111041},
  year      = {2025},
  bibsource = {http://www.visionbib.com/bibliography/match-pl502mmf1.html#TT112296}
}

@article{bb115707,
  author    = {Zhang, D. and Bashar, M. A. and Nayak, R.},
  title     = {A novel multi-modal fusion method based on uncertainty-guided meta-learning},
  journal   = PR,
  volume    = {158},
  pages     = {110993},
  year      = {2025},
  bibsource = {http://www.visionbib.com/bibliography/match-pl502mmf1.html#TT112297}
}

@article{bb115708,
  author    = {Lv, T. and Ji, C. M. and Jiang, H. and Liu, Y.},
  title     = {{HF2TNet}: A Hierarchical Fusion Two-Stage Training Network for Infrared and Visible Image Fusion},
  journal   = SPLetters,
  volume    = {31},
  pages     = {3164--3168},
  year      = {2024},
  bibsource = {http://www.visionbib.com/bibliography/match-pl502mmf1.html#TT112298}
}

@article{bb115709,
  author    = {Meng, X. C. and Chen, C. Q. and Liu, Q. and Shao, F.},
  title     = {Multi-domain pseudo-reference quality evaluation for infrared and visible image fusion},
  journal   = IET-IPR,
  volume    = {18},
  number    = {13},
  pages     = {4095--4113},
  year      = {2024},
  bibsource = {http://www.visionbib.com/bibliography/match-pl502mmf1.html#TT112299}
}

@article{bb115710,
  author    = {Bai, Y. and Gao, M. and Li, S. Y. and Wang, P. and Guan, N. and Yin, H. Z. and Yan, Y. H.},
  title     = {{IBFusion}: An Infrared and Visible Image Fusion Method Based on Infrared Target Mask and Bimodal Feature Extraction Strategy},
  journal   = MultMed,
  volume    = {26},
  pages     = {10610--10622},
  year      = {2024},
  bibsource = {http://www.visionbib.com/bibliography/match-pl502mmf1.html#TT112300}
}

@article{bb115711,
  author    = {Wang, X. X. and Fang, L. X. and Zhao, J. L. and Pan, Z. K. and Li, H. and Li, Y.},
  title     = {{UUD-Fusion}: An unsupervised universal image fusion approach via generative diffusion model},
  journal   = CVIU,
  volume    = {249},
  pages     = {104218},
  year      = {2024},
  bibsource = {http://www.visionbib.com/bibliography/match-pl502mmf1.html#TT112301}
}

@article{bb115712,
  author    = {Dong, A. and Wang, L. and Liu, J. and Xu, J. Y. and Zhao, G. X. and Zhai, Y. and Lv, G. H. and Cheng, J.},
  title     = {Co-Enhancement of Multi-Modality Image Fusion and Object Detection via Feature Adaptation},
  journal   = CirSysVideo,
  volume    = {34},
  number    = {12},
  pages     = {12624--12637},
  month     = dec,
  year      = {2024},
  bibsource = {http://www.visionbib.com/bibliography/match-pl502mmf1.html#TT112302}
}

@article{bb115713,
  author    = {Wu, X. and Cao, Z. H. and Huang, T. Z. and Deng, L. J. and Chanussot, J. and Vivone, G.},
  title     = {Fully-Connected Transformer for Multi-Source Image Fusion},
  journal   = PAMI,
  volume    = {47},
  number    = {3},
  pages     = {2071--2088},
  month     = mar,
  year      = {2025},
  bibsource = {http://www.visionbib.com/bibliography/match-pl502mmf1.html#TT112303}
}

@article{bb115714,
  author    = {Cao, Z. H. and Liang, Y. J. and Deng, L. J. and Vivone, G.},
  title     = {An Efficient Image Fusion Network Exploiting Unifying Language and Mask Guidance},
  journal   = PAMI,
  volume    = {47},
  number    = {11},
  pages     = {9845--9862},
  month     = nov,
  year      = {2025},
  bibsource = {http://www.visionbib.com/bibliography/match-pl502mmf1.html#TT112304}
}

@article{bb115715,
  author    = {Hussain, I. and Tan, S. Q. and Huang, J. W.},
  title     = {Few-Shot Based Learning Recaptured Image Detection with Multi-Scale Feature Fusion and Attention},
  journal   = PR,
  volume    = {161},
  pages     = {111248},
  year      = {2025},
  bibsource = {http://www.visionbib.com/bibliography/match-pl502mmf1.html#TT112305}
}

@article{bb115716,
  author    = {Tang, H. and Liu, D. W. and Shen, C. C.},
  title     = {Data-efficient multi-scale fusion vision transformer},
  journal   = PR,
  volume    = {161},
  pages     = {111305},
  year      = {2025},
  bibsource = {http://www.visionbib.com/bibliography/match-pl502mmf1.html#TT112306}
}

@article{bb115717,
  author    = {Liu, T. F. and Zhang, M. Y. and Gong, M. and Zhang, Q. F. and Jiang, F. L. and Zheng, H. H. and Lu, D.},
  title     = {Commonality Feature Representation Learning for Unsupervised Multimodal Change Detection},
  journal   = IP,
  volume    = {34},
  pages     = {1219--1233},
  year      = {2025},
  bibsource = {http://www.visionbib.com/bibliography/match-pl502mmf1.html#TT112307}
}

@article{bb115718,
  author    = {Xu, J. J. and Liu, T. F. and Lei, T. and Chen, H. R. X. and Yokoya, N. and Lv, Z. Y. and Gong, M.},
  title     = {{CGSL}: Commonality graph structure learning for unsupervised multimodal change detection},
  journal   = PandRS,
  volume    = {229},
  pages     = {92--106},
  year      = {2025},
  bibsource = {http://www.visionbib.com/bibliography/match-pl502mmf1.html#TT112308}
}

@article{bb115719,
  author    = {Liu, Z. W. and Cheng, J. and Fan, J. and Lin, S. and Wang, Y. and Zhao, X. M.},
  title     = {Multi-Modal Fusion Based on Depth Adaptive Mechanism for {3D} Object Detection},
  journal   = MultMed,
  volume    = {27},
  pages     = {707--717},
  year      = {2025},
  bibsource = {http://www.visionbib.com/bibliography/match-pl502mmf1.html#TT112309}
}

@article{bb115720,
  author    = {Dong, C. and Wang, L. Z. and Zhang, F. and Hua, Q.},
  title     = {Multi-modal Few-shot Image Recognition with enhanced semantic and visual integration},
  journal   = IVC,
  volume    = {157},
  pages     = {105490},
  year      = {2025},
  bibsource = {http://www.visionbib.com/bibliography/match-pl502mmf1.html#TT112310}
}

@article{bb115721,
  author    = {Tang, L. and Liu, Y. and Tian, Y. J. and Pardalos, P. M.},
  title     = {Complementary label learning with multi-view data and a semi-supervised labeling mechanism},
  journal   = PR,
  volume    = {165},
  pages     = {111651},
  year      = {2025},
  bibsource = {http://www.visionbib.com/bibliography/match-pl502mmf1.html#TT112311}
}

@article{bb115722,
  author    = {Zhou, M. and Huang, J. and Yan, K. Y. and Hong, D. F. and Jia, X. P. and Chanussot, J. and Li, C. Y.},
  title     = {A General Spatial-Frequency Learning Framework for Multimodal Image Fusion},
  journal   = PAMI,
  volume    = {47},
  number    = {7},
  pages     = {5281--5298},
  month     = jul,
  year      = {2025},
  bibsource = {http://www.visionbib.com/bibliography/match-pl502mmf1.html#TT112312}
}

@article{bb115723,
  author    = {Wang, Z. and Zhao, L. and Zhang, J. Z. and Song, R. and Song, H. Y. and Meng, J. and Wang, S. D.},
  title     = {Multi-Text Guidance Is Important: Multi-Modality Image Fusion via Large Generative Vision-Language Model},
  journal   = IJCV,
  volume    = {133},
  number    = {7},
  pages     = {4646--4668},
  month     = jul,
  year      = {2025},
  bibsource = {http://www.visionbib.com/bibliography/match-pl502mmf1.html#TT112313}
}

@article{bb115724,
  author    = {Liu, Y. and Li, C. X. and Xu, S. K. and Han, J. G.},
  title     = {Part-Whole Relational Fusion Towards Multi-Modal Scene Understanding},
  journal   = IJCV,
  volume    = {133},
  number    = {7},
  pages     = {4483--4503},
  month     = jul,
  year      = {2025},
  bibsource = {http://www.visionbib.com/bibliography/match-pl502mmf1.html#TT112314}
}

@article{bb115725,
  author    = {Ravi, J. and Narmadha, R.},
  title     = {A Systematic Literature Review on Multimodal Image Fusion Models with Challenges and Future Research Trends},
  journal   = IJIG,
  volume    = {25},
  number    = {4},
  pages     = {2550039},
  month     = jul,
  year      = {2025},
  bibsource = {http://www.visionbib.com/bibliography/match-pl502mmf1.html#TT112315}
}

@article{bb115726,
  author    = {Liu, Y. P. and Sun, Z. C. and Yu, B. S. and Zhao, Y. T. and Du, B. and Xu, Y. C. and Cheng, J.},
  title     = {{MIFNet}: Learning Modality-Invariant Features for Generalizable Multimodal Image Matching},
  journal   = IP,
  volume    = {34},
  pages     = {3593--3608},
  year      = {2025},
  bibsource = {http://www.visionbib.com/bibliography/match-pl502mmf1.html#TT112316}
}

@article{bb115727,
  author    = {Yang, Z. and Song, N. and Li, W. and Zhu, X. T. and Zhang, L. and Torr, P. H. S.},
  title     = {{DeepInteraction++}: Multi-Modality Interaction for Autonomous Driving},
  journal   = PAMI,
  volume    = {47},
  number    = {8},
  pages     = {6749--6763},
  month     = aug,
  year      = {2025},
  bibsource = {http://www.visionbib.com/bibliography/match-pl502mmf1.html#TT112317}
}

@article{bb115728,
  author    = {Lu, M. and Jiang, M. and Tao, X. F. and Kong, J.},
  title     = {{AU-Net}: Adaptive Unified Network for Joint Multi-Modal Image Registration and Fusion},
  journal   = IP,
  volume    = {34},
  pages     = {4721--4735},
  year      = {2025},
  bibsource = {http://www.visionbib.com/bibliography/match-pl502mmf1.html#TT112318}
}

@article{bb115729,
  author    = {Wang, Q. H. and Li, Z. W. and Zhang, S. Q. and Chi, N. and Dai, Q. H.},
  title     = {{WaveFusion}: A Novel Wavelet Vision Transformer With Saliency-Guided Enhancement for Multimodal Image Fusion},
  journal   = CirSysVideo,
  volume    = {35},
  number    = {8},
  pages     = {7526--7542},
  month     = aug,
  year      = {2025},
  bibsource = {http://www.visionbib.com/bibliography/match-pl502mmf1.html#TT112319}
}

@article{bb115730,
  author    = {Liang, P. W. and Jiang, J. J. and Ma, Q. and Wang, C. Y. and Liu, X. M. and Ma, J. Y.},
  title     = {{FusionINV}: A Diffusion-Based Approach for Multimodal Image Fusion},
  journal   = IP,
  volume    = {34},
  pages     = {5355--5368},
  year      = {2025},
  bibsource = {http://www.visionbib.com/bibliography/match-pl502mmf1.html#TT112320}
}

@article{bb115731,
  author    = {Shi, L. T. and Zhong, B. and Liang, Q. H. and Hu, X. T. and Mo, Z. Y. and Song, S. X.},
  title     = {{Mamba} Adapter: Efficient Multi-Modal Fusion for Vision-Language Tracking},
  journal   = CirSysVideo,
  volume    = {35},
  number    = {9},
  pages     = {9300--9311},
  month     = sep,
  year      = {2025},
  bibsource = {http://www.visionbib.com/bibliography/match-pl502mmf1.html#TT112321}
}

@article{bb115732,
  author    = {Liu, X. Y. and Ming, R. and Du, S. L. and He, L. H. and Luo, H. B. and Xiao, G.},
  title     = {{HSENet}: Hierarchical Semantic-Enriched Network for Multi-Modal Image Fusion},
  journal   = PR,
  volume    = {170},
  pages     = {112043},
  year      = {2026},
  bibsource = {http://www.visionbib.com/bibliography/match-pl502mmf1.html#TT112322}
}

@article{bb115733,
  author    = {Zavras, A. and Michail, D. and Demir, B. and Papoutsis, I.},
  title     = {Mind the modality gap: Towards a remote sensing vision-language model via cross-modal alignment},
  journal   = PandRS,
  volume    = {228},
  pages     = {270--287},
  year      = {2025},
  bibsource = {http://www.visionbib.com/bibliography/match-pl502mmf1.html#TT112323}
}

@article{bb115734,
  author    = {Cheng, T. and Chen, H. and Zhang, X. H. and Gao, X. W. and Yin, L. and Jiao, J. B.},
  title     = {Multi-Channel Spatio-Temporal Data Fusion of 'Big' and 'Small' Network Data Using Transformer Networks},
  journal   = IJGI,
  volume    = {14},
  number    = {8},
  pages     = {286},
  year      = {2025},
  bibsource = {http://www.visionbib.com/bibliography/match-pl502mmf1.html#TT112324}
}

@article{bb115735,
  author    = {Hu, J. J. and Fan, C. and Ozay, M. and Gao, Q. and Guo, Y. L. and Lam, T. L.},
  title     = {Robust Depth Estimation Under Sensor Degradations: A Multi-Sensor Fusion Perspective},
  journal   = PAMI,
  volume    = {47},
  number    = {10},
  pages     = {8691--8707},
  month     = oct,
  year      = {2025},
  bibsource = {http://www.visionbib.com/bibliography/match-pl502mmf1.html#TT112325}
}

@article{bb115736,
  author    = {Xin, J. W. and Shi, B. and Wang, N. N. and Li, J. and Gao, X. B.},
  title     = {{MVFusion}: Generative Representation Learning With Masked Variational Autoencoders for Multi-Modality Image Fusion},
  journal   = IP,
  volume    = {34},
  pages     = {6418--6431},
  year      = {2025},
  bibsource = {http://www.visionbib.com/bibliography/match-pl502mmf1.html#TT112326}
}

@article{bb115737,
  author    = {Zheng, T. H. and Dong, G. L. and Zhang, P. P. and He, X. and Ren, C.},
  title     = {Plug-and-Play General Image Registration for Misaligned Multi-Modal Image Fusion},
  journal   = CirSysVideo,
  volume    = {35},
  number    = {10},
  pages     = {10017--10031},
  month     = oct,
  year      = {2025},
  bibsource = {http://www.visionbib.com/bibliography/match-pl502mmf1.html#TT112327}
}

@article{bb115738,
  author    = {Jiao, S. C. and Long, L. and Kuang, L. Q. and Xiong, F. G. and Han, X.},
  title     = {Multi-modal semantic embedding network for {3D} shape recognition and retrieval},
  journal   = JVCIR,
  volume    = {112},
  pages     = {104559},
  year      = {2025},
  bibsource = {http://www.visionbib.com/bibliography/match-pl502mmf1.html#TT112328}
}

@article{bb115739,
  author    = {Sun, H. and Lv, L. and Zhang, P. P. and Tang, T. and Tian, F. and Sun, W. and Lu, H. C.},
  title     = {Spatial-Frequency Enhanced {Mamba} for Multi-Modal Image Fusion},
  journal   = IP,
  volume    = {34},
  pages     = {7684--7696},
  year      = {2025},
  bibsource = {http://www.visionbib.com/bibliography/match-pl502mmf1.html#TT112329}
}

@article{bb115740,
  author    = {Sun, Y. J. and Dong, W. S. and Wang, S. and Wu, P. and Feng, M. T. and Li, X. and Shi, G. M.},
  title     = {Distilling Hierarchical Knowledge From Multimodal Fusion for Unimodal Image Segmentation},
  journal   = CirSysVideo,
  volume    = {35},
  number    = {12},
  pages     = {11797--11809},
  month     = dec,
  year      = {2025},
  bibsource = {http://www.visionbib.com/bibliography/match-pl502mmf1.html#TT112330}
}

@article{bb115741,
  author    = {Hu, S. and Liu, T. and Han, L. Y. and Xing, R.},
  title     = {Vision-language tracking with attention-based optimization},
  journal   = JVCIR,
  volume    = {114},
  pages     = {104644},
  year      = {2026},
  bibsource = {http://www.visionbib.com/bibliography/match-pl502mmf1.html#TT112331}
}

@article{bb115742,
  author    = {Yu, C. B. and Pei, Z. H. and Wang, X. R. and Zhou, H. B.},
  title     = {{CrossGlue}: Cross-Modal Image matching via potential message investigation and visual-gradient message integration},
  journal   = JVCIR,
  volume    = {114},
  pages     = {104620},
  year      = {2026},
  bibsource = {http://www.visionbib.com/bibliography/match-pl502mmf1.html#TT112332}
}

@article{bb115743,
  author    = {Zhou, D. D. and Xu, L. and Wu, K. and Liu, H. Z. and Jiang, M. T.},
  title     = {{DSEPGAN}: A Dual-Stream Enhanced Pyramid Based on Generative Adversarial Network for Spatiotemporal Image Fusion},
  journal   = RS,
  volume    = {17},
  number    = {24},
  pages     = {4050},
  year      = {2025},
  bibsource = {http://www.visionbib.com/bibliography/match-pl502mmf1.html#TT112333}
}

@article{bb115744,
  author    = {Jiang, J. L. and Hu, G. and Sheng, G. L. and Wei, G.},
  title     = {{PSG-MCANet}: Multi-order cross-attention modeling for multimodal fusion based on punning semantic guidance},
  journal   = PR,
  volume    = {172},
  pages     = {112723},
  year      = {2026},
  bibsource = {http://www.visionbib.com/bibliography/match-pl502mmf1.html#TT112334}
}

@article{bb115745,
  author    = {Li, M. Y. and Meng, C. and Fan, X. D.},
  title     = {Iterative optimal transport for multimodal image registration},
  journal   = PR,
  volume    = {172},
  pages     = {112736},
  year      = {2026},
  bibsource = {http://www.visionbib.com/bibliography/match-pl502mmf1.html#TT112335}
}

@article{bb115746,
  author    = {Wang, Y. X. and Shen, Z. W. and Li, H. and Zhang, Y. N. and Xia, Z. P.},
  title     = {{SGCNet}: Silhouette Guided Cascaded Network for Multi-Modal Image Fusion},
  journal   = CVIU,
  volume    = {263},
  pages     = {104603},
  year      = {2026},
  bibsource = {http://www.visionbib.com/bibliography/match-pl502mmf1.html#TT112336}
}

@article{bb115747,
  author    = {He, D. and Wang, G. F. and Li, W. S. and Shu, Y. C. and Li, W. B. and Yang, L. J. and Huang, Y. P. and Li, F. Y.},
  title     = {Rethinking normalization strategies and convolutional kernels for multimodal image fusion},
  journal   = PR,
  volume    = {173},
  pages     = {112903},
  year      = {2026},
  bibsource = {http://www.visionbib.com/bibliography/match-pl502mmf1.html#TT112337}
}

@article{bb115748,
  author    = {Ning, T. and Lu, K. and Jiang, X. and Xue, J.},
  title     = {{Mambafusion}: State-space model-driven object-scene fusion for multi-modal {3D} object detection},
  journal   = PR,
  volume    = {173},
  pages     = {112820},
  year      = {2026},
  bibsource = {http://www.visionbib.com/bibliography/match-pl502mmf1.html#TT112338}
}

@article{bb115749,
  author    = {Li, S. T. and Tang, H.},
  title     = {Multimodal Alignment and Fusion: A Survey},
  journal   = IJCV,
  volume    = {134},
  number    = {1},
  pages     = {103},
  month     = jan,
  year      = {2026},
  bibsource = {http://www.visionbib.com/bibliography/match-pl502mmf1.html#TT112339}
}

@article{bb115750,
  author    = {Fu, Y. and Ye, X. and Kong, X. Y.},
  title     = {{KPTFusion}: Knowledge Prior-based Task-Driven Multimodal Image Fusion},
  journal   = IVC,
  volume    = {167},
  pages     = {105886},
  year      = {2026},
  bibsource = {http://www.visionbib.com/bibliography/match-pl502mmf1.html#TT112340}
}

@article{bb115751,
  author    = {Qin, X. R. and Cui, Y. N. and Sun, S. Q. and Chen, R. and Ren, W. Q. and Knoll, A. and Cao, X. C.},
  title     = {Disentangle to Fuse: Toward Content Preservation and Cross-Modality Consistency for Multi-Modality Image Fusion},
  journal   = IP,
  volume    = {35},
  pages     = {1756--1770},
  year      = {2026},
  bibsource = {http://www.visionbib.com/bibliography/match-pl502mmf1.html#TT112341}
}

@article{bb115752,
  author    = {Chen, H. and Zhou, H. R. and Zhang, Y. and Lin, Z. and Deng, Y. J.},
  title     = {Dissecting {RGB-D} Learning for Improved Multi-Modal Fusion},
  journal   = IP,
  volume    = {35},
  pages     = {1846--1857},
  year      = {2026},
  bibsource = {http://www.visionbib.com/bibliography/match-pl502mmf1.html#TT112342}
}

@article{bb115753,
  author    = {Zhang, J. J. and Zhao, F. and Liu, H. Q. and Yu, J.},
  title     = {Generative Information-Guided Heterogeneous Cross-Fusion Network With Contrastive Learning for Multimodal Remote Sensing Image Classification},
  journal   = CirSysVideo,
  volume    = {36},
  number    = {2},
  pages     = {1876--1892},
  month     = feb,
  year      = {2026},
  bibsource = {http://www.visionbib.com/bibliography/match-pl502mmf1.html#TT112343}
}

@article{bb115754,
  author    = {Ning, Z. W. and Liu, Z. J. and Gao, X. and Zuo, Y. F. and Yang, J. and Fang, Y. M. and Liu, W.},
  title     = {{CMF-IoU}: Multi-Stage Cross-Modal Fusion {3D} Object Detection With {IoU} Joint Prediction},
  journal   = CirSysVideo,
  volume    = {36},
  number    = {2},
  pages     = {2177--2190},
  month     = feb,
  year      = {2026},
  bibsource = {http://www.visionbib.com/bibliography/match-pl502mmf1.html#TT112344}
}

@article{bb115755,
  author    = {Mutakabbir, A. and Lung, C. H. and Zaman, M. and Upadhyay, D. and Naik, K. and Millard, K. and Ravichandran, T. and Purcell, R.},
  title     = {{NOAH}: A Multi-Modal and Sensor Fusion Dataset for Generative Modeling in Remote Sensing},
  journal   = RS,
  volume    = {18},
  number    = {3},
  pages     = {466},
  year      = {2026},
  bibsource = {http://www.visionbib.com/bibliography/match-pl502mmf1.html#TT112345}
}

@article{bb115756,
  author    = {Rao, J. H. and Liu, R. and Guan, J. J. and Tian, X.},
  title     = {{AMS-Former}: Adaptive multi-scale transformer for multi-modal image matching},
  journal   = PandRS,
  volume    = {232},
  pages     = {957--973},
  year      = {2026},
  bibsource = {http://www.visionbib.com/bibliography/match-pl502mmf1.html#TT112346}
}

@article{bb115757,
  author    = {Cao, J. Z. and Chen, J. S. and Wang, X. X. and Huang, W. M. and Chen, D. S. and Zhao, T. H. and Tu, W. and Li, Q. Q.},
  title     = {{UrbanMMCL}: Urban region representations via multi-modal and multi-graph self-supervised contrastive learning},
  journal   = PandRS,
  volume    = {232},
  pages     = {75--93},
  year      = {2026},
  bibsource = {http://www.visionbib.com/bibliography/match-pl502mmf1.html#TT112347}
}

@article{bb115758,
  author    = {Lu, R. and Zhuo, Z. H. and Wang, S. and Fan, J. and Shen, T. and Yang, X. G.},
  title     = {{SAMKD}: A Hybrid Lightweight Algorithm Based on Selective Activation and Masked Knowledge Distillation for Multimodal Object Detection},
  journal   = RS,
  volume    = {18},
  number    = {3},
  pages     = {450},
  year      = {2026},
  bibsource = {http://www.visionbib.com/bibliography/match-pl502mmf1.html#TT112348}
}

@article{bb115759,
  author    = {Ying, Z. H. and Guo, J. and Li, Y. S. and Gao, Y. and Li, C. Y.},
  title     = {{Diff-Transformer}: Heterogeneous Feature Fusion Network for Multisource Remote Sensing Classification},
  journal   = CirSysVideo,
  volume    = {36},
  number    = {2},
  pages     = {1501--1516},
  month     = feb,
  year      = {2026},
  bibsource = {http://www.visionbib.com/bibliography/match-pl502mmf1.html#TT112349}
}

@article{bb115760,
  author    = {Zhang, Y. and Xie, W. Y. and Hui, T. L. and Li, D. X. and Zhang, J. Q. and Lei, J. and Li, Y. S. and Fang, L. Y.},
  title     = {{LoME}: {LoRA}-Driven Multimodal Extractor for {RGB-X} Vision Tasks},
  journal   = CirSysVideo,
  volume    = {36},
  number    = {2},
  pages     = {1487--1500},
  month     = feb,
  year      = {2026},
  bibsource = {http://www.visionbib.com/bibliography/match-pl502mmf1.html#TT112350}
}

@article{bb115761,
  author    = {Yang, Z. and Dong, Y. P. and Wang, J. Y. and Wang, H. and Ma, L. C. and Cui, Z. J. and Liu, Q. and Pei, H. R. and Zhang, K. and Zhang, C.},
  title     = {{DAOcc}: {3D} Object Detection Assisted Multi-Sensor Fusion for {3D} Occupancy Prediction},
  journal   = CirSysVideo,
  volume    = {36},
  number    = {2},
  pages     = {1742--1753},
  month     = feb,
  year      = {2026},
  bibsource = {http://www.visionbib.com/bibliography/match-pl502mmf1.html#TT112351}
}

@inproceedings{bb115762,
  author    = {Xue, F. and Elflein, S. and Leal Taixe, L. and Zhou, Q.},
  title     = {{MATCHA}: Towards Matching Anything},
  booktitle = CVPR25,
  pages     = {27081--27091},
  year      = {2025},
  bibsource = {http://www.visionbib.com/bibliography/match-pl502mmf1.html#TT112352}
}

@inproceedings{bb115763,
  author    = {Shrivastava, A. and Owens, A.},
  title     = {Self-Supervised Spatial Correspondence Across Modalities},
  booktitle = CVPR25,
  pages     = {6383--6393},
  year      = {2025},
  bibsource = {http://www.visionbib.com/bibliography/match-pl502mmf1.html#TT112353}
}

@inproceedings{bb115764,
  author    = {Zhou, B. and Li, L. and Wang, Y. J. and Liu, H. F. and Yao, Y. Z. and Wang, W. G.},
  title     = {{UniAlign}: Scaling Multimodal Alignment within One Unified Model},
  booktitle = CVPR25,
  pages     = {29644--29655},
  year      = {2025},
  bibsource = {http://www.visionbib.com/bibliography/match-pl502mmf1.html#TT112354}
}

@inproceedings{bb115765,
  author    = {Hou, J. M. and Chen, X. Y. and Ran, R. and Cong, X. F. and Liu, X. Y. and You, J. W. and Deng, L. J.},
  title     = {Binarized Neural Network for Multi-spectral Image Fusion},
  booktitle = CVPR25,
  pages     = {2236--2245},
  year      = {2025},
  bibsource = {http://www.visionbib.com/bibliography/match-pl502mmf1.html#TT112355}
}

@inproceedings{bb115766,
  author    = {Li, Y. and Xing, Y. F. and Lan, X. Y. and Li, X. and Chen, H. F. and Jiang, D. M.},
  title     = {{AlignMamba}: Enhancing Multimodal {Mamba} with Local and Global Cross-Modal Alignment},
  booktitle = CVPR25,
  pages     = {24774--24784},
  year      = {2025},
  bibsource = {http://www.visionbib.com/bibliography/match-pl502mmf1.html#TT112356}
}

@inproceedings{bb115767,
  author    = {Maniparambil, M. and Akshulakov, R. and Djilali, Y. A. D. and Narayan, S. and Singh, A. and O'Connor, N. E.},
  title     = {Harnessing Frozen Unimodal Encoders for Flexible Multimodal Alignment},
  booktitle = CVPR25,
  pages     = {29847--29857},
  year      = {2025},
  bibsource = {http://www.visionbib.com/bibliography/match-pl502mmf1.html#TT112357}
}

@inproceedings{bb115768,
  author    = {Li, H. and Hou, Y. N. and Xing, X. H. and Ma, Y. X. and Sun, X. and Zhang, Y.},
  title     = {{OccMamba}: Semantic Occupancy Prediction with State Space Models},
  booktitle = CVPR25,
  pages     = {11949--11959},
  year      = {2025},
  bibsource = {http://www.visionbib.com/bibliography/match-pl502mmf1.html#TT112358}
}

@inproceedings{bb115769,
  author    = {Chen, L. and Wang, J. and Mortlock, T. and Khargonekar, P. and Faruque, M. A. A.},
  title     = {Hyperdimensional Uncertainty Quantification for Multimodal Uncertainty Fusion in Autonomous Vehicles Perception},
  booktitle = CVPR25,
  pages     = {22306--22316},
  year      = {2025},
  bibsource = {http://www.visionbib.com/bibliography/match-pl502mmf1.html#TT112359}
}

@inproceedings{bb115770,
  author    = {Wu, G. Y. and Liu, H. Y. and Fu, H. M. and Peng, Y. C. and Liu, J. Y. and Fan, X. and Liu, R. S.},
  title     = {Every {SAM} Drop Counts: Embracing Semantic Priors for Multi-Modality Image Fusion and Beyond},
  booktitle = CVPR25,
  pages     = {17882--17891},
  year      = {2025},
  bibsource = {http://www.visionbib.com/bibliography/match-pl502mmf1.html#TT112360}
}

@inproceedings{bb115771,
  author    = {Mei, S. B. and Ni, B. B. and Wang, H. and Zhao, C. L. and Hu, F. and Pi, Z. M. and Ke, B.},
  title     = {Object-Oriented Anchoring and Modal Alignment in Multimodal Learning},
  booktitle = ECCV24,
  pages     = {L: 179--196},
  year      = {2024},
  bibsource = {http://www.visionbib.com/bibliography/match-pl502mmf1.html#TT112361}
}

@inproceedings{bb115772,
  author    = {Tran, Q. H. and Ahmed, M. and Popattia, M. and Ahmed, M. H. and Konin, A. and Zia, M. Z.},
  title     = {Learning by Aligning {2D} Skeleton Sequences and Multi-Modality Fusion},
  booktitle = ECCV24,
  pages     = {L: 141--161},
  year      = {2024},
  bibsource = {http://www.visionbib.com/bibliography/match-pl502mmf1.html#TT112362}
}

@inproceedings{bb115773,
  author    = {Li, C. X. and Liu, X. Y. and Wang, C. and Liu, Y. F. and Yu, W. H. and Shao, J. and Yuan, Y. X.},
  title     = {{GTP-4O}: Modality-prompted Heterogeneous Graph Learning for Omni-modal Biomedical Representation},
  booktitle = ECCV24,
  pages     = {IV: 168--187},
  year      = {2024},
  bibsource = {http://www.visionbib.com/bibliography/match-pl502mmf1.html#TT112363}
}

@inproceedings{bb115774,
  author    = {Song, Z. Q. and Wang, L. F.},
  title     = {Dual Multi-Modal Feature Fusion Network for the Evaluation of Osteosarcoma},
  booktitle = ICIP24,
  pages     = {2937--2943},
  year      = {2024},
  bibsource = {http://www.visionbib.com/bibliography/match-pl502mmf1.html#TT112364}
}

@inproceedings{bb115775,
  author    = {Bahaduri, B. and Ming, Z. H. and Feng, F. C. and Mokraoui, A.},
  title     = {Multimodal Transformer Using Cross-Channel Attention for Object Detection in Remote Sensing Images},
  booktitle = ICIP24,
  pages     = {2620--2626},
  year      = {2024},
  bibsource = {http://www.visionbib.com/bibliography/match-pl502mmf1.html#TT112365}
}

@inproceedings{bb115776,
  author    = {Gao, Z. X. and Jiang, X. and Xu, X. and Shen, F. M. and Li, Y. J. and Shen, H. T.},
  title     = {Embracing Unimodal Aleatoric Uncertainty for Robust Multimodal Fusion},
  booktitle = CVPR24,
  pages     = {26866--26875},
  year      = {2024},
  bibsource = {http://www.visionbib.com/bibliography/match-pl502mmf1.html#TT112366}
}

@inproceedings{bb115777,
        AUTHOR = "Jiang, H. and Karpur, A. and Cao, B. and Huang, Q. X. and Araujo, A.",
        TITLE = "{OmniGlue}: Generalizable Feature Matching with Foundation Model Guidance",
        BOOKTITLE = CVPR24,
        YEAR = "2024",
        PAGES = "19865--19875",
        BIBSOURCE = "http://www.visionbib.com/bibliography/match-pl502mmf1.html#TT112367"}

@inproceedings{bb115778,
        AUTHOR = "Yi, X. P. and Xu, H. and Zhang, H. and Tang, L. F. and Ma, J. Y.",
        TITLE = "{Text-IF}: Leveraging Semantic Text Guidance for Degradation-Aware and Interactive Image Fusion",
        BOOKTITLE = CVPR24,
        YEAR = "2024",
        PAGES = "27016--27025",
        BIBSOURCE = "http://www.visionbib.com/bibliography/match-pl502mmf1.html#TT112368"}

@inproceedings{bb115779,
        AUTHOR = "Vouitsis, N. and Liu, Z. Y. and Gorti, S. K. and Villecroze, V. and Cresswell, J. C. and Yu, G. and Loaiza Ganem, G. and Volkovs, M.",
        TITLE = "Data-Efficient Multimodal Fusion on a Single {GPU}",
        BOOKTITLE = CVPR24,
        YEAR = "2024",
        PAGES = "27229--27241",
        BIBSOURCE = "http://www.visionbib.com/bibliography/match-pl502mmf1.html#TT112369"}

@inproceedings{bb115780,
        AUTHOR = "Zhao, Z. X. and Bai, H. W. and Zhang, J. S. and Zhang, Y. and Zhang, K. and Xu, S. and Chen, D. D. and Timofte, R. and Van Gool, L. J.",
        TITLE = "Equivariant Multi-Modality Image Fusion",
        BOOKTITLE = CVPR24,
        YEAR = "2024",
        PAGES = "25912--25921",
        BIBSOURCE = "http://www.visionbib.com/bibliography/match-pl502mmf1.html#TT112370"}

@inproceedings{bb115781,
        AUTHOR = "Li, X. and Li, X. S. and Ye, T. and Cheng, X. Q. and Liu, W. Y. and Tan, H.",
        TITLE = "Bridging the Gap between Multi-focus and Multi-modal: A Focused Integration Framework for Multi-modal Image Fusion",
        BOOKTITLE = WACV24,
        YEAR = "2024",
        PAGES = "1617--1626",
        BIBSOURCE = "http://www.visionbib.com/bibliography/match-pl502mmf1.html#TT112371"}

@inproceedings{bb115782,
        AUTHOR = "Han, K. Y. and Cao, F. Z. and Shi, T. X. and Wang, P.",
        TITLE = "A Dual Attention Network for Multimodal Remote Sensing Image Matching",
        BOOKTITLE = CVIDL23,
        YEAR = "2023",
        PAGES = "128--134",
        BIBSOURCE = "http://www.visionbib.com/bibliography/match-pl502mmf1.html#TT112372"}

@inproceedings{bb115783,
        AUTHOR = "Liu, B. and Xu, Z. Q. and Bao, X. L. and Zhong, Z.",
        TITLE = "{MUNformer}: A strong encoder that uses multi-level features extracted by different feature extractors for fusion",
        BOOKTITLE = CVIDL23,
        YEAR = "2023",
        PAGES = "291--295",
        BIBSOURCE = "http://www.visionbib.com/bibliography/match-pl502mmf1.html#TT112373"}

@inproceedings{bb115784,
        AUTHOR = "He, C. M. and Li, K. and Xu, G. X. and Zhang, Y. and Hu, R. Z. and Guo, Z. H. and Li, X.",
        TITLE = "Degradation-Resistant Unfolding Network for Heterogeneous Image Fusion",
        BOOKTITLE = ICCV23,
        YEAR = "2023",
        PAGES = "12577--12587",
        BIBSOURCE = "http://www.visionbib.com/bibliography/match-pl502mmf1.html#TT112374"}

@inproceedings{bb115785,
        AUTHOR = "Liu, J. Y. and Liu, Z. and Wu, G. Y. and Ma, L. and Liu, R. S. and Zhong, W. and Luo, Z. X. and Fan, X.",
        TITLE = "Multi-interactive Feature Learning and a Full-time Multi-modality Benchmark for Image Fusion and Segmentation",
        BOOKTITLE = ICCV23,
        YEAR = "2023",
        PAGES = "8081--8090",
        BIBSOURCE = "http://www.visionbib.com/bibliography/match-pl502mmf1.html#TT112375"}

@inproceedings{bb115786,
        AUTHOR = "Sippel, F. and Seiler, J. and Kaup, A.",
        TITLE = "Cross Spectral Image Reconstruction Using a Deep Guided Neural Network",
        BOOKTITLE = ICIP23,
        YEAR = "2023",
        PAGES = "226--230",
        BIBSOURCE = "http://www.visionbib.com/bibliography/match-pl502mmf1.html#TT112376"}

@inproceedings{bb115787,
        AUTHOR = "Myers, A. and Kvinge, H. and Emerson, T.",
        TITLE = "{TopFusion}: Using Topological Feature Space for Fusion and Imputation in Multi-Modal Data",
        BOOKTITLE = TAG-PRA23,
        YEAR = "2023",
        PAGES = "600--609",
        BIBSOURCE = "http://www.visionbib.com/bibliography/match-pl502mmf1.html#TT112377"}

@inproceedings{bb115788,
        AUTHOR = "Xue, Z. and Marculescu, R.",
        TITLE = "Dynamic Multimodal Fusion",
        BOOKTITLE = MULA23,
        YEAR = "2023",
        PAGES = "2575--2584",
        BIBSOURCE = "http://www.visionbib.com/bibliography/match-pl502mmf1.html#TT112378"}

@inproceedings{bb115789,
        AUTHOR = "Li, X. and Ma, T. and Hou, Y. N. and Shi, B. and Yang, Y. C. and Liu, Y. and Wu, X. J. and Chen, Q. and Li, Y. K. and Qiao, Y. and He, L.",
        TITLE = "{LoGoNet}: Towards Accurate {3D} Object Detection with Local-to-Global Cross-Modal Fusion",
        BOOKTITLE = CVPR23,
        YEAR = "2023",
        PAGES = "17524--17534",
        BIBSOURCE = "http://www.visionbib.com/bibliography/match-pl502mmf1.html#TT112379"}

@inproceedings{bb115790,
        AUTHOR = "Kong, L. K. and Qi, X. S. and Shen, Q. J. and Wang, J. C. and Zhang, J. Y. and Hu, Y. and Zhou, Q. C.",
        TITLE = "Indescribable Multi-Modal Spatial Evaluator",
        BOOKTITLE = CVPR23,
        YEAR = "2023",
        PAGES = "9853--9862",
        BIBSOURCE = "http://www.visionbib.com/bibliography/match-pl502mmf1.html#TT112380"}

@inproceedings{bb115791,
        AUTHOR = "Zhao, Z. X. and Bai, H. W. and Zhang, J. S. and Zhang, Y. and Xu, S. and Lin, Z. and Timofte, R. and Van Gool, L. J.",
        TITLE = "{CDDFuse}: Correlation-Driven Dual-Branch Feature Decomposition for Multi-Modality Image Fusion",
        BOOKTITLE = CVPR23,
        YEAR = "2023",
        PAGES = "5906--5916",
        BIBSOURCE = "http://www.visionbib.com/bibliography/match-pl502mmf1.html#TT112381"}

@inproceedings{bb115792,
        AUTHOR = "Li, Y. W. and Quan, R. J. and Zhu, L. C. and Yang, Y.",
        TITLE = "Efficient Multimodal Fusion via Interactive Prompting",
        BOOKTITLE = CVPR23,
        YEAR = "2023",
        PAGES = "2604--2613",
        BIBSOURCE = "http://www.visionbib.com/bibliography/match-pl502mmf1.html#TT112382"}

@inproceedings{bb115793,
        AUTHOR = "Wetzer, E. and Lindblad, J. and Sladoje, N.",
        TITLE = "Can Representation Learning for Multimodal Image Registration be Improved by Supervision of Intermediate Layers?",
        BOOKTITLE = IbPRIA23,
        YEAR = "2023",
        PAGES = "261--275",
        BIBSOURCE = "http://www.visionbib.com/bibliography/match-pl502mmf1.html#TT112383"}

% NOTE(review): the Roman numeral XVIII was a prefix inside PAGES; it is assumed to be the proceedings part and is now stored in VOLUME -- confirm.
@inproceedings{bb115794,
        AUTHOR = "Huang, Z. B. and Liu, J. Y. and Fan, X. and Liu, R. S. and Zhong, W. and Luo, Z. X.",
        TITLE = "{ReCoNet}: Recurrent Correction Network for Fast and Efficient Multi-modality Image Fusion",
        BOOKTITLE = ECCV22,
        VOLUME = "XVIII",
        YEAR = "2022",
        PAGES = "539--555",
        BIBSOURCE = "http://www.visionbib.com/bibliography/match-pl502mmf1.html#TT112384"}

@inproceedings{bb115795,
        AUTHOR = "Duan, J. L. and Chen, L. Q. and Tran, S. and Yang, J. Y. and Xu, Y. and Zeng, B. and Chilimbi, T.",
        TITLE = "Multi-modal Alignment using Representation Codebook",
        BOOKTITLE = CVPR22,
        YEAR = "2022",
        PAGES = "15630--15639",
        BIBSOURCE = "http://www.visionbib.com/bibliography/match-pl502mmf1.html#TT112385"}

@inproceedings{bb115796,
        AUTHOR = "Xue, Z. H. and Ren, S. C. and Gao, Z. Q. and Zhao, H.",
        TITLE = "Multimodal Knowledge Expansion",
        BOOKTITLE = ICCV21,
        YEAR = "2021",
        PAGES = "834--843",
        BIBSOURCE = "http://www.visionbib.com/bibliography/match-pl502mmf1.html#TT112386"}

@inproceedings{bb115797,
        AUTHOR = "Zolfaghari, M. and Zhu, Y. and Gehler, P. and Brox, T.",
        TITLE = "{CrossCLR}: Cross-modal Contrastive Learning For Multi-modal Video Representations",
        BOOKTITLE = ICCV21,
        YEAR = "2021",
        PAGES = "1430--1439",
        BIBSOURCE = "http://www.visionbib.com/bibliography/match-pl502mmf1.html#TT112387"}

@inproceedings{bb115798,
        AUTHOR = "Piergiovanni, A. J. and Casser, V. and Ryoo, M. S. and Angelova, A.",
        TITLE = "{4D-Net} for Learned Multi-Modal Alignment",
        BOOKTITLE = ICCV21,
        YEAR = "2021",
        PAGES = "15415--15425",
        BIBSOURCE = "http://www.visionbib.com/bibliography/match-pl502mmf1.html#TT112388"}

@inproceedings{bb115799,
        AUTHOR = "Yang, J. H. and Huang, Y. and Ma, Z. Y. and Wang, L.",
        TITLE = "{CMF}: Cascaded Multi-Model Fusion for Referring Image Segmentation",
        BOOKTITLE = ICIP21,
        YEAR = "2021",
        PAGES = "2289--2293",
        BIBSOURCE = "http://www.visionbib.com/bibliography/match-pl502mmf1.html#TT112389"}

Last update: Feb 26, 2026 at 10:58:24