@article{bb243300,
  author    = {Niu, K. and Huang, Y. and Wang, L.},
  title     = {Re-ranking image-text matching by adaptive metric fusion},
  journal   = PR,
  volume    = {104},
  year      = {2020},
  pages     = {107351},
  bibsource = {http://www.visionbib.com/bibliography/applicat803imt4.html#TT238214},
}

@article{bb243301,
  author    = {Huang, Y. and Wang, Y. M. and Zeng, Y. and Huang, J. S. and Chai, Z. H. and Wang, L.},
  title     = {Unpaired Image-Text Matching via Multimodal Aligned Conceptual Knowledge},
  journal   = PAMI,
  volume    = {47},
  year      = {2025},
  number    = {7},
  month     = jul,
  pages     = {5160--5176},
  bibsource = {http://www.visionbib.com/bibliography/applicat803imt4.html#TT238215},
}

@article{bb243302,
  author    = {Wen, K. Y. and Gu, X. D. and Cheng, Q. R.},
  title     = {Learning Dual Semantic Relations With Graph Attention for Image-Text Matching},
  journal   = CirSysVideo,
  volume    = {31},
  year      = {2021},
  number    = {7},
  month     = jul,
  pages     = {2866--2879},
  bibsource = {http://www.visionbib.com/bibliography/applicat803imt4.html#TT238216},
}

@article{bb243303,
  author    = {Yang, S. and Li, Q. and Li, W. H. and Li, X. Y. and Liu, A. A.},
  title     = {Dual-Level Representation Enhancement on Characteristic and Context for Image-Text Retrieval},
  journal   = CirSysVideo,
  volume    = {32},
  year      = {2022},
  number    = {11},
  month     = nov,
  pages     = {8037--8050},
  bibsource = {http://www.visionbib.com/bibliography/applicat803imt4.html#TT238217},
}

@article{bb243304,
  author    = {Jing, Y. and Wang, W. and Wang, L. and Tan, T. N.},
  title     = {Learning Aligned Image-Text Representations Using Graph Attentive Relational Network},
  journal   = IP,
  volume    = {30},
  year      = {2021},
  pages     = {1840--1852},
  bibsource = {http://www.visionbib.com/bibliography/applicat803imt4.html#TT238218},
}

@inproceedings{bb243305,
  author    = {Zhao, F. and Huang, Y. Z. and Wang, L. and Tan, T. N.},
  title     = {Deep Semantic Ranking Based Hashing for Multi-Label Image Retrieval},
  booktitle = CVPR15,
  year      = {2015},
  pages     = {1556--1564},
  bibsource = {http://www.visionbib.com/bibliography/applicat803imt4.html#TT238219},
}

@article{bb243306,
  author    = {Lan, H. and Zhang, P.},
  title     = {Learning and Integrating Multi-Level Matching Features for Image-Text Retrieval},
  journal   = SPLetters,
  volume    = {29},
  year      = {2022},
  pages     = {374--378},
  bibsource = {http://www.visionbib.com/bibliography/applicat803imt4.html#TT238220},
}

@article{bb243307,
  author    = {Wu, J. and Wu, C. L. and Lu, J. and Wang, L. Q. and Cui, X. R.},
  title     = {Region Reinforcement Network With Topic Constraint for Image-Text Matching},
  journal   = CirSysVideo,
  volume    = {32},
  year      = {2022},
  number    = {1},
  month     = jan,
  pages     = {388--397},
  bibsource = {http://www.visionbib.com/bibliography/applicat803imt4.html#TT238221},
}

@article{bb243308,
  author    = {Malali, N. and Keller, Y.},
  title     = {Learning to Embed Semantic Similarity for Joint Image-Text Retrieval},
  journal   = PAMI,
  volume    = {44},
  year      = {2022},
  number    = {12},
  month     = dec,
  pages     = {10252--10260},
  bibsource = {http://www.visionbib.com/bibliography/applicat803imt4.html#TT238222},
}

@article{bb243309,
  author    = {Tian, M. X. and Wu, X. X. and Jia, Y. D.},
  title     = {Adaptive Latent Graph Representation Learning for Image-Text Matching},
  journal   = IP,
  volume    = {32},
  year      = {2023},
  pages     = {471--482},
  bibsource = {http://www.visionbib.com/bibliography/applicat803imt4.html#TT238223},
}

@article{bb243310,
  author    = {Li, K. P. and Zhang, Y. L. and Li, K. and Li, Y. Y. and Fu, Y.},
  title     = {Image-Text Embedding Learning via Visual and Textual Semantic Reasoning},
  journal   = PAMI,
  volume    = {45},
  year      = {2023},
  number    = {1},
  month     = jan,
  pages     = {641--656},
  bibsource = {http://www.visionbib.com/bibliography/applicat803imt4.html#TT238224},
}

@inproceedings{bb243311,
  author    = {Li, K. P. and Zhang, Y. L. and Li, K. and Li, Y. Y. and Fu, Y.},
  title     = {Visual Semantic Reasoning for Image-Text Matching},
  booktitle = ICCV19,
  year      = {2019},
  pages     = {4653--4661},
  bibsource = {http://www.visionbib.com/bibliography/applicat803imt4.html#TT238225},
}

@article{bb243312,
  author    = {Diao, H. W. and Zhang, Y. and Liu, W. and Ruan, X. and Lu, H. C.},
  title     = {Plug-and-Play Regulators for Image-Text Matching},
  journal   = IP,
  volume    = {32},
  year      = {2023},
  pages     = {2322--2334},
  bibsource = {http://www.visionbib.com/bibliography/applicat803imt4.html#TT238226},
}

@article{bb243313,
  author    = {Tian, Y. M. and Ding, A. and Wang, D. and Luo, X. M. and Wan, B. and Wang, Y. F.},
  title     = {Bi-Attention enhanced representation learning for image-text matching},
  journal   = PR,
  volume    = {140},
  year      = {2023},
  pages     = {109548},
  bibsource = {http://www.visionbib.com/bibliography/applicat803imt4.html#TT238227},
}

@article{bb243314,
  author    = {Zhang, K. and Mao, Z. D. and Liu, A. A. and Zhang, Y. D.},
  title     = {Unified Adaptive Relevance Distinguishable Attention Network for Image-Text Matching},
  journal   = MultMed,
  volume    = {25},
  year      = {2023},
  pages     = {1320--1332},
  bibsource = {http://www.visionbib.com/bibliography/applicat803imt4.html#TT238228},
}

@article{bb243315,
  author    = {Xiong, G. X. and Meng, M. and Zhang, T. Z. and Zhang, D. M. and Zhang, Y. D.},
  title     = {Reference-Aware Adaptive Network for Image-Text Matching},
  journal   = CirSysVideo,
  volume    = {34},
  year      = {2024},
  number    = {10},
  month     = oct,
  pages     = {9678--9691},
  bibsource = {http://www.visionbib.com/bibliography/applicat803imt4.html#TT238229},
}

@article{bb243316,
  author    = {Liu, Z. J. and Chen, F. L. and Xu, J. and Pei, W. J. and Lu, G. M.},
  title     = {Image-Text Retrieval With Cross-Modal Semantic Importance Consistency},
  journal   = CirSysVideo,
  volume    = {33},
  year      = {2023},
  number    = {5},
  month     = may,
  pages     = {2465--2476},
  bibsource = {http://www.visionbib.com/bibliography/applicat803imt4.html#TT238230},
}

@article{bb243317,
  author    = {Shang, H. and Zhao, G. S. and Shi, J. and Qian, X. M.},
  title     = {A Multiview Text Imagination Network Based on Latent Alignment for Image-Text Matching},
  journal   = IEEE_Int_Sys,
  volume    = {38},
  year      = {2023},
  number    = {3},
  month     = may,
  pages     = {41--50},
  bibsource = {http://www.visionbib.com/bibliography/applicat803imt4.html#TT238231},
}

@article{bb243318,
  author    = {Liu, C. and Zhang, Y. Q. and Wang, H. S. and Chen, W. H. and Wang, F. and Huang, Y. and Shen, Y. D. and Wang, L.},
  title     = {Efficient Token-Guided Image-Text Retrieval With Consistent Multimodal Contrastive Training},
  journal   = IP,
  volume    = {32},
  year      = {2023},
  pages     = {3622--3633},
  bibsource = {http://www.visionbib.com/bibliography/applicat803imt4.html#TT238232},
}

@article{bb243319,
  author    = {Li, W. R. and Ma, Z. Y. and Deng, L. J. and Fan, X. P. and Tian, Y. H.},
  title     = {Neuron-Based Spiking Transmission and Reasoning Network for Robust Image-Text Retrieval},
  journal   = CirSysVideo,
  volume    = {33},
  year      = {2023},
  number    = {7},
  month     = jul,
  pages     = {3516--3528},
  bibsource = {http://www.visionbib.com/bibliography/applicat803imt4.html#TT238233},
}

@article{bb243320,
  author    = {Li, W. R. and Ma, Z. Y. and Shi, J. Q. and Fan, X. P.},
  title     = {The Style Transformer With Common Knowledge Optimization for Image-Text Retrieval},
  journal   = SPLetters,
  volume    = {30},
  year      = {2023},
  pages     = {1197--1201},
  bibsource = {http://www.visionbib.com/bibliography/applicat803imt4.html#TT238234},
}

@article{bb243321,
  author    = {Zhu, H. G. and Zhang, C. J. and Wei, Y. C. and Huang, S. and Zhao, Y.},
  title     = {{ESA}: External Space Attention Aggregation for Image-Text Retrieval},
  journal   = CirSysVideo,
  volume    = {33},
  year      = {2023},
  number    = {10},
  month     = oct,
  pages     = {6131--6143},
  bibsource = {http://www.visionbib.com/bibliography/applicat803imt4.html#TT238235},
}

@article{bb243322,
  author    = {Li, Z. and Guo, C. and Feng, Z. and Hwang, J. N. and Du, Z. T.},
  title     = {Integrating Language Guidance Into Image-Text Matching for Correcting False Negatives},
  journal   = MultMed,
  volume    = {26},
  year      = {2024},
  pages     = {103--116},
  bibsource = {http://www.visionbib.com/bibliography/applicat803imt4.html#TT238236},
}

@article{bb243323,
  author    = {Zhang, Y. and Ji, Z. and Wang, D. and Pang, Y. W. and Li, X. L.},
  title     = {{USER}: Unified Semantic Enhancement With Momentum Contrast for Image-Text Retrieval},
  journal   = IP,
  volume    = {33},
  year      = {2024},
  pages     = {595--609},
  bibsource = {http://www.visionbib.com/bibliography/applicat803imt4.html#TT238237},
}

@article{bb243324,
  author    = {Zhuang, J. and Yu, J. and Ding, Y. and Qu, X. Y. and Hu, Y.},
  title     = {Towards Fast and Accurate Image-Text Retrieval With Self-Supervised Fine-Grained Alignment},
  journal   = MultMed,
  volume    = {26},
  year      = {2024},
  pages     = {1361--1372},
  bibsource = {http://www.visionbib.com/bibliography/applicat803imt4.html#TT238238},
}

@article{bb243325,
  author    = {Liu, X. and He, Y. and Cheung, Y. M. and Xu, X. and Wang, N. N.},
  title     = {Learning Relationship-Enhanced Semantic Graph for Fine-Grained Image-Text Matching},
  journal   = Cyber,
  volume    = {54},
  year      = {2024},
  number    = {2},
  month     = feb,
  pages     = {948--961},
  bibsource = {http://www.visionbib.com/bibliography/applicat803imt4.html#TT238239},
}

@article{bb243326,
  author    = {Li, W. H. and Yang, S. and Li, Q. and Li, X. Y. and Liu, A. A.},
  title     = {Commonsense-Guided Semantic and Relational Consistencies for Image-Text Retrieval},
  journal   = MultMed,
  volume    = {26},
  year      = {2024},
  pages     = {1867--1880},
  bibsource = {http://www.visionbib.com/bibliography/applicat803imt4.html#TT238240},
}

@article{bb243327,
  author    = {Wu, D. Q. and Li, H. H. and Gu, C. and Liu, H. and Xu, C. and Hou, Y. X. and Guo, L.},
  title     = {Feature First: Advancing Image-Text Retrieval Through Improved Visual Features},
  journal   = MultMed,
  volume    = {26},
  year      = {2024},
  pages     = {3827--3841},
  bibsource = {http://www.visionbib.com/bibliography/applicat803imt4.html#TT238241},
}

@article{bb243328,
  author    = {Yang, R. and Wang, S. and Gu, Y. and Wang, J. H. and Sun, Y. Z. and Zhang, H. and Liao, Y. and Jiao, L. C.},
  title     = {Continual Learning for Cross-Modal Image-Text Retrieval Based on Domain-Selective Attention},
  journal   = PR,
  volume    = {149},
  year      = {2024},
  pages     = {110273},
  bibsource = {http://www.visionbib.com/bibliography/applicat803imt4.html#TT238242},
}

@article{bb243329,
  author    = {Pan, R. J. and Yang, H. and Li, C. and Yang, J. H.},
  title     = {Joint Intra \& Inter-Grained Reasoning: A New Look Into Semantic Consistency of Image-Text Retrieval},
  journal   = MultMed,
  volume    = {26},
  year      = {2024},
  pages     = {4912--4925},
  bibsource = {http://www.visionbib.com/bibliography/applicat803imt4.html#TT238243},
}

@article{bb243330,
  author    = {Zhang, K. and Hu, B. and Zhang, H. and Li, Z. and Mao, Z. D.},
  title     = {Enhanced Semantic Similarity Learning Framework for Image-Text Matching},
  journal   = CirSysVideo,
  volume    = {34},
  year      = {2024},
  number    = {4},
  month     = apr,
  pages     = {2973--2988},
  bibsource = {http://www.visionbib.com/bibliography/applicat803imt4.html#TT238244},
}

@inproceedings{bb243331,
  author    = {Fu, Z. R. and Mao, Z. D. and Song, Y. and Zhang, Y. D.},
  title     = {Learning Semantic Relationship among Instances for Image-Text Matching},
  booktitle = CVPR23,
  year      = {2023},
  pages     = {15159--15168},
  bibsource = {http://www.visionbib.com/bibliography/applicat803imt4.html#TT238245},
}

@article{bb243332,
  author    = {Diao, H. and Zhang, Y. and Gao, S. and Ruan, X. and Lu, H. C.},
  title     = {Deep Boosting Learning: A Brand-New Cooperative Approach for Image-Text Matching},
  journal   = IP,
  volume    = {33},
  year      = {2024},
  pages     = {3341--3352},
  bibsource = {http://www.visionbib.com/bibliography/applicat803imt4.html#TT238246},
}

@inproceedings{bb243333,
  author    = {Zhang, Y. and Lu, H. C.},
  title     = {Deep Cross-Modal Projection Learning for Image-Text Matching},
  booktitle = ECCV18,
  year      = {2018},
  pages     = {I: 707--723},
  bibsource = {http://www.visionbib.com/bibliography/applicat803imt4.html#TT238247},
}

@article{bb243334,
  author    = {Cao, M. and Bai, Y. and Cao, Z. Q. and Nie, L. Q. and Zhang, M.},
  title     = {Efficient Image-Text Retrieval via Keyword-Guided Pre-Screening},
  journal   = CirSysVideo,
  volume    = {34},
  year      = {2024},
  number    = {6},
  month     = jun,
  pages     = {5132--5145},
  bibsource = {http://www.visionbib.com/bibliography/applicat803imt4.html#TT238248},
}

@article{bb243335,
  author    = {Li, Z. and Zhang, L. and Zhang, K. and Zhang, Y. D. and Mao, Z. D.},
  title     = {Improving Image-Text Matching With Bidirectional Consistency of Cross-Modal Alignment},
  journal   = CirSysVideo,
  volume    = {34},
  year      = {2024},
  number    = {7},
  month     = jul,
  pages     = {6590--6607},
  bibsource = {http://www.visionbib.com/bibliography/applicat803imt4.html#TT238249},
}

@article{bb243336,
  author    = {Li, Z. and Zhang, L. and Zhang, K. and Zhang, Y. D. and Mao, Z. D.},
  title     = {Fast, Accurate, and Lightweight Memory-Enhanced Embedding Learning Framework for Image-Text Retrieval},
  journal   = CirSysVideo,
  volume    = {34},
  year      = {2024},
  number    = {7},
  month     = jul,
  pages     = {6542--6558},
  bibsource = {http://www.visionbib.com/bibliography/applicat803imt4.html#TT238250},
}

@article{bb243337,
  author    = {Cui, Z. and Hu, Y. L. and Sun, Y. F. and Yin, B. C.},
  title     = {Context-aware relation enhancement and similarity reasoning for image-text retrieval},
  journal   = IET-CV,
  volume    = {18},
  year      = {2024},
  number    = {5},
  pages     = {652--665},
  bibsource = {http://www.visionbib.com/bibliography/applicat803imt4.html#TT238251},
}

@article{bb243338,
  author    = {Pan, Z. X. and Mao, Y. C. and Xiong, L. and Pang, T. F. and Ping, P.},
  title     = {{MFAE}: Multimodal Fusion and Alignment for Entity-level Disinformation Detection},
  journal   = PRL,
  volume    = {184},
  year      = {2024},
  pages     = {59--65},
  bibsource = {http://www.visionbib.com/bibliography/applicat803imt4.html#TT238252},
}

@article{bb243339,
  author    = {Pu, X. and Wang, Z. W. and Yuan, L. and Wu, Y. and Jing, L. P. and Gao, X. B.},
  title     = {{GADNet}: Improving image-text matching via graph-based aggregation and disentanglement},
  journal   = PR,
  volume    = {157},
  year      = {2025},
  pages     = {110900},
  bibsource = {http://www.visionbib.com/bibliography/applicat803imt4.html#TT238253},
}

@article{bb243340,
  author    = {Pu, X. and Yang, P. and Yuan, L. and Gao, X. B.},
  title     = {Improving Image-Text Matching by Integrating Word Sense Disambiguation},
  journal   = SPLetters,
  volume    = {31},
  year      = {2024},
  pages     = {2695--2699},
  bibsource = {http://www.visionbib.com/bibliography/applicat803imt4.html#TT238254},
}

@article{bb243341,
  author    = {Li, W. R. and Xiong, R. Q. and Fan, X. P.},
  title     = {Multi-Layer Probabilistic Association Reasoning Network for Image-Text Retrieval},
  journal   = CirSysVideo,
  volume    = {34},
  year      = {2024},
  number    = {10},
  month     = oct,
  pages     = {9706--9717},
  bibsource = {http://www.visionbib.com/bibliography/applicat803imt4.html#TT238255},
}

@article{bb243342,
  author    = {Tian, M. X. and Yang, S. and Wu, X. X. and Jia, Y. D.},
  title     = {Source-Free Image-Text Matching via Uncertainty-Aware Learning},
  journal   = SPLetters,
  volume    = {31},
  year      = {2024},
  pages     = {3059--3063},
  bibsource = {http://www.visionbib.com/bibliography/applicat803imt4.html#TT238256},
}

@article{bb243343,
  author    = {Wang, D. and Tian, J. and Liang, X. and Tian, Y. M. and He, L. H.},
  title     = {Global-aware Fragment Representation Aggregation Network for image-text retrieval},
  journal   = PR,
  volume    = {159},
  year      = {2025},
  pages     = {111085},
  bibsource = {http://www.visionbib.com/bibliography/applicat803imt4.html#TT238257},
}

@article{bb243344,
  author    = {Ke, X. and Chen, B. T. and Yang, X. and Cai, Y. H. and Liu, H. and Guo, W. Z.},
  title     = {Cross-modal independent matching network for image-text retrieval},
  journal   = PR,
  volume    = {159},
  year      = {2025},
  pages     = {111096},
  bibsource = {http://www.visionbib.com/bibliography/applicat803imt4.html#TT238258},
}

@article{bb243345,
  author    = {Li, Z. and Guo, C. and Wang, X. and Feng, Z. and Du, Z. T.},
  title     = {Selectively Hard Negative Mining for Alleviating Gradient Vanishing in Image-Text Matching},
  journal   = CirSysVideo,
  volume    = {35},
  year      = {2025},
  number    = {2},
  month     = feb,
  pages     = {1921--1935},
  bibsource = {http://www.visionbib.com/bibliography/applicat803imt4.html#TT238259},
}

@article{bb243346,
  author    = {Yang, X. Y. and Li, C. and Wang, Z. M. and Xie, H. and Mao, J. and Yin, G. Q.},
  title     = {Remote Sensing Cross-Modal Text-Image Retrieval Based on Attention Correction and Filtering},
  journal   = RS,
  volume    = {17},
  year      = {2025},
  number    = {3},
  pages     = {503},
  bibsource = {http://www.visionbib.com/bibliography/applicat803imt4.html#TT238260},
}

@article{bb243347,
  author    = {Wu, D. Q. and Li, H. H. and Gu, C. and Guo, L. and Liu, H.},
  title     = {Dual Stream Relation Learning Network for Image-Text Retrieval},
  journal   = MultMed,
  volume    = {27},
  year      = {2025},
  pages     = {1551--1565},
  bibsource = {http://www.visionbib.com/bibliography/applicat803imt4.html#TT238261},
}

@article{bb243348,
  author    = {Liu, Z. and Xu, J. H. and Gao, S. S. and Chen, Z.},
  title     = {{CSA}: Cross-scale alignment with adaptive semantic aggregation and filter for image-text retrieval},
  journal   = PR,
  volume    = {165},
  year      = {2025},
  pages     = {111647},
  bibsource = {http://www.visionbib.com/bibliography/applicat803imt4.html#TT238262},
}

@article{bb243349,
  author    = {Zhang, Q. and Wang, D. and Yu, X.},
  title     = {{RLita}: A Region-Level Image-Text Alignment Method for Remote Sensing Foundation Model},
  journal   = RS,
  volume    = {17},
  year      = {2025},
  number    = {10},
  pages     = {1661},
  bibsource = {http://www.visionbib.com/bibliography/applicat803imt4.html#TT238263},
}

@article{bb243350,
  author    = {Wen, Z. T. and Liu, J. H. and Zhang, H. and Zuo, F. Y.},
  title     = {Exploring Fine-Grained Visual-Text Feature Alignment With Prompt Tuning for Domain-Adaptive Object Detection},
  journal   = Cyber,
  volume    = {55},
  year      = {2025},
  number    = {7},
  month     = jul,
  pages     = {3220--3233},
  bibsource = {http://www.visionbib.com/bibliography/applicat803imt4.html#TT238264},
}

@article{bb243351,
  author    = {Guan, J. H. and Shu, Y. and Li, W. and Song, Z. and Zhang, Y. C.},
  title     = {{PR-CLIP}: Cross-Modal Positional Reconstruction for Remote Sensing Image-Text Retrieval},
  journal   = RS,
  volume    = {17},
  year      = {2025},
  number    = {13},
  pages     = {2117},
  bibsource = {http://www.visionbib.com/bibliography/applicat803imt4.html#TT238265},
}

@article{bb243352,
  author    = {Song, Z. and Shu, Y. and Li, W. and Guan, J. H. and Zhang, Y. C.},
  title     = {Towards Discriminative and Consistent Cross-Modal Alignment for Remote Sensing Image-Text Retrieval},
  journal   = RS,
  volume    = {18},
  year      = {2026},
  number    = {4},
  pages     = {662},
  bibsource = {http://www.visionbib.com/bibliography/applicat803imt4.html#TT238266},
}

@article{bb243353,
  author    = {Zhao, H. and Li, Z. Y. and Wang, S. and Zhang, Z. X. and Li, K. Q.},
  title     = {Robust Hashing With Bilinear Drift for Image-Text Retrieval},
  journal   = CirSysVideo,
  volume    = {35},
  year      = {2025},
  number    = {8},
  month     = aug,
  pages     = {7642--7654},
  bibsource = {http://www.visionbib.com/bibliography/applicat803imt4.html#TT238267},
}

@article{bb243354,
  author    = {Wang, P. Z. and Zhang, L. and Mao, Z. D. and Lyu, N. and Zhang, Y. D.},
  title     = {Matryoshka Learning With Metric Transfer for Image-Text Matching},
  journal   = CirSysVideo,
  volume    = {35},
  year      = {2025},
  number    = {9},
  month     = sep,
  pages     = {9502--9516},
  bibsource = {http://www.visionbib.com/bibliography/applicat803imt4.html#TT238268},
}

@article{bb243355,
  author    = {Koo, H. and Shin, J. and Kim, E.},
  title     = {Dual-branch scale disentanglement for text-video retrieval},
  journal   = PRL,
  volume    = {196},
  year      = {2025},
  pages     = {296--302},
  bibsource = {http://www.visionbib.com/bibliography/applicat803imt4.html#TT238269},
}

@article{bb243356,
  author    = {Zhou, J. and Wang, M.},
  title     = {Unified learning for image-text alignment via multi-scale feature fusion},
  journal   = CVIU,
  volume    = {260},
  year      = {2025},
  pages     = {104468},
  bibsource = {http://www.visionbib.com/bibliography/applicat803imt4.html#TT238270},
}

@article{bb243357,
  author    = {Wen, J. and Chen, Y. F. and Shi, R. Q. and Ji, W. and Yang, M. L. and Gao, D. F. and Yuan, J. S. and Zimmermann, R.},
  title     = {{HOVER}: Hyperbolic Video-Text Retrieval},
  journal   = IP,
  volume    = {34},
  year      = {2025},
  pages     = {6192--6203},
  bibsource = {http://www.visionbib.com/bibliography/applicat803imt4.html#TT238271},
}

@article{bb243358,
  author    = {Fang, J. Y. and Zhu, B. and Yuan, J. L. and Chen, Y. Y. and Tang, M. and Wang, J. Q.},
  title     = {{AMITA}: Attribute-Guided Masked Image-Text Alignment for Multi-Label Image Representation},
  journal   = CirSysVideo,
  volume    = {35},
  year      = {2025},
  number    = {11},
  month     = nov,
  pages     = {11432--11447},
  bibsource = {http://www.visionbib.com/bibliography/applicat803imt4.html#TT238272},
}

@article{bb243359,
  author    = {Ji, L. L. and Liu, L.},
  title     = {Multi-Scale Feature Fusion Based on Piecewise Polynomial Activation Function for Image-Text Matching},
  journal   = CirSysVideo,
  volume    = {35},
  year      = {2025},
  number    = {11},
  month     = nov,
  pages     = {11627--11640},
  bibsource = {http://www.visionbib.com/bibliography/applicat803imt4.html#TT238273},
}

@article{bb243360,
  author    = {Chen, R. and Su, T. and Wang, H. and Ni, Z. K.},
  title     = {Similarity Shuffled Criss-Cross Transformer With Angle Loss for Image-Text Matching},
  journal   = MultMed,
  volume    = {27},
  year      = {2025},
  pages     = {9723--9734},
  bibsource = {http://www.visionbib.com/bibliography/applicat803imt4.html#TT238274},
}

@article{bb243361,
  author    = {Chen, D. and Wang, Y. T. and Xie, Y. Z. and Chen, S. Y. and Peng, W. L. and Tang, M. and Fang, M. and Chen, C. L. P. and Li, P. and Zhang, W.},
  title     = {Intra-modal consistency for image-text retrieval through soft-label distillation},
  journal   = PR,
  volume    = {173},
  year      = {2026},
  pages     = {112817},
  bibsource = {http://www.visionbib.com/bibliography/applicat803imt4.html#TT238275},
}

@article{bb243362,
  author    = {Shi, Z. X. and Ding, Y. and Dong, J. Y. and Zhang, T. Z.},
  title     = {Beyond One and Two Tower: Cross-Modal Consensus Learning for Image-Text Retrieval},
  journal   = CirSysVideo,
  volume    = {36},
  year      = {2026},
  number    = {2},
  month     = feb,
  pages     = {2581--2593},
  bibsource = {http://www.visionbib.com/bibliography/applicat803imt4.html#TT238276},
}

@article{bb243363,
  author    = {Wang, H. C. and Liu, L. and Zhang, H. X. and Zhu, L. and Chang, X. J. and Du, H.},
  title     = {{VisualRAG}: Knowledge-Guided Retrieval Augmentation for Image-Text Matching},
  journal   = CirSysVideo,
  volume    = {36},
  year      = {2026},
  number    = {1},
  month     = jan,
  pages     = {1234--1248},
  bibsource = {http://www.visionbib.com/bibliography/applicat803imt4.html#TT238277},
}

@article{bb243364,
  author    = {Zhang, D. L. and Wang, Z. W. and Wu, X. J. and Kittler, J. V.},
  title     = {{HACG}: Leveraging Hierarchical Alignment and Caption Generation for Text-Video Retrieval},
  journal   = IJCV,
  volume    = {134},
  year      = {2026},
  number    = {1},
  month     = jan,
  pages     = {93},
  bibsource = {http://www.visionbib.com/bibliography/applicat803imt4.html#TT238278},
}

@article{bb243365,
  author    = {Zhang, B. and Wu, H.},
  title     = {Test-Time Candidate-Aware Dual Refinement for Remote Sensing Image-Text Retrieval},
  journal   = RS,
  volume    = {18},
  year      = {2026},
  number    = {9},
  pages     = {1389},
  bibsource = {http://www.visionbib.com/bibliography/applicat803imt4.html#TT238279},
}

@article{bb243366,
  author    = {Wang, Z. and Xu, X. and Zhu, L. and Song, J. K. and Yang, Y. and Shen, H. T.},
  title     = {Distribution-to-Points Matching for Image Text Retrieval},
  journal   = PAMI,
  volume    = {48},
  year      = {2026},
  number    = {6},
  month     = jun,
  pages     = {7097--7111},
  bibsource = {http://www.visionbib.com/bibliography/applicat803imt4.html#TT238280},
}

@article{bb243367,
  author    = {Huang, J. and Chen, Y. X. and Du, C. and Xiong, S. W. and Lu, X. Q.},
  title     = {{ReCoTR}: Reducing Semantic Cognitive Shift via Dual-Consensus Token Compression for Remote Sensing Image-Text Retrieval},
  journal   = IP,
  volume    = {35},
  year      = {2026},
  pages     = {5017--5031},
  bibsource = {http://www.visionbib.com/bibliography/applicat803imt4.html#TT238281},
}

@article{bb243368,
  author    = {Wang, K. and Hu, Y. P. and Liu, H. and Jie, L. R. and Nie, L. Q.},
  title     = {Redundancy Mitigation: Toward Accurate and Efficient Image-Text Retrieval},
  journal   = CirSysVideo,
  volume    = {36},
  year      = {2026},
  number    = {5},
  month     = may,
  pages     = {7155--7167},
  bibsource = {http://www.visionbib.com/bibliography/applicat803imt4.html#TT238282},
}

@inproceedings{bb243369,
  author    = {Vongala, M. R. and Srivastava, S. and Kosecka, J.},
  title     = {Compositional Image-Text Matching and Retrieval by Grounding Entities},
  booktitle = {MULA25},
  year      = {2025},
  pages     = {241--250},
  bibsource = {http://www.visionbib.com/bibliography/applicat803imt4.html#TT238283},
}

@inproceedings{bb243370,
  author    = {Zhang, Z. C. and Li, X. Y. and Sun, W. and Zhang, Z. C. and Li, Y. H. and Liu, X. H. and Zhai, G. T.},
  title     = {Leveraging Multimodal Large Language Models for Joint Discrete and Continuous Evaluation in Text-to-Image Alignment},
  booktitle = NTIRE25,
  year      = {2025},
  pages     = {968--977},
  bibsource = {http://www.visionbib.com/bibliography/applicat803imt4.html#TT238284},
}

@inproceedings{bb243371,
  author    = {Zhang, Z. J. and Zheng, X. H. and Wu, X. C. and Peng, C. and Cao, X. Z.},
  title     = {{Tokenfocus-VQA}: Enhancing Text-to-Image Alignment with Position-Aware Focus and Multi-Perspective Aggregations on {LVLMs}},
  booktitle = NTIRE25,
  year      = {2025},
  pages     = {1270--1279},
  bibsource = {http://www.visionbib.com/bibliography/applicat803imt4.html#TT238285},
}

@inproceedings{bb243372,
  author    = {Yue, X. and Sun, J. and Lu, J. and Yao, L. C. and Xia, F. and Wang, T. Y. and Rao, F. Y. and Lyu, J. and Deng, Y.},
  title     = {Instruction-Augmented Multimodal Alignment for Image-Text and Element Matching},
  booktitle = NTIRE25,
  year      = {2025},
  pages     = {1370--1379},
  bibsource = {http://www.visionbib.com/bibliography/applicat803imt4.html#TT238286},
}

@inproceedings{bb243373,
  author    = {Lai, H. and Xiong, G. X. and Mai, H. Y. and Liu, X. and Zhang, T. Z.},
  title     = {Rethinking Noisy Video-Text Retrieval via Relation-aware Alignment},
  booktitle = CVPR25,
  year      = {2025},
  pages     = {9231--9241},
  bibsource = {http://www.visionbib.com/bibliography/applicat803imt4.html#TT238287},
}

@inproceedings{bb243374,
  author    = {Kim, D. and Piergiovanni, A. and Mallya, G. and Angelova, A.},
  title     = {{VideoComp}: Advancing Fine-Grained Compositional and Temporal Alignment in Video-Text Models},
  booktitle = CVPR25,
  year      = {2025},
  pages     = {29060--29070},
  bibsource = {http://www.visionbib.com/bibliography/applicat803imt4.html#TT238288},
}

@inproceedings{bb243375,
  author    = {Shen, L. and Gong, G. Q. and Hao, T. X. and He, T. and Zhang, Y. F. and Liu, P. Z. and Zhao, S. C. and Han, J. G. and Ding, G.},
  title     = {{DiscoVLA}: Discrepancy Reduction in Vision, Language, and Alignment for Parameter-Efficient Video-Text Retrieval},
  booktitle = CVPR25,
  year      = {2025},
  pages     = {19702--19712},
  bibsource = {http://www.visionbib.com/bibliography/applicat803imt4.html#TT238289},
}

@inproceedings{bb243376,
  author    = {Jin, Z. X. and Xu, X. W. and Wang, X. D.},
  title     = {{MADA}: Multi-Window Attention and Dual-Alignment for Image-Text Retrieval},
  booktitle = ICIVC24,
  year      = {2024},
  pages     = {240--245},
  bibsource = {http://www.visionbib.com/bibliography/applicat803imt4.html#TT238290},
}

@inproceedings{bb243377,
  author    = {Xie, C. W. and Sun, S. Y. and Zhao, L. M. and Li, P. and Ma, S. and Zheng, Y.},
  title     = {Fuseteacher: Modality-fused Encoders are Strong Vision Supervisors},
  booktitle = ECCV24,
  year      = {2024},
  pages     = {XLVIII: 287--304},
  bibsource = {http://www.visionbib.com/bibliography/applicat803imt4.html#TT238291},
}

@inproceedings{bb243378,
        AUTHOR = "Kim, W. and Chun, S. and Kim, T. and Han, D. Y. and Yun, S.",
        TITLE = "{HYPE}: Hyperbolic Entailment Filtering for Underspecified Images and Texts",
        BOOKTITLE = ECCV24,
        YEAR = "2024",
        PAGES = "XL: 247--265",
        BIBSOURCE = "http://www.visionbib.com/bibliography/applicat803imt4.html#TT238292"}

@inproceedings{bb243379,
        AUTHOR = "Sogi, N. and Shibata, T. and Terao, M.",
        TITLE = "Object-aware Query Perturbation for Cross-modal Image-text Retrieval",
        BOOKTITLE = ECCV24,
        YEAR = "2024",
        PAGES = "LXXIX: 447--464",
        BIBSOURCE = "http://www.visionbib.com/bibliography/applicat803imt4.html#TT238293"}

@inproceedings{bb243380,
        AUTHOR = "Alper, M. and Averbuch Elor, H.",
        TITLE = "Emergent Visual-semantic Hierarchies in Image-text Representations",
        BOOKTITLE = ECCV24,
        YEAR = "2024",
        PAGES = "LII: 220--238",
        BIBSOURCE = "http://www.visionbib.com/bibliography/applicat803imt4.html#TT238294"}

@inproceedings{bb243381,
        AUTHOR = "Gordon, B. and Bitton, Y. and Shafir, Y. and Garg, R. and Chen, X. and Lischinski, D. and Cohen Or, D. and Szpektor, I.",
        TITLE = "Mismatch Quest: Visual and Textual Feedback for Image-Text Misalignment",
        BOOKTITLE = ECCV24,
        YEAR = "2024",
        PAGES = "LVII: 310--328",
        BIBSOURCE = "http://www.visionbib.com/bibliography/applicat803imt4.html#TT238295"}

@inproceedings{bb243382,
        AUTHOR = "Hua, H. and Shi, J. and Kafle, K. and Jenni, S. and Zhang, D. and Collomosse, J. and Cohen, S. and Luo, J. B.",
        TITLE = "Finematch: Aspect-based Fine-grained Image and Text Mismatch Detection and Correction",
        BOOKTITLE = ECCV24,
        YEAR = "2024",
        PAGES = "IX: 474--491",
        BIBSOURCE = "http://www.visionbib.com/bibliography/applicat803imt4.html#TT238296"}

@inproceedings{bb243383,
        AUTHOR = "Li, Y. H. and Liu, H. T. and Cai, M. and Li, Y. J. and Shechtman, E. and Lin, Z. and Lee, Y. J. and Singh, K. K.",
        TITLE = "Removing Distributional Discrepancies in Captions Improves Image-Text Alignment",
        BOOKTITLE = ECCV24,
        YEAR = "2024",
        PAGES = "XXI: 405--422",
        BIBSOURCE = "http://www.visionbib.com/bibliography/applicat803imt4.html#TT238297"}

@inproceedings{bb243384,
        AUTHOR = "Ma, W. and Li, K. and Jiang, Z. and Meshry, M. and Liu, Q. H. and Wang, H. Y. and Hane, C. and Yuille, A. L.",
        TITLE = "Rethinking Video-text Understanding: Retrieval from Counterfactually Augmented Data",
        BOOKTITLE = ECCV24,
        YEAR = "2024",
        PAGES = "XIII: 254--269",
        BIBSOURCE = "http://www.visionbib.com/bibliography/applicat803imt4.html#TT238298"}

@inproceedings{bb243385,
        AUTHOR = "Zhang, W. and Xu, X. W. and Tao, Y. and Wang, X. D. and Wang, C. L. and Wei, Z. M.",
        TITLE = "Bi-Directional Image-Text Retrieval With Position Attention and Similarity Filtering",
        BOOKTITLE = ICIVC22,
        YEAR = "2022",
        PAGES = "635--640",
        BIBSOURCE = "http://www.visionbib.com/bibliography/applicat803imt4.html#TT238299"}

@inproceedings{bb243386,
        AUTHOR = "Li, Z. and Nian, X. H. and Pan, C. and Yang, D. and Xiong, H. Y. and Wang, H. B.",
        TITLE = "Relation Graph Reasoning for Image-Text Matching",
        BOOKTITLE = ICIVC22,
        YEAR = "2022",
        PAGES = "319--324",
        BIBSOURCE = "http://www.visionbib.com/bibliography/applicat803imt4.html#TT238300"}

@inproceedings{bb243387,
        AUTHOR = "Zhang, K. and Mao, Z. D. and Wang, Q. and Zhang, Y. D.",
        TITLE = "Negative-Aware Attention Framework for Image-Text Matching",
        BOOKTITLE = CVPR22,
        YEAR = "2022",
        PAGES = "15640--15649",
        BIBSOURCE = "http://www.visionbib.com/bibliography/applicat803imt4.html#TT238301"}

@inproceedings{bb243388,
        AUTHOR = "Long, S. and Han, S. C. and Wan, X. J. and Poon, J.",
        TITLE = "{GraDual}: Graph-based Dual-modal Representation for Image-Text Matching",
        BOOKTITLE = WACV22,
        YEAR = "2022",
        PAGES = "2463--2472",
        BIBSOURCE = "http://www.visionbib.com/bibliography/applicat803imt4.html#TT238302"}

@inproceedings{bb243389,
        AUTHOR = "Biten, A. F. and Mafla, A. and Gomez, L. and Karatzas, D.",
        TITLE = "Is An Image Worth Five Sentences? {A} New Look into Semantics for Image-Text Matching",
        BOOKTITLE = WACV22,
        YEAR = "2022",
        PAGES = "2483--2492",
        BIBSOURCE = "http://www.visionbib.com/bibliography/applicat803imt4.html#TT238303"}

@inproceedings{bb243390,
        AUTHOR = "Mithun, N. C. and Pasricha, R. and Papalexakis, E. and Roy Chowdhury, A. K.",
        TITLE = "Webly Supervised Image-Text Embedding with Noisy Tag Refinement",
        BOOKTITLE = ICPR21,
        YEAR = "2021",
        PAGES = "7454--7461",
        BIBSOURCE = "http://www.visionbib.com/bibliography/applicat803imt4.html#TT238304"}

@inproceedings{bb243391,
        AUTHOR = "Chen, J. A. and Zhang, L. and Wang, Q. and Bai, C. and Kpalma, K.",
        TITLE = "Intra-Modal Constraint Loss for Image-Text Retrieval",
        BOOKTITLE = ICIP22,
        YEAR = "2022",
        PAGES = "4023--4027",
        BIBSOURCE = "http://www.visionbib.com/bibliography/applicat803imt4.html#TT238305"}

@inproceedings{bb243392,
        AUTHOR = "Liu, Y. and Wang, H. Q. and Meng, F. Y. and Liu, M. Y. and Liu, H.",
        TITLE = "Attend, Correct and Focus: A Bidirectional Correct Attention Network for Image-Text Matching",
        BOOKTITLE = ICIP21,
        YEAR = "2021",
        PAGES = "2673--2677",
        BIBSOURCE = "http://www.visionbib.com/bibliography/applicat803imt4.html#TT238306"}

@inproceedings{bb243393,
        AUTHOR = "Yang, S. T. and Huang, K. H. and Howe, B.",
        TITLE = "{JECL}: Joint Embedding and Cluster Learning for Image-Text Pairs",
        BOOKTITLE = ICPR21,
        YEAR = "2021",
        PAGES = "8344--8351",
        BIBSOURCE = "http://www.visionbib.com/bibliography/applicat803imt4.html#TT238307"}

@inproceedings{bb243394,
        AUTHOR = "Mikriukov, G. and Ravanbakhsh, M. and Demir, B.",
        TITLE = "An Unsupervised Cross-Modal Hashing Method Robust to Noisy Training Image-Text Correspondences in Remote Sensing",
        BOOKTITLE = ICIP22,
        YEAR = "2022",
        PAGES = "2556--2560",
        BIBSOURCE = "http://www.visionbib.com/bibliography/applicat803imt4.html#TT238308"}

@inproceedings{bb243395,
        AUTHOR = "Anwaar, M. U. and Labintcev, E. and Kleinsteuber, M.",
        TITLE = "Compositional Learning of Image-Text Query for Image Retrieval",
        BOOKTITLE = WACV21,
        YEAR = "2021",
        PAGES = "1139--1148",
        BIBSOURCE = "http://www.visionbib.com/bibliography/applicat803imt4.html#TT238309"}

@inproceedings{bb243396,
        AUTHOR = "Messina, N. and Falchi, F. and Esuli, A. and Amato, G.",
        TITLE = "Transformer Reasoning Network for Image-Text Matching and Retrieval",
        BOOKTITLE = ICPR21,
        YEAR = "2021",
        PAGES = "5222--5229",
        BIBSOURCE = "http://www.visionbib.com/bibliography/applicat803imt4.html#TT238310"}

@inproceedings{bb243397,
        AUTHOR = "Zhang, Q. and Lei, Z. and Zhang, Z. X. and Li, S. Z.",
        TITLE = "Context-Aware Attention Network for Image-Text Retrieval",
        BOOKTITLE = CVPR20,
        YEAR = "2020",
        PAGES = "3533--3542",
        BIBSOURCE = "http://www.visionbib.com/bibliography/applicat803imt4.html#TT238311"}

@inproceedings{bb243398,
        AUTHOR = "Chen, Y. C. and Li, L. J. and Yu, L. C. and El Kholy, A. and Ahmed, F. and Gan, Z. and Cheng, Y. and Liu, J. J.",
        TITLE = "Uniter: Universal Image-Text Representation Learning",
        BOOKTITLE = ECCV20,
        YEAR = "2020",
        PAGES = "XXX: 104--120",
        BIBSOURCE = "http://www.visionbib.com/bibliography/applicat803imt4.html#TT238312"}

@inproceedings{bb243399,
        AUTHOR = "Wang, H. R. and Zhang, Y. and Ji, Z. and Pang, Y. W. and Ma, L.",
        TITLE = "Consensus-aware Visual-semantic Embedding for Image-Text Matching",
        BOOKTITLE = ECCV20,
        YEAR = "2020",
        PAGES = "XXIV: 18--34",
        BIBSOURCE = "http://www.visionbib.com/bibliography/applicat803imt4.html#TT238313"}

Last update:Jun 4, 2026 at 16:38:45