@article{bb243300,
  author    = {Niu, K. and Huang, Y. and Wang, L.},
  title     = {Re-ranking image-text matching by adaptive metric fusion},
  journal   = PR,
  volume    = {104},
  year      = {2020},
  pages     = {107351},
  bibsource = {http://www.visionbib.com/bibliography/applicat803imt4.html#TT238214},
}
@article{bb243301,
  author    = {Huang, Y. and Wang, Y.M. and Zeng, Y. and Huang, J.S. and Chai, Z.H. and Wang, L.},
  title     = {Unpaired Image-Text Matching via Multimodal Aligned Conceptual
Knowledge},
  journal   = PAMI,
  volume    = {47},
  year      = {2025},
  number    = {7},
  month     = {July},
  pages     = {5160-5176},
  bibsource = {http://www.visionbib.com/bibliography/applicat803imt4.html#TT238215},
}
@article{bb243302,
  author    = {Wen, K.Y. and Gu, X.D. and Cheng, Q.R.},
  title     = {Learning Dual Semantic Relations With Graph Attention for Image-Text
Matching},
  journal   = CirSysVideo,
  volume    = {31},
  year      = {2021},
  number    = {7},
  month     = {July},
  pages     = {2866-2879},
  bibsource = {http://www.visionbib.com/bibliography/applicat803imt4.html#TT238216},
}
@article{bb243303,
  author    = {Yang, S. and Li, Q. and Li, W.H. and Li, X.Y. and Liu, A.A.},
  title     = {Dual-Level Representation Enhancement on Characteristic and Context
for Image-Text Retrieval},
  journal   = CirSysVideo,
  volume    = {32},
  year      = {2022},
  number    = {11},
  month     = {November},
  pages     = {8037-8050},
  bibsource = {http://www.visionbib.com/bibliography/applicat803imt4.html#TT238217},
}
@article{bb243304,
  author    = {Jing, Y. and Wang, W. and Wang, L. and Tan, T.N.},
  title     = {Learning Aligned Image-Text Representations Using Graph Attentive
Relational Network},
  journal   = IP,
  volume    = {30},
  year      = {2021},
  pages     = {1840-1852},
  bibsource = {http://www.visionbib.com/bibliography/applicat803imt4.html#TT238218},
}
@inproceedings{bb243305,
  author    = {Zhao, F. and Huang, Y.Z. and Wang, L. and Tan, T.N.},
  title     = {Deep Semantic Ranking Based Hashing for Multi-Label Image Retrieval},
  booktitle = CVPR15,
  year      = {2015},
  pages     = {1556-1564},
  bibsource = {http://www.visionbib.com/bibliography/applicat803imt4.html#TT238219},
}
@article{bb243306,
  author    = {Lan, H. and Zhang, P.},
  title     = {Learning and Integrating Multi-Level Matching Features for Image-Text
Retrieval},
  journal   = SPLetters,
  volume    = {29},
  year      = {2022},
  pages     = {374-378},
  bibsource = {http://www.visionbib.com/bibliography/applicat803imt4.html#TT238220},
}
@article{bb243307,
  author    = {Wu, J. and Wu, C.L. and Lu, J. and Wang, L.Q. and Cui, X.R.},
  title     = {Region Reinforcement Network With Topic Constraint for Image-Text
Matching},
  journal   = CirSysVideo,
  volume    = {32},
  year      = {2022},
  number    = {1},
  month     = {January},
  pages     = {388-397},
  bibsource = {http://www.visionbib.com/bibliography/applicat803imt4.html#TT238221},
}
@article{bb243308,
  author    = {Malali, N. and Keller, Y.},
  title     = {Learning to Embed Semantic Similarity for Joint Image-Text Retrieval},
  journal   = PAMI,
  volume    = {44},
  year      = {2022},
  number    = {12},
  month     = {December},
  pages     = {10252-10260},
  bibsource = {http://www.visionbib.com/bibliography/applicat803imt4.html#TT238222},
}
@article{bb243309,
  author    = {Tian, M.X. and Wu, X.X. and Jia, Y.D.},
  title     = {Adaptive Latent Graph Representation Learning for Image-Text Matching},
  journal   = IP,
  volume    = {32},
  year      = {2023},
  pages     = {471-482},
  bibsource = {http://www.visionbib.com/bibliography/applicat803imt4.html#TT238223},
}
@article{bb243310,
  author    = {Li, K.P. and Zhang, Y.L. and Li, K. and Li, Y.Y. and Fu, Y.},
  title     = {Image-Text Embedding Learning via Visual and Textual Semantic
Reasoning},
  journal   = PAMI,
  volume    = {45},
  year      = {2023},
  number    = {1},
  month     = {January},
  pages     = {641-656},
  bibsource = {http://www.visionbib.com/bibliography/applicat803imt4.html#TT238224},
}
@inproceedings{bb243311,
  author    = {Li, K.P. and Zhang, Y.L. and Li, K. and Li, Y.Y. and Fu, Y.},
  title     = {Visual Semantic Reasoning for Image-Text Matching},
  booktitle = ICCV19,
  year      = {2019},
  pages     = {4653-4661},
  bibsource = {http://www.visionbib.com/bibliography/applicat803imt4.html#TT238225},
}
@article{bb243312,
  author    = {Diao, H.W. and Zhang, Y. and Liu, W. and Ruan, X. and Lu, H.C.},
  title     = {Plug-and-Play Regulators for Image-Text Matching},
  journal   = IP,
  volume    = {32},
  year      = {2023},
  pages     = {2322-2334},
  bibsource = {http://www.visionbib.com/bibliography/applicat803imt4.html#TT238226},
}
@article{bb243313,
  author    = {Tian, Y.M. and Ding, A. and Wang, D. and Luo, X.M. and Wan, B. and Wang, Y.F.},
  title     = {Bi-Attention enhanced representation learning for image-text matching},
  journal   = PR,
  volume    = {140},
  year      = {2023},
  pages     = {109548},
  bibsource = {http://www.visionbib.com/bibliography/applicat803imt4.html#TT238227},
}
@article{bb243314,
  author    = {Zhang, K. and Mao, Z.D. and Liu, A.A. and Zhang, Y.D.},
  title     = {Unified Adaptive Relevance Distinguishable Attention Network for
Image-Text Matching},
  journal   = MultMed,
  volume    = {25},
  year      = {2023},
  pages     = {1320-1332},
  bibsource = {http://www.visionbib.com/bibliography/applicat803imt4.html#TT238228},
}
@article{bb243315,
  author    = {Xiong, G.X. and Meng, M. and Zhang, T.Z. and Zhang, D.M. and Zhang, Y.D.},
  title     = {Reference-Aware Adaptive Network for Image-Text Matching},
  journal   = CirSysVideo,
  volume    = {34},
  year      = {2024},
  number    = {10},
  month     = {October},
  pages     = {9678-9691},
  bibsource = {http://www.visionbib.com/bibliography/applicat803imt4.html#TT238229},
}
@article{bb243316,
  author    = {Liu, Z.J. and Chen, F.L. and Xu, J. and Pei, W.J. and Lu, G.M.},
  title     = {Image-Text Retrieval With Cross-Modal Semantic Importance Consistency},
  journal   = CirSysVideo,
  volume    = {33},
  year      = {2023},
  number    = {5},
  month     = {May},
  pages     = {2465-2476},
  bibsource = {http://www.visionbib.com/bibliography/applicat803imt4.html#TT238230},
}
@article{bb243317,
  author    = {Shang, H. and Zhao, G.S. and Shi, J. and Qian, X.M.},
  title     = {A Multiview Text Imagination Network Based on Latent Alignment for
Image-Text Matching},
  journal   = IEEE_Int_Sys,
  volume    = {38},
  year      = {2023},
  number    = {3},
  month     = {May},
  pages     = {41-50},
  bibsource = {http://www.visionbib.com/bibliography/applicat803imt4.html#TT238231},
}
@article{bb243318,
  author    = {Liu, C. and Zhang, Y.Q. and Wang, H.S. and Chen, W.H. and Wang, F. and Huang, Y. and Shen, Y.D. and Wang, L.},
  title     = {Efficient Token-Guided Image-Text Retrieval With Consistent
Multimodal Contrastive Training},
  journal   = IP,
  volume    = {32},
  year      = {2023},
  pages     = {3622-3633},
  bibsource = {http://www.visionbib.com/bibliography/applicat803imt4.html#TT238232},
}
@article{bb243319,
  author    = {Li, W.R. and Ma, Z.Y. and Deng, L.J. and Fan, X.P. and Tian, Y.H.},
  title     = {Neuron-Based Spiking Transmission and Reasoning Network for Robust
Image-Text Retrieval},
  journal   = CirSysVideo,
  volume    = {33},
  year      = {2023},
  number    = {7},
  month     = {July},
  pages     = {3516-3528},
  bibsource = {http://www.visionbib.com/bibliography/applicat803imt4.html#TT238233},
}
@article{bb243320,
  author    = {Li, W.R. and Ma, Z.Y. and Shi, J.Q. and Fan, X.P.},
  title     = {The Style Transformer With Common Knowledge Optimization for
Image-Text Retrieval},
  journal   = SPLetters,
  volume    = {30},
  year      = {2023},
  pages     = {1197-1201},
  bibsource = {http://www.visionbib.com/bibliography/applicat803imt4.html#TT238234},
}
@article{bb243321,
AUTHOR = "Zhu, H.G. and Zhang, C.J. and Wei, Y.C. and Huang, S. and Zhao, Y.",
TITLE = "{ESA}: External Space Attention Aggregation for Image-Text Retrieval",
JOURNAL = CirSysVideo,
VOLUME = "33",
YEAR = "2023",
NUMBER = "10",
MONTH = "October",
PAGES = "6131-6143",
BIBSOURCE = "http://www.visionbib.com/bibliography/applicat803imt4.html#TT238235"}
@article{bb243322,
  author    = {Li, Z. and Guo, C. and Feng, Z. and Hwang, J.N. and Du, Z.T.},
  title     = {Integrating Language Guidance Into Image-Text Matching for Correcting
False Negatives},
  journal   = MultMed,
  volume    = {26},
  year      = {2024},
  pages     = {103-116},
  bibsource = {http://www.visionbib.com/bibliography/applicat803imt4.html#TT238236},
}
@article{bb243323,
AUTHOR = "Zhang, Y. and Ji, Z. and Wang, D. and Pang, Y.W. and Li, X.L.",
TITLE = "{USER}: Unified Semantic Enhancement With Momentum Contrast for
Image-Text Retrieval",
JOURNAL = IP,
VOLUME = "33",
YEAR = "2024",
PAGES = "595-609",
BIBSOURCE = "http://www.visionbib.com/bibliography/applicat803imt4.html#TT238237"}
@article{bb243324,
  author    = {Zhuang, J. and Yu, J. and Ding, Y. and Qu, X.Y. and Hu, Y.},
  title     = {Towards Fast and Accurate Image-Text Retrieval With Self-Supervised
Fine-Grained Alignment},
  journal   = MultMed,
  volume    = {26},
  year      = {2024},
  pages     = {1361-1372},
  bibsource = {http://www.visionbib.com/bibliography/applicat803imt4.html#TT238238},
}
@article{bb243325,
  author    = {Liu, X. and He, Y. and Cheung, Y.M. and Xu, X. and Wang, N.N.},
  title     = {Learning Relationship-Enhanced Semantic Graph for Fine-Grained
Image-Text Matching},
  journal   = Cyber,
  volume    = {54},
  year      = {2024},
  number    = {2},
  month     = {February},
  pages     = {948-961},
  bibsource = {http://www.visionbib.com/bibliography/applicat803imt4.html#TT238239},
}
@article{bb243326,
  author    = {Li, W.H. and Yang, S. and Li, Q. and Li, X.Y. and Liu, A.A.},
  title     = {Commonsense-Guided Semantic and Relational Consistencies for
Image-Text Retrieval},
  journal   = MultMed,
  volume    = {26},
  year      = {2024},
  pages     = {1867-1880},
  bibsource = {http://www.visionbib.com/bibliography/applicat803imt4.html#TT238240},
}
@article{bb243327,
  author    = {Wu, D.Q. and Li, H.H. and Gu, C. and Liu, H. and Xu, C. and Hou, Y.X. and Guo, L.},
  title     = {Feature First: Advancing Image-Text Retrieval Through Improved Visual
Features},
  journal   = MultMed,
  volume    = {26},
  year      = {2024},
  pages     = {3827-3841},
  bibsource = {http://www.visionbib.com/bibliography/applicat803imt4.html#TT238241},
}
@article{bb243328,
  author    = {Yang, R. and Wang, S. and Gu, Y. and Wang, J.H. and Sun, Y.Z. and Zhang, H. and Liao, Y. and Jiao, L.C.},
  title     = {Continual Learning for Cross-Modal Image-Text Retrieval Based on
Domain-Selective Attention},
  journal   = PR,
  volume    = {149},
  year      = {2024},
  pages     = {110273},
  bibsource = {http://www.visionbib.com/bibliography/applicat803imt4.html#TT238242},
}
@article{bb243329,
AUTHOR = "Pan, R.J. and Yang, H. and Li, C. and Yang, J.H.",
TITLE = "Joint Intra \& Inter-Grained Reasoning: A New Look Into Semantic
Consistency of Image-Text Retrieval",
JOURNAL = MultMed,
VOLUME = "26",
YEAR = "2024",
PAGES = "4912-4925",
BIBSOURCE = "http://www.visionbib.com/bibliography/applicat803imt4.html#TT238243"}
@article{bb243330,
  author    = {Zhang, K. and Hu, B. and Zhang, H. and Li, Z. and Mao, Z.D.},
  title     = {Enhanced Semantic Similarity Learning Framework for Image-Text
Matching},
  journal   = CirSysVideo,
  volume    = {34},
  year      = {2024},
  number    = {4},
  month     = {April},
  pages     = {2973-2988},
  bibsource = {http://www.visionbib.com/bibliography/applicat803imt4.html#TT238244},
}
@inproceedings{bb243331,
  author    = {Fu, Z.R. and Mao, Z.D. and Song, Y. and Zhang, Y.D.},
  title     = {Learning Semantic Relationship among Instances for Image-Text
Matching},
  booktitle = CVPR23,
  year      = {2023},
  pages     = {15159-15168},
  bibsource = {http://www.visionbib.com/bibliography/applicat803imt4.html#TT238245},
}
@article{bb243332,
  author    = {Diao, H. and Zhang, Y. and Gao, S. and Ruan, X. and Lu, H.C.},
  title     = {Deep Boosting Learning:
A Brand-New Cooperative Approach for Image-Text Matching},
  journal   = IP,
  volume    = {33},
  year      = {2024},
  pages     = {3341-3352},
  bibsource = {http://www.visionbib.com/bibliography/applicat803imt4.html#TT238246},
}
@inproceedings{bb243333,
  author    = {Zhang, Y. and Lu, H.C.},
  title     = {Deep Cross-Modal Projection Learning for Image-Text Matching},
  booktitle = ECCV18,
  year      = {2018},
  pages     = {I: 707-723},
  bibsource = {http://www.visionbib.com/bibliography/applicat803imt4.html#TT238247},
}
@article{bb243334,
  author    = {Cao, M. and Bai, Y. and Cao, Z.Q. and Nie, L.Q. and Zhang, M.},
  title     = {Efficient Image-Text Retrieval via Keyword-Guided Pre-Screening},
  journal   = CirSysVideo,
  volume    = {34},
  year      = {2024},
  number    = {6},
  month     = {June},
  pages     = {5132-5145},
  bibsource = {http://www.visionbib.com/bibliography/applicat803imt4.html#TT238248},
}
@article{bb243335,
  author    = {Li, Z. and Zhang, L. and Zhang, K. and Zhang, Y.D. and Mao, Z.D.},
  title     = {Improving Image-Text Matching With Bidirectional Consistency of
Cross-Modal Alignment},
  journal   = CirSysVideo,
  volume    = {34},
  year      = {2024},
  number    = {7},
  month     = {July},
  pages     = {6590-6607},
  bibsource = {http://www.visionbib.com/bibliography/applicat803imt4.html#TT238249},
}
@article{bb243336,
  author    = {Li, Z. and Zhang, L. and Zhang, K. and Zhang, Y.D. and Mao, Z.D.},
  title     = {Fast, Accurate, and Lightweight Memory-Enhanced Embedding Learning
Framework for Image-Text Retrieval},
  journal   = CirSysVideo,
  volume    = {34},
  year      = {2024},
  number    = {7},
  month     = {July},
  pages     = {6542-6558},
  bibsource = {http://www.visionbib.com/bibliography/applicat803imt4.html#TT238250},
}
@article{bb243337,
  author    = {Cui, Z. and Hu, Y.L. and Sun, Y.F. and Yin, B.C.},
  title     = {Context-aware relation enhancement and similarity reasoning for
image-text retrieval},
  journal   = IET-CV,
  volume    = {18},
  year      = {2024},
  number    = {5},
  pages     = {652-665},
  bibsource = {http://www.visionbib.com/bibliography/applicat803imt4.html#TT238251},
}
@article{bb243338,
AUTHOR = "Pan, Z.X. and Mao, Y.C. and Xiong, L. and Pang, T.F. and Ping, P.",
TITLE = "{MFAE}: Multimodal Fusion and Alignment for Entity-level Disinformation
Detection",
JOURNAL = PRL,
VOLUME = "184",
YEAR = "2024",
PAGES = "59-65",
BIBSOURCE = "http://www.visionbib.com/bibliography/applicat803imt4.html#TT238252"}
@article{bb243339,
AUTHOR = "Pu, X. and Wang, Z.W. and Yuan, L. and Wu, Y. and Jing, L.P. and Gao, X.B.",
TITLE = "{GADNet}: Improving image-text matching via graph-based aggregation and
disentanglement",
JOURNAL = PR,
VOLUME = "157",
YEAR = "2025",
PAGES = "110900",
BIBSOURCE = "http://www.visionbib.com/bibliography/applicat803imt4.html#TT238253"}
@article{bb243340,
  author    = {Pu, X. and Yang, P. and Yuan, L. and Gao, X.B.},
  title     = {Improving Image-Text Matching by Integrating Word Sense
Disambiguation},
  journal   = SPLetters,
  volume    = {31},
  year      = {2024},
  pages     = {2695-2699},
  bibsource = {http://www.visionbib.com/bibliography/applicat803imt4.html#TT238254},
}
@article{bb243341,
  author    = {Li, W.R. and Xiong, R.Q. and Fan, X.P.},
  title     = {Multi-Layer Probabilistic Association Reasoning Network for
Image-Text Retrieval},
  journal   = CirSysVideo,
  volume    = {34},
  year      = {2024},
  number    = {10},
  month     = {October},
  pages     = {9706-9717},
  bibsource = {http://www.visionbib.com/bibliography/applicat803imt4.html#TT238255},
}
@article{bb243342,
  author    = {Tian, M.X. and Yang, S. and Wu, X.X. and Jia, Y.D.},
  title     = {Source-Free Image-Text Matching via Uncertainty-Aware Learning},
  journal   = SPLetters,
  volume    = {31},
  year      = {2024},
  pages     = {3059-3063},
  bibsource = {http://www.visionbib.com/bibliography/applicat803imt4.html#TT238256},
}
@article{bb243343,
  author    = {Wang, D. and Tian, J. and Liang, X. and Tian, Y.M. and He, L.H.},
  title     = {Global-aware Fragment Representation Aggregation Network for
image-text retrieval},
  journal   = PR,
  volume    = {159},
  year      = {2025},
  pages     = {111085},
  bibsource = {http://www.visionbib.com/bibliography/applicat803imt4.html#TT238257},
}
@article{bb243344,
  author    = {Ke, X. and Chen, B.T. and Yang, X. and Cai, Y.H. and Liu, H. and Guo, W.Z.},
  title     = {Cross-modal independent matching network for image-text retrieval},
  journal   = PR,
  volume    = {159},
  year      = {2025},
  pages     = {111096},
  bibsource = {http://www.visionbib.com/bibliography/applicat803imt4.html#TT238258},
}
@article{bb243345,
  author    = {Li, Z. and Guo, C. and Wang, X. and Feng, Z. and Du, Z.T.},
  title     = {Selectively Hard Negative Mining for Alleviating Gradient Vanishing
in Image-Text Matching},
  journal   = CirSysVideo,
  volume    = {35},
  year      = {2025},
  number    = {2},
  month     = {February},
  pages     = {1921-1935},
  bibsource = {http://www.visionbib.com/bibliography/applicat803imt4.html#TT238259},
}
@article{bb243346,
  author    = {Yang, X.Y. and Li, C. and Wang, Z.M. and Xie, H. and Mao, J. and Yin, G.Q.},
  title     = {Remote Sensing Cross-Modal Text-Image Retrieval Based on Attention
Correction and Filtering},
  journal   = RS,
  volume    = {17},
  year      = {2025},
  number    = {3},
  pages     = {503},
  bibsource = {http://www.visionbib.com/bibliography/applicat803imt4.html#TT238260},
}
@article{bb243347,
  author    = {Wu, D.Q. and Li, H.H. and Gu, C. and Guo, L. and Liu, H.},
  title     = {Dual Stream Relation Learning Network for Image-Text Retrieval},
  journal   = MultMed,
  volume    = {27},
  year      = {2025},
  pages     = {1551-1565},
  bibsource = {http://www.visionbib.com/bibliography/applicat803imt4.html#TT238261},
}
@article{bb243348,
AUTHOR = "Liu, Z. and Xu, J.H. and Gao, S.S. and Chen, Z.",
TITLE = "{CSA}: Cross-scale alignment with adaptive semantic aggregation and
filter for image-text retrieval",
JOURNAL = PR,
VOLUME = "165",
YEAR = "2025",
PAGES = "111647",
BIBSOURCE = "http://www.visionbib.com/bibliography/applicat803imt4.html#TT238262"}
@article{bb243349,
AUTHOR = "Zhang, Q. and Wang, D. and Yu, X.",
TITLE = "{RLita}: A Region-Level Image-Text Alignment Method for Remote Sensing
Foundation Model",
JOURNAL = RS,
VOLUME = "17",
YEAR = "2025",
NUMBER = "10",
PAGES = "1661",
BIBSOURCE = "http://www.visionbib.com/bibliography/applicat803imt4.html#TT238263"}
@article{bb243350,
  author    = {Wen, Z.T. and Liu, J.H. and Zhang, H. and Zuo, F.Y.},
  title     = {Exploring Fine-Grained Visual-Text Feature Alignment With Prompt
Tuning for Domain-Adaptive Object Detection},
  journal   = Cyber,
  volume    = {55},
  year      = {2025},
  number    = {7},
  month     = {July},
  pages     = {3220-3233},
  bibsource = {http://www.visionbib.com/bibliography/applicat803imt4.html#TT238264},
}
@article{bb243351,
AUTHOR = "Guan, J.H. and Shu, Y. and Li, W. and Song, Z. and Zhang, Y.C.",
TITLE = "{PR-CLIP}: Cross-Modal Positional Reconstruction for Remote Sensing
Image-Text Retrieval",
JOURNAL = RS,
VOLUME = "17",
YEAR = "2025",
NUMBER = "13",
PAGES = "2117",
BIBSOURCE = "http://www.visionbib.com/bibliography/applicat803imt4.html#TT238265"}
@article{bb243352,
  author    = {Song, Z. and Shu, Y. and Li, W. and Guan, J.H. and Zhang, Y.C.},
  title     = {Towards Discriminative and Consistent Cross-Modal Alignment for
Remote Sensing Image-Text Retrieval},
  journal   = RS,
  volume    = {18},
  year      = {2026},
  number    = {4},
  pages     = {662},
  bibsource = {http://www.visionbib.com/bibliography/applicat803imt4.html#TT238266},
}
@article{bb243353,
  author    = {Zhao, H. and Li, Z.Y. and Wang, S. and Zhang, Z.X. and Li, K.Q.},
  title     = {Robust Hashing With Bilinear Drift for Image-Text Retrieval},
  journal   = CirSysVideo,
  volume    = {35},
  year      = {2025},
  number    = {8},
  month     = {August},
  pages     = {7642-7654},
  bibsource = {http://www.visionbib.com/bibliography/applicat803imt4.html#TT238267},
}
@article{bb243354,
  author    = {Wang, P.Z. and Zhang, L. and Mao, Z.D. and Lyu, N. and Zhang, Y.D.},
  title     = {Matryoshka Learning With Metric Transfer for Image-Text Matching},
  journal   = CirSysVideo,
  volume    = {35},
  year      = {2025},
  number    = {9},
  month     = {September},
  pages     = {9502-9516},
  bibsource = {http://www.visionbib.com/bibliography/applicat803imt4.html#TT238268},
}
@article{bb243355,
  author    = {Koo, H. and Shin, J. and Kim, E.},
  title     = {Dual-branch scale disentanglement for text-video retrieval},
  journal   = PRL,
  volume    = {196},
  year      = {2025},
  pages     = {296-302},
  bibsource = {http://www.visionbib.com/bibliography/applicat803imt4.html#TT238269},
}
@article{bb243356,
  author    = {Zhou, J. and Wang, M.},
  title     = {Unified learning for image-text alignment via multi-scale feature
fusion},
  journal   = CVIU,
  volume    = {260},
  year      = {2025},
  pages     = {104468},
  bibsource = {http://www.visionbib.com/bibliography/applicat803imt4.html#TT238270},
}
@article{bb243357,
AUTHOR = "Wen, J. and Chen, Y.F. and Shi, R.Q. and Ji, W. and Yang, M.L. and Gao, D.F. and Yuan, J.S. and Zimmermann, R.",
TITLE = "{HOVER}: Hyperbolic Video-Text Retrieval",
JOURNAL = IP,
VOLUME = "34",
YEAR = "2025",
PAGES = "6192-6203",
BIBSOURCE = "http://www.visionbib.com/bibliography/applicat803imt4.html#TT238271"}
@article{bb243358,
AUTHOR = "Fang, J.Y. and Zhu, B. and Yuan, J.L. and Chen, Y.Y. and Tang, M. and Wang, J.Q.",
TITLE = "{AMITA}: Attribute-Guided Masked Image-Text Alignment for Multi-Label
Image Representation",
JOURNAL = CirSysVideo,
VOLUME = "35",
YEAR = "2025",
NUMBER = "11",
MONTH = "November",
PAGES = "11432-11447",
BIBSOURCE = "http://www.visionbib.com/bibliography/applicat803imt4.html#TT238272"}
@article{bb243359,
  author    = {Ji, L.L. and Liu, L.},
  title     = {Multi-Scale Feature Fusion Based on Piecewise Polynomial Activation
Function for Image-Text Matching},
  journal   = CirSysVideo,
  volume    = {35},
  year      = {2025},
  number    = {11},
  month     = {November},
  pages     = {11627-11640},
  bibsource = {http://www.visionbib.com/bibliography/applicat803imt4.html#TT238273},
}
@article{bb243360,
  author    = {Chen, R. and Su, T. and Wang, H. and Ni, Z.K.},
  title     = {Similarity Shuffled Criss-Cross Transformer With Angle Loss for
Image-Text Matching},
  journal   = MultMed,
  volume    = {27},
  year      = {2025},
  pages     = {9723-9734},
  bibsource = {http://www.visionbib.com/bibliography/applicat803imt4.html#TT238274},
}
@article{bb243361,
  author    = {Chen, D. and Wang, Y.T. and Xie, Y.Z. and Chen, S.Y. and Peng, W.L. and Tang, M. and Fang, M. and Chen, C.L.P. and Li, P. and Zhang, W.},
  title     = {Intra-modal consistency for image-text retrieval through soft-label
distillation},
  journal   = PR,
  volume    = {173},
  year      = {2026},
  pages     = {112817},
  bibsource = {http://www.visionbib.com/bibliography/applicat803imt4.html#TT238275},
}
@article{bb243362,
  author    = {Shi, Z.X. and Ding, Y. and Dong, J.Y. and Zhang, T.Z.},
  title     = {Beyond One and Two Tower: Cross-Modal Consensus Learning for
Image-Text Retrieval},
  journal   = CirSysVideo,
  volume    = {36},
  year      = {2026},
  number    = {2},
  month     = {February},
  pages     = {2581-2593},
  bibsource = {http://www.visionbib.com/bibliography/applicat803imt4.html#TT238276},
}
@article{bb243363,
AUTHOR = "Wang, H.C. and Liu, L. and Zhang, H.X. and Zhu, L. and Chang, X.J. and Du, H.",
TITLE = "{VisualRAG}: Knowledge-Guided Retrieval Augmentation for Image-Text
Matching",
JOURNAL = CirSysVideo,
VOLUME = "36",
YEAR = "2026",
NUMBER = "1",
MONTH = "January",
PAGES = "1234-1248",
BIBSOURCE = "http://www.visionbib.com/bibliography/applicat803imt4.html#TT238277"}
@article{bb243364,
AUTHOR = "Zhang, D.L. and Wang, Z.W. and Wu, X.J. and Kittler, J.V.",
TITLE = "{HACG}: Leveraging Hierarchical Alignment and Caption Generation for
Text-Video Retrieval",
JOURNAL = IJCV,
VOLUME = "134",
YEAR = "2026",
NUMBER = "1",
MONTH = "January",
PAGES = "93",
BIBSOURCE = "http://www.visionbib.com/bibliography/applicat803imt4.html#TT238278"}
@article{bb243365,
  author    = {Zhang, B. and Wu, H.},
  title     = {Test-Time Candidate-Aware Dual Refinement for Remote Sensing
Image-Text Retrieval},
  journal   = RS,
  volume    = {18},
  year      = {2026},
  number    = {9},
  pages     = {1389},
  bibsource = {http://www.visionbib.com/bibliography/applicat803imt4.html#TT238279},
}
@article{bb243366,
  author    = {Wang, Z. and Xu, X. and Zhu, L. and Song, J.K. and Yang, Y. and Shen, H.T.},
  title     = {Distribution-to-Points Matching for Image Text Retrieval},
  journal   = PAMI,
  volume    = {48},
  year      = {2026},
  number    = {6},
  month     = {June},
  pages     = {7097-7111},
  bibsource = {http://www.visionbib.com/bibliography/applicat803imt4.html#TT238280},
}
@article{bb243367,
AUTHOR = "Huang, J. and Chen, Y.X. and Du, C. and Xiong, S.W. and Lu, X.Q.",
TITLE = "{ReCoTR}: Reducing Semantic Cognitive Shift via Dual-Consensus Token
Compression for Remote Sensing Image-Text Retrieval",
JOURNAL = IP,
VOLUME = "35",
YEAR = "2026",
PAGES = "5017-5031",
BIBSOURCE = "http://www.visionbib.com/bibliography/applicat803imt4.html#TT238281"}
@article{bb243368,
  author    = {Wang, K. and Hu, Y.P. and Liu, H. and Jie, L.R. and Nie, L.Q.},
  title     = {Redundancy Mitigation: Toward Accurate and Efficient Image-Text
Retrieval},
  journal   = CirSysVideo,
  volume    = {36},
  year      = {2026},
  number    = {5},
  month     = {May},
  pages     = {7155-7167},
  bibsource = {http://www.visionbib.com/bibliography/applicat803imt4.html#TT238282},
}
@inproceedings{bb243369,
  author    = {Vongala, M.R. and Srivastava, S. and Kosecka, J.},
  title     = {Compositional Image-Text Matching and Retrieval by Grounding Entities},
  booktitle = {MULA25},
  year      = {2025},
  pages     = {241-250},
  bibsource = {http://www.visionbib.com/bibliography/applicat803imt4.html#TT238283},
}
@inproceedings{bb243370,
  author    = {Zhang, Z.C. and Li, X.Y. and Sun, W. and Zhang, Z.C. and Li, Y.H. and Liu, X.H. and Zhai, G.T.},
  title     = {Leveraging Multimodal Large Language Models for Joint Discrete and
Continuous Evaluation in Text-to-Image Alignment},
  booktitle = NTIRE25,
  year      = {2025},
  pages     = {968-977},
  bibsource = {http://www.visionbib.com/bibliography/applicat803imt4.html#TT238284},
}
@inproceedings{bb243371,
AUTHOR = "Zhang, Z.J. and Zheng, X.H. and Wu, X.C. and Peng, C. and Cao, X.Z.",
TITLE = "{Tokenfocus-VQA}: Enhancing Text-to-Image Alignment with Position-Aware
Focus and Multi-Perspective Aggregations on {LVLMs}",
BOOKTITLE = NTIRE25,
YEAR = "2025",
PAGES = "1270-1279",
BIBSOURCE = "http://www.visionbib.com/bibliography/applicat803imt4.html#TT238285"}
@inproceedings{bb243372,
AUTHOR = "Yue, X. and Sun, J. and Lu, J. and Yao, L.C. and Xia, F. and Wang, T.Y. and Rao, F.Y. and Lyu, J. and Deng, Y.",
TITLE = "Instruction-Augmented Multimodal Alignment for Image-Text and Element
Matching",
BOOKTITLE = NTIRE25,
YEAR = "2025",
PAGES = "1370-1379",
BIBSOURCE = "http://www.visionbib.com/bibliography/applicat803imt4.html#TT238286"}
@inproceedings{bb243373,
  author    = {Lai, H. and Xiong, G.X. and Mai, H.Y. and Liu, X. and Zhang, T.Z.},
  title     = {Rethinking Noisy Video-Text Retrieval via Relation-aware Alignment},
  booktitle = CVPR25,
  year      = {2025},
  pages     = {9231-9241},
  bibsource = {http://www.visionbib.com/bibliography/applicat803imt4.html#TT238287},
}
@inproceedings{bb243374,
AUTHOR = "Kim, D. and Piergiovanni, A. and Mallya, G. and Angelova, A.",
TITLE = "{VideoComp}: Advancing Fine-Grained Compositional and Temporal
Alignment in Video-Text Models",
BOOKTITLE = CVPR25,
YEAR = "2025",
PAGES = "29060-29070",
BIBSOURCE = "http://www.visionbib.com/bibliography/applicat803imt4.html#TT238288"}
@inproceedings{bb243375,
AUTHOR = "Shen, L. and Gong, G.Q. and Hao, T.X. and He, T. and Zhang, Y.F. and Liu, P.Z. and Zhao, S.C. and Han, J.G. and Ding, G.",
TITLE = "{DiscoVLA}: Discrepancy Reduction in Vision, Language, and Alignment
for Parameter-Efficient Video-Text Retrieval",
BOOKTITLE = CVPR25,
YEAR = "2025",
PAGES = "19702-19712",
BIBSOURCE = "http://www.visionbib.com/bibliography/applicat803imt4.html#TT238289"}
@inproceedings{bb243376,
AUTHOR = "Jin, Z.X. and Xu, X.W. and Wang, X.D.",
TITLE = "{MADA}: Multi-Window Attention and Dual-Alignment for Image-Text
Retrieval",
BOOKTITLE = ICIVC24,
YEAR = "2024",
PAGES = "240-245",
BIBSOURCE = "http://www.visionbib.com/bibliography/applicat803imt4.html#TT238290"}
@inproceedings{bb243377,
  author    = {Xie, C.W. and Sun, S.Y. and Zhao, L.M. and Li, P. and Ma, S. and Zheng, Y.},
  title     = {Fuseteacher: Modality-fused Encoders are Strong Vision Supervisors},
  booktitle = ECCV24,
  year      = {2024},
  pages     = {XLVIII: 287-304},
  bibsource = {http://www.visionbib.com/bibliography/applicat803imt4.html#TT238291},
}
@inproceedings{bb243378,
AUTHOR = "Kim, W. and Chun, S. and Kim, T. and Han, D.Y. and Yun, S.",
TITLE = "{HYPE}: Hyperbolic Entailment Filtering for Underspecified Images and
Texts",
BOOKTITLE = ECCV24,
YEAR = "2024",
PAGES = "XL: 247-265",
BIBSOURCE = "http://www.visionbib.com/bibliography/applicat803imt4.html#TT238292"}
@inproceedings{bb243379,
  author    = {Sogi, N. and Shibata, T. and Terao, M.},
  title     = {Object-aware Query Perturbation for Cross-modal Image-text Retrieval},
  booktitle = ECCV24,
  year      = {2024},
  pages     = {LXXIX: 447-464},
  bibsource = {http://www.visionbib.com/bibliography/applicat803imt4.html#TT238293},
}
@inproceedings{bb243380,
  author    = {Alper, M. and Averbuch Elor, H.},
  title     = {Emergent Visual-semantic Hierarchies in Image-text Representations},
  booktitle = ECCV24,
  year      = {2024},
  pages     = {LII: 220-238},
  bibsource = {http://www.visionbib.com/bibliography/applicat803imt4.html#TT238294},
}
@inproceedings{bb243381,
  author    = {Gordon, B. and Bitton, Y. and Shafir, Y. and Garg, R. and Chen, X. and Lischinski, D. and Cohen Or, D. and Szpektor, I.},
  title     = {Mismatch Quest: Visual and Textual Feedback for Image-Text Misalignment},
  booktitle = ECCV24,
  year      = {2024},
  pages     = {LVII: 310-328},
  bibsource = {http://www.visionbib.com/bibliography/applicat803imt4.html#TT238295},
}
@inproceedings{bb243382,
  author    = {Hua, H. and Shi, J. and Kafle, K. and Jenni, S. and Zhang, D. and Collomosse, J. and Cohen, S. and Luo, J.B.},
  title     = {Finematch: Aspect-based Fine-grained Image and Text Mismatch Detection
and Correction},
  booktitle = ECCV24,
  year      = {2024},
  pages     = {IX: 474-491},
  bibsource = {http://www.visionbib.com/bibliography/applicat803imt4.html#TT238296},
}
@inproceedings{bb243383,
  author    = {Li, Y.H. and Liu, H.T. and Cai, M. and Li, Y.J. and Shechtman, E. and Lin, Z. and Lee, Y.J. and Singh, K.K.},
  title     = {Removing Distributional Discrepancies in Captions Improves Image-Text
Alignment},
  booktitle = ECCV24,
  year      = {2024},
  pages     = {XXI: 405-422},
  bibsource = {http://www.visionbib.com/bibliography/applicat803imt4.html#TT238297},
}
@inproceedings{bb243384,
  author    = {Ma, W. and Li, K. and Jiang, Z. and Meshry, M. and Liu, Q.H. and Wang, H.Y. and Hane, C. and Yuille, A.L.},
  title     = {Rethinking Video-text Understanding: Retrieval from Counterfactually
Augmented Data},
  booktitle = ECCV24,
  year      = {2024},
  pages     = {XIII: 254-269},
  bibsource = {http://www.visionbib.com/bibliography/applicat803imt4.html#TT238298},
}
@inproceedings{bb243385,
  author    = {Zhang, W. and Xu, X.W. and Tao, Y. and Wang, X.D. and Wang, C.L. and Wei, Z.M.},
  title     = {Bi-Directional Image-Text Retrieval With Position Attention and
Similarity Filtering},
  booktitle = ICIVC22,
  year      = {2022},
  pages     = {635-640},
  bibsource = {http://www.visionbib.com/bibliography/applicat803imt4.html#TT238299},
}
@inproceedings{bb243386,
  author    = {Li, Z. and Nian, X.H. and Pan, C. and Yang, D. and Xiong, H.Y. and Wang, H.B.},
  title     = {Relation Graph Reasoning for Image-Text Matching},
  booktitle = ICIVC22,
  year      = {2022},
  pages     = {319-324},
  bibsource = {http://www.visionbib.com/bibliography/applicat803imt4.html#TT238300},
}
@inproceedings{bb243387,
  author    = {Zhang, K. and Mao, Z.D. and Wang, Q. and Zhang, Y.D.},
  title     = {Negative-Aware Attention Framework for Image-Text Matching},
  booktitle = CVPR22,
  year      = {2022},
  pages     = {15640-15649},
  bibsource = {http://www.visionbib.com/bibliography/applicat803imt4.html#TT238301},
}
@inproceedings{bb243388,
AUTHOR = "Long, S. and Han, S.C. and Wan, X.J. and Poon, J.",
TITLE = "{GraDual}: Graph-based Dual-modal Representation for Image-Text
Matching",
BOOKTITLE = WACV22,
YEAR = "2022",
PAGES = "2463-2472",
BIBSOURCE = "http://www.visionbib.com/bibliography/applicat803imt4.html#TT238302"}
@inproceedings{bb243389,
  author    = {Biten, A.F. and Mafla, A. and Gomez, L. and Karatzas, D.},
  title     = {Is An Image Worth Five Sentences? A New Look into Semantics for
Image-Text Matching},
  booktitle = WACV22,
  year      = {2022},
  pages     = {2483-2492},
  bibsource = {http://www.visionbib.com/bibliography/applicat803imt4.html#TT238303},
}
@inproceedings{bb243390,
  author    = {Mithun, N.C. and Pasricha, R. and Papalexakis, E. and Roy Chowdhury, A.K.},
  title     = {Webly Supervised Image-Text Embedding with Noisy Tag Refinement},
  booktitle = ICPR21,
  year      = {2021},
  pages     = {7454-7461},
  bibsource = {http://www.visionbib.com/bibliography/applicat803imt4.html#TT238304},
}
@inproceedings{bb243391,
  author    = {Chen, J.A. and Zhang, L. and Wang, Q. and Bai, C. and Kpalma, K.},
  title     = {Intra-Modal Constraint Loss for Image-Text Retrieval},
  booktitle = ICIP22,
  year      = {2022},
  pages     = {4023-4027},
  bibsource = {http://www.visionbib.com/bibliography/applicat803imt4.html#TT238305},
}
@inproceedings{bb243392,
  author    = {Liu, Y. and Wang, H.Q. and Meng, F.Y. and Liu, M.Y. and Liu, H.},
  title     = {Attend, Correct and Focus: A Bidirectional Correct Attention Network
for Image-Text Matching},
  booktitle = ICIP21,
  year      = {2021},
  pages     = {2673-2677},
  bibsource = {http://www.visionbib.com/bibliography/applicat803imt4.html#TT238306},
}
@inproceedings{bb243393,
AUTHOR = "Yang, S.T. and Huang, K.H. and Howe, B.",
TITLE = "{JECL}: Joint Embedding and Cluster Learning for Image-Text Pairs",
BOOKTITLE = ICPR21,
YEAR = "2021",
PAGES = "8344-8351",
BIBSOURCE = "http://www.visionbib.com/bibliography/applicat803imt4.html#TT238307"}
@inproceedings{bb243394,
  author    = {Mikriukov, G. and Ravanbakhsh, M. and Demir, B.},
  title     = {An Unsupervised Cross-Modal Hashing Method Robust to Noisy Training
Image-Text Correspondences in Remote Sensing},
  booktitle = ICIP22,
  year      = {2022},
  pages     = {2556-2560},
  bibsource = {http://www.visionbib.com/bibliography/applicat803imt4.html#TT238308},
}
@inproceedings{bb243395,
  author    = {Anwaar, M.U. and Labintcev, E. and Kleinsteuber, M.},
  title     = {Compositional Learning of Image-Text Query for Image Retrieval},
  booktitle = WACV21,
  year      = {2021},
  pages     = {1139-1148},
  bibsource = {http://www.visionbib.com/bibliography/applicat803imt4.html#TT238309},
}
@inproceedings{bb243396,
  author    = {Messina, N. and Falchi, F. and Esuli, A. and Amato, G.},
  title     = {Transformer Reasoning Network for Image-Text Matching and Retrieval},
  booktitle = ICPR21,
  year      = {2021},
  pages     = {5222-5229},
  bibsource = {http://www.visionbib.com/bibliography/applicat803imt4.html#TT238310},
}
@inproceedings{bb243397,
  author    = {Zhang, Q. and Lei, Z. and Zhang, Z.X. and Li, S.Z.},
  title     = {Context-Aware Attention Network for Image-Text Retrieval},
  booktitle = CVPR20,
  year      = {2020},
  pages     = {3533-3542},
  bibsource = {http://www.visionbib.com/bibliography/applicat803imt4.html#TT238311},
}
@inproceedings{bb243398,
  author    = {Chen, Y.C. and Li, L.J. and Yu, L.C. and El Kholy, A. and Ahmed, F. and Gan, Z. and Cheng, Y. and Liu, J.J.},
  title     = {Uniter: Universal Image-Text Representation Learning},
  booktitle = ECCV20,
  year      = {2020},
  pages     = {XXX: 104-120},
  bibsource = {http://www.visionbib.com/bibliography/applicat803imt4.html#TT238312},
}
@inproceedings{bb243399,
AUTHOR = "Wang, H.R. and Zhang, Y. and Ji, Z. and Pang, Y.W. and Ma, L.",
TITLE = "Consensus-aware Visual-semantic Embedding for Image-Text Matching",
BOOKTITLE = ECCV20,
YEAR = "2020",
PAGES = "XXIV: 18-34",
BIBSOURCE = "http://www.visionbib.com/bibliography/applicat803imt4.html#TT238313"}
Last update: Jun 4, 2026 at 16:38:45