@inproceedings{bb241100,
AUTHOR = "Li, Z. and Nian, X.H. and Pan, C. and Yang, D. and Xiong, H.Y. and Wang, H.B.",
TITLE = "Relation Graph Reasoning for Image-Text Matching",
BOOKTITLE = ICIVC22,
YEAR = "2022",
PAGES = "319--324",
BIBSOURCE = "http://www.visionbib.com/bibliography/applicat803imt4.html#TT236017"}
@inproceedings{bb241101,
AUTHOR = "Zhang, K. and Mao, Z.D. and Wang, Q. and Zhang, Y.D.",
TITLE = "Negative-Aware Attention Framework for Image-Text Matching",
BOOKTITLE = CVPR22,
YEAR = "2022",
PAGES = "15640--15649",
BIBSOURCE = "http://www.visionbib.com/bibliography/applicat803imt4.html#TT236018"}
@inproceedings{bb241102,
AUTHOR = "Long, S. and Han, S.C. and Wan, X.J. and Poon, J.",
TITLE = "{GraDual}: Graph-based Dual-modal Representation for Image-Text
Matching",
BOOKTITLE = WACV22,
YEAR = "2022",
PAGES = "2463--2472",
BIBSOURCE = "http://www.visionbib.com/bibliography/applicat803imt4.html#TT236019"}
@inproceedings{bb241103,
AUTHOR = "Biten, A.F. and Mafla, A. and Gomez, L. and Karatzas, D.",
TITLE = "Is An Image Worth Five Sentences? A New Look into Semantics for
Image-Text Matching",
BOOKTITLE = WACV22,
YEAR = "2022",
PAGES = "2483--2492",
BIBSOURCE = "http://www.visionbib.com/bibliography/applicat803imt4.html#TT236020"}
@inproceedings{bb241104,
AUTHOR = "Mithun, N.C. and Pasricha, R. and Papalexakis, E. and Roy Chowdhury, A.K.",
TITLE = "Webly Supervised Image-Text Embedding with Noisy Tag Refinement",
BOOKTITLE = ICPR21,
YEAR = "2021",
PAGES = "7454--7461",
BIBSOURCE = "http://www.visionbib.com/bibliography/applicat803imt4.html#TT236021"}
@inproceedings{bb241105,
AUTHOR = "Chen, J.A. and Zhang, L. and Wang, Q. and Bai, C. and Kpalma, K.",
TITLE = "Intra-Modal Constraint Loss for Image-Text Retrieval",
BOOKTITLE = ICIP22,
YEAR = "2022",
PAGES = "4023--4027",
BIBSOURCE = "http://www.visionbib.com/bibliography/applicat803imt4.html#TT236022"}
@inproceedings{bb241106,
AUTHOR = "Liu, Y. and Wang, H.Q. and Meng, F.Y. and Liu, M.Y. and Liu, H.",
TITLE = "Attend, Correct and Focus: A Bidirectional Correct Attention Network
for Image-Text Matching",
BOOKTITLE = ICIP21,
YEAR = "2021",
PAGES = "2673--2677",
BIBSOURCE = "http://www.visionbib.com/bibliography/applicat803imt4.html#TT236023"}
@inproceedings{bb241107,
AUTHOR = "Yang, S.T. and Huang, K.H. and Howe, B.",
TITLE = "{JECL}: Joint Embedding and Cluster Learning for Image-Text Pairs",
BOOKTITLE = ICPR21,
YEAR = "2021",
PAGES = "8344--8351",
BIBSOURCE = "http://www.visionbib.com/bibliography/applicat803imt4.html#TT236024"}
@inproceedings{bb241108,
AUTHOR = "Mikriukov, G. and Ravanbakhsh, M. and Demir, B.",
TITLE = "An Unsupervised Cross-Modal Hashing Method Robust to Noisy Training
Image-Text Correspondences in Remote Sensing",
BOOKTITLE = ICIP22,
YEAR = "2022",
PAGES = "2556--2560",
BIBSOURCE = "http://www.visionbib.com/bibliography/applicat803imt4.html#TT236025"}
@inproceedings{bb241109,
AUTHOR = "Anwaar, M.U. and Labintcev, E. and Kleinsteuber, M.",
TITLE = "Compositional Learning of Image-Text Query for Image Retrieval",
BOOKTITLE = WACV21,
YEAR = "2021",
PAGES = "1139--1148",
BIBSOURCE = "http://www.visionbib.com/bibliography/applicat803imt4.html#TT236026"}
@inproceedings{bb241110,
AUTHOR = "Messina, N. and Falchi, F. and Esuli, A. and Amato, G.",
TITLE = "Transformer Reasoning Network for Image-Text Matching and Retrieval",
BOOKTITLE = ICPR21,
YEAR = "2021",
PAGES = "5222--5229",
BIBSOURCE = "http://www.visionbib.com/bibliography/applicat803imt4.html#TT236027"}
@inproceedings{bb241111,
AUTHOR = "Zhang, Q. and Lei, Z. and Zhang, Z.X. and Li, S.Z.",
TITLE = "Context-Aware Attention Network for Image-Text Retrieval",
BOOKTITLE = CVPR20,
YEAR = "2020",
PAGES = "3533--3542",
BIBSOURCE = "http://www.visionbib.com/bibliography/applicat803imt4.html#TT236028"}
@inproceedings{bb241112,
AUTHOR = "Chen, Y.C. and Li, L.J. and Yu, L.C. and El Kholy, A. and Ahmed, F. and Gan, Z. and Cheng, Y. and Liu, J.J.",
TITLE = "Uniter: Universal Image-Text Representation Learning",
BOOKTITLE = ECCV20,
YEAR = "2020",
PAGES = "XXX: 104--120",
BIBSOURCE = "http://www.visionbib.com/bibliography/applicat803imt4.html#TT236029"}
@inproceedings{bb241113,
AUTHOR = "Wang, H.R. and Zhang, Y. and Ji, Z. and Pang, Y.W. and Ma, L.",
TITLE = "Consensus-aware Visual-semantic Embedding for Image-Text Matching",
BOOKTITLE = ECCV20,
YEAR = "2020",
PAGES = "XXIV: 18--34",
BIBSOURCE = "http://www.visionbib.com/bibliography/applicat803imt4.html#TT236030"}
@inproceedings{bb241114,
AUTHOR = "Chen, T.L. and Deng, J.J. and Luo, J.B.",
TITLE = "Adaptive Offline Quintuplet Loss for Image-text Matching",
BOOKTITLE = ECCV20,
YEAR = "2020",
PAGES = "XIII: 549--565",
BIBSOURCE = "http://www.visionbib.com/bibliography/applicat803imt4.html#TT236031"}
@inproceedings{bb241115,
AUTHOR = "Lee, K.H. and Chen, X. and Hua, G. and Hu, H.D. and He, X.D.",
TITLE = "Stacked Cross Attention for Image-Text Matching",
BOOKTITLE = ECCV18,
YEAR = "2018",
PAGES = "II: 212--228",
BIBSOURCE = "http://www.visionbib.com/bibliography/applicat803imt4.html#TT236032"}
@inproceedings{bb241116,
AUTHOR = "Plummer, B.A. and Kordas, P. and Kiapour, M.H. and Zheng, S. and Piramuthu, R. and Lazebnik, S.",
TITLE = "Conditional Image-Text Embedding Networks",
BOOKTITLE = ECCV18,
YEAR = "2018",
PAGES = "XII: 258--274",
BIBSOURCE = "http://www.visionbib.com/bibliography/applicat803imt4.html#TT236033"}
@article{bb241117,
AUTHOR = "Yang, Z.Y. and Kumar, T. and Chen, T.L. and Su, J.S. and Luo, J.B.",
TITLE = "Grounding-Tracking-Integration",
JOURNAL = CirSysVideo,
VOLUME = "31",
YEAR = "2021",
NUMBER = "9",
MONTH = "September",
PAGES = "3433--3443",
BIBSOURCE = "http://www.visionbib.com/bibliography/applicat803vgr2.html#TT236034"}
@article{bb241118,
AUTHOR = "Zhang, W.X. and Ma, C. and Wu, Q. and Yang, X.K.",
TITLE = "Language-Guided Navigation via Cross-Modal Grounding and Alternate
Adversarial Learning",
JOURNAL = CirSysVideo,
VOLUME = "31",
YEAR = "2021",
NUMBER = "9",
MONTH = "September",
PAGES = "3469--3481",
BIBSOURCE = "http://www.visionbib.com/bibliography/applicat803vgr2.html#TT236035"}
@article{bb241119,
AUTHOR = "Zhai, S.L. and Guo, G.B. and Yuan, F.J. and Liu, Y. and Wang, X.W.",
TITLE = "{VSE-fs}: Fast Full-Sample Visual Semantic Embedding",
JOURNAL = IEEE_Int_Sys,
VOLUME = "36",
YEAR = "2021",
NUMBER = "4",
MONTH = "July",
PAGES = "3--12",
BIBSOURCE = "http://www.visionbib.com/bibliography/applicat803vgr2.html#TT236036"}
@article{bb241120,
AUTHOR = "Bargal, S.A. and Zunino, A. and Petsiuk, V. and Zhang, J.M. and Saenko, K. and Murino, V. and Sclaroff, S.",
TITLE = "Guided Zoom: Zooming into Network Evidence to Refine Fine-Grained
Model Decisions",
JOURNAL = PAMI,
VOLUME = "43",
YEAR = "2021",
NUMBER = "11",
MONTH = "November",
PAGES = "4196--4202",
BIBSOURCE = "http://www.visionbib.com/bibliography/applicat803vgr2.html#TT236037"}
@article{bb241121,
AUTHOR = "Hong, R.C. and Liu, D. and Mo, X.Y. and He, X.N. and Zhang, H.W.",
TITLE = "Learning to Compose and Reason with Language Tree Structures for
Visual Grounding",
JOURNAL = PAMI,
VOLUME = "44",
YEAR = "2022",
NUMBER = "2",
MONTH = "February",
PAGES = "684--696",
BIBSOURCE = "http://www.visionbib.com/bibliography/applicat803vgr2.html#TT236038"}
@inproceedings{bb241122,
AUTHOR = "Tang, K.H. and Zhang, H.W. and Wu, B.Y. and Luo, W.H. and Liu, W.",
TITLE = "Learning to Compose Dynamic Tree Structures for Visual Contexts",
BOOKTITLE = CVPR19,
YEAR = "2019",
PAGES = "6612--6621",
BIBSOURCE = "http://www.visionbib.com/bibliography/applicat803vgr2.html#TT236039"}
@article{bb241123,
AUTHOR = "Bin, Y. and Ding, Y.J. and Peng, B. and Peng, L. and Yang, Y. and Chua, T.S.",
TITLE = "Entity Slot Filling for Visual Captioning",
JOURNAL = CirSysVideo,
VOLUME = "32",
YEAR = "2022",
NUMBER = "1",
MONTH = "January",
PAGES = "52--62",
BIBSOURCE = "http://www.visionbib.com/bibliography/applicat803vgr2.html#TT236040"}
@article{bb241124,
  author    = {Chu, C. and Oliveira, V. and Virgo, F.G. and Otani, M. and Garcia, N. and Nakashima, Y.},
  title     = {The semantic typology of visually grounded paraphrases},
  journal   = CVIU,
  volume    = {215},
  year      = {2022},
  pages     = {103333},
  bibsource = {http://www.visionbib.com/bibliography/applicat803vgr2.html#TT236041}
}
@article{bb241125,
AUTHOR = "Deng, C.R. and Wu, Q. and Wu, Q.Y. and Hu, F.Y. and Lyu, F. and Tan, M.K.",
TITLE = "Visual Grounding Via Accumulated Attention",
JOURNAL = PAMI,
VOLUME = "44",
YEAR = "2022",
NUMBER = "3",
MONTH = "March",
PAGES = "1670--1684",
BIBSOURCE = "http://www.visionbib.com/bibliography/applicat803vgr2.html#TT236042"}
% NOTE(review): the author order below is the exact reverse of the journal
% version of this paper (entry bb241125); verify against the proceedings.
@inproceedings{bb241126,
AUTHOR = "Tan, M.K. and Lyu, F. and Hu, F.Y. and Wu, Q.Y. and Wu, Q. and Deng, C.R.",
TITLE = "Visual Grounding Via Accumulated Attention",
BOOKTITLE = CVPR18,
YEAR = "2018",
PAGES = "7746--7755",
BIBSOURCE = "http://www.visionbib.com/bibliography/applicat803vgr2.html#TT236042"}
@article{bb241127,
AUTHOR = "Yu, X.T. and Zhang, H.M. and Hong, R.X. and Song, Y.Q. and Zhang, C.S.",
TITLE = "{VD-PCR}: Improving visual dialog with pronoun coreference resolution",
JOURNAL = PR,
VOLUME = "125",
YEAR = "2022",
PAGES = "108540",
BIBSOURCE = "http://www.visionbib.com/bibliography/applicat803vgr2.html#TT236043"}
@article{bb241128,
AUTHOR = "Yuan, Y.T. and Ma, L. and Wang, J.W. and Liu, W. and Zhu, W.W.",
TITLE = "Semantic Conditioned Dynamic Modulation for Temporal Sentence
Grounding in Videos",
JOURNAL = PAMI,
VOLUME = "44",
YEAR = "2022",
NUMBER = "5",
MONTH = "May",
PAGES = "2725--2741",
BIBSOURCE = "http://www.visionbib.com/bibliography/applicat803vgr2.html#TT236044"}
@article{bb241129,
  author    = {He, S. and Yang, X.F. and Lin, G.S.},
  title     = {Learning language to symbol and language to vision mapping for visual grounding},
  journal   = IVC,
  volume    = {122},
  year      = {2022},
  pages     = {104451},
  bibsource = {http://www.visionbib.com/bibliography/applicat803vgr2.html#TT236045}
}
@article{bb241130,
AUTHOR = "Jiang, W.H. and Zhu, M. and Fang, Y.M. and Shi, G.M. and Zhao, X.W. and Liu, Y.",
TITLE = "Visual Cluster Grounding for Image Captioning",
JOURNAL = IP,
VOLUME = "31",
YEAR = "2022",
PAGES = "3920--3934",
BIBSOURCE = "http://www.visionbib.com/bibliography/applicat803vgr2.html#TT236046"}
@article{bb241131,
AUTHOR = "Liao, Y. and Zhang, A. and Chen, Z.Y. and Hui, T.R. and Liu, S.",
TITLE = "Progressive Language-Customized Visual Feature Learning for One-Stage
Visual Grounding",
JOURNAL = IP,
VOLUME = "31",
YEAR = "2022",
PAGES = "4266--4277",
BIBSOURCE = "http://www.visionbib.com/bibliography/applicat803vgr2.html#TT236047"}
@article{bb241132,
AUTHOR = "Ding, X.P. and Wang, N.N. and Zhang, S.W. and Huang, Z.Y. and Li, X.M. and Tang, M.Q. and Liu, T.L. and Gao, X.B.",
TITLE = "Exploring Language Hierarchy for Video Grounding",
JOURNAL = IP,
VOLUME = "31",
YEAR = "2022",
PAGES = "4693--4706",
BIBSOURCE = "http://www.visionbib.com/bibliography/applicat803vgr2.html#TT236048"}
@article{bb241133,
AUTHOR = "Xu, Z. and Chen, D. and Wei, K. and Deng, C. and Xue, H.",
TITLE = "{HiSA}: Hierarchically Semantic Associating for Video Temporal
Grounding",
JOURNAL = IP,
VOLUME = "31",
YEAR = "2022",
PAGES = "5178--5188",
BIBSOURCE = "http://www.visionbib.com/bibliography/applicat803vgr2.html#TT236049"}
@article{bb241134,
AUTHOR = "Gao, J.L. and Sun, X. and Ghanem, B. and Zhou, X. and Ge, S.M.",
TITLE = "Efficient Video Grounding With Which-Where Reading Comprehension",
JOURNAL = CirSysVideo,
VOLUME = "32",
YEAR = "2022",
NUMBER = "10",
MONTH = "October",
PAGES = "6900--6913",
BIBSOURCE = "http://www.visionbib.com/bibliography/applicat803vgr2.html#TT236050"}
@article{bb241135,
AUTHOR = "Zhou, H. and Zhang, C.Y. and Luo, Y. and Hu, C.P. and Zhang, W.J.",
TITLE = "Thinking Inside Uncertainty: Interest Moment Perception for Diverse
Temporal Grounding",
JOURNAL = CirSysVideo,
VOLUME = "32",
YEAR = "2022",
NUMBER = "10",
MONTH = "October",
PAGES = "7190--7203",
BIBSOURCE = "http://www.visionbib.com/bibliography/applicat803vgr2.html#TT236051"}
@article{bb241136,
AUTHOR = "Tang, Z.H. and Liao, Y. and Liu, S. and Li, G.B. and Jin, X.J. and Jiang, H.X. and Yu, Q. and Xu, D.",
TITLE = "Human-Centric Spatio-Temporal Video Grounding With Visual
Transformers",
JOURNAL = CirSysVideo,
VOLUME = "32",
YEAR = "2022",
NUMBER = "12",
MONTH = "December",
PAGES = "8238--8249",
BIBSOURCE = "http://www.visionbib.com/bibliography/applicat803vgr2.html#TT236052"}
@article{bb241137,
AUTHOR = "Wang, W. and Gao, J.Y. and Xu, C.S.",
TITLE = "Weakly-Supervised Video Object Grounding via Causal Intervention",
JOURNAL = PAMI,
VOLUME = "45",
YEAR = "2023",
NUMBER = "3",
MONTH = "March",
PAGES = "3933--3948",
BIBSOURCE = "http://www.visionbib.com/bibliography/applicat803vgr2.html#TT236053"}
@article{bb241138,
AUTHOR = "Wang, W. and Gao, J.Y. and Xu, C.S.",
TITLE = "Weakly-Supervised Video Object Grounding via Learning Uni-Modal
Associations",
JOURNAL = MultMed,
VOLUME = "25",
YEAR = "2023",
PAGES = "6329--6340",
BIBSOURCE = "http://www.visionbib.com/bibliography/applicat803vgr2.html#TT236054"}
@article{bb241139,
AUTHOR = "Nayyeri, M. and Xu, C.J. and Alam, M.M. and Lehmann, J. and Yazdi, H.S.",
TITLE = "{LogicENN}: A Neural Based Knowledge Graphs Embedding Model With
Logical Rules",
JOURNAL = PAMI,
VOLUME = "45",
YEAR = "2023",
NUMBER = "6",
MONTH = "June",
PAGES = "7050--7062",
BIBSOURCE = "http://www.visionbib.com/bibliography/applicat803vgr2.html#TT236055"}
@article{bb241140,
AUTHOR = "Chen, T.B. and Wang, W. and Han, K. and Xu, H.J.",
TITLE = "{SaGCN}: Semantic-Aware Graph Calibration Network for Temporal Sentence
Grounding",
JOURNAL = CirSysVideo,
VOLUME = "33",
YEAR = "2023",
NUMBER = "6",
MONTH = "June",
PAGES = "3003--3016",
BIBSOURCE = "http://www.visionbib.com/bibliography/applicat803vgr2.html#TT236056"}
@article{bb241141,
AUTHOR = "Zhang, H. and Sun, A. and Jing, W. and Zhou, J.T.Y.",
TITLE = "Temporal Sentence Grounding in Videos: A Survey and Future Directions",
JOURNAL = PAMI,
VOLUME = "45",
YEAR = "2023",
NUMBER = "8",
MONTH = "August",
PAGES = "10443--10465",
BIBSOURCE = "http://www.visionbib.com/bibliography/applicat803vgr2.html#TT236057"}
@article{bb241142,
AUTHOR = "Deng, J.J. and Yang, Z.Y. and Liu, D. and Chen, T.L. and Zhou, W.G. and Zhang, Y. and Li, H.Q. and Ouyang, W.L.",
TITLE = "{TransVG++}: End-to-End Visual Grounding With Language Conditioned
Vision Transformer",
JOURNAL = PAMI,
VOLUME = "45",
YEAR = "2023",
NUMBER = "11",
MONTH = "November",
PAGES = "13636--13652",
BIBSOURCE = "http://www.visionbib.com/bibliography/applicat803vgr2.html#TT236058"}
@inproceedings{bb241143,
AUTHOR = "Deng, J.J. and Yang, Z.Y. and Chen, T.L. and Zhou, W.G. and Li, H.Q.",
TITLE = "{TransVG}: End-to-End Visual Grounding with Transformers",
BOOKTITLE = ICCV21,
YEAR = "2021",
PAGES = "1749--1759",
BIBSOURCE = "http://www.visionbib.com/bibliography/applicat803vgr2.html#TT236059"}
@article{bb241144,
AUTHOR = "Li, J.C. and Tang, S.L. and Zhu, L.C. and Zhang, W.Q. and Yang, Y. and Chua, T.S. and Wu, F. and Zhuang, Y.T.",
TITLE = "Variational Cross-Graph Reasoning and Adaptive Structured Semantics
Learning for Compositional Temporal Grounding",
JOURNAL = PAMI,
VOLUME = "45",
YEAR = "2023",
NUMBER = "10",
MONTH = "October",
PAGES = "12601--12617",
BIBSOURCE = "http://www.visionbib.com/bibliography/applicat803vgr2.html#TT236060"}
@inproceedings{bb241145,
AUTHOR = "Li, J.C. and Xie, J.L. and Qian, L. and Zhu, L.C. and Tang, S.L. and Wu, F. and Yang, Y. and Zhuang, Y.T. and Wang, X.E.",
TITLE = "Compositional Temporal Grounding with Structured Variational
Cross-Graph Correspondence Learning",
BOOKTITLE = CVPR22,
YEAR = "2022",
PAGES = "3022--3031",
BIBSOURCE = "http://www.visionbib.com/bibliography/applicat803vgr2.html#TT236061"}
@article{bb241146,
AUTHOR = "Gonzalez, C. and Ayobi, N. and Hernandez, I. and Pont Tuset, J. and Arbelaez, P.",
TITLE = "{PiGLET}: Pixel-Level Grounding of Language Expressions With
Transformers",
JOURNAL = PAMI,
VOLUME = "45",
YEAR = "2023",
NUMBER = "10",
MONTH = "October",
PAGES = "12206--12221",
BIBSOURCE = "http://www.visionbib.com/bibliography/applicat803vgr2.html#TT236062"}
@article{bb241147,
AUTHOR = "Zhang, R.S. and Wang, C. and Liu, C.L.",
TITLE = "Cycle-Consistent Weakly Supervised Visual Grounding With Individual
and Contextual Representations",
JOURNAL = IP,
VOLUME = "32",
YEAR = "2023",
PAGES = "5167--5180",
BIBSOURCE = "http://www.visionbib.com/bibliography/applicat803vgr2.html#TT236063"}
@article{bb241148,
AUTHOR = "Wang, Y. and Su, Y.T. and Li, W.H. and Xiao, J. and Li, X.Y. and Liu, A.A.",
TITLE = "Dual-Path Rare Content Enhancement Network for Image and Text
Matching",
JOURNAL = CirSysVideo,
VOLUME = "33",
YEAR = "2023",
NUMBER = "10",
MONTH = "October",
PAGES = "6144--6158",
BIBSOURCE = "http://www.visionbib.com/bibliography/applicat803vgr2.html#TT236064"}
@article{bb241149,
AUTHOR = "Xu, Z. and Wei, K. and Yang, X. and Deng, C.",
TITLE = "Point-Supervised Video Temporal Grounding",
JOURNAL = MultMed,
VOLUME = "25",
YEAR = "2023",
PAGES = "6121--6131",
BIBSOURCE = "http://www.visionbib.com/bibliography/applicat803vgr2.html#TT236065"}
@article{bb241150,
AUTHOR = "Luo, F. and Chen, S.X. and Chen, J.J. and Wu, Z.X. and Jiang, Y.G.",
TITLE = "Self-Supervised Learning for Semi-Supervised Temporal Language
Grounding",
JOURNAL = MultMed,
VOLUME = "25",
YEAR = "2023",
PAGES = "7747--7757",
BIBSOURCE = "http://www.visionbib.com/bibliography/applicat803vgr2.html#TT236066"}
@article{bb241151,
AUTHOR = "Liu, D.Z. and Fang, X. and Hu, W. and Zhou, P.",
TITLE = "Exploring Optical-Flow-Guided Motion and Detection-Based Appearance
for Temporal Sentence Grounding",
JOURNAL = MultMed,
VOLUME = "25",
YEAR = "2023",
PAGES = "8539--8553",
BIBSOURCE = "http://www.visionbib.com/bibliography/applicat803vgr2.html#TT236067"}
@article{bb241152,
AUTHOR = "Yang, X.F. and Liu, F. and Lin, G.S.",
TITLE = "Effective End-to-End Vision Language Pretraining With Semantic Visual
Loss",
JOURNAL = MultMed,
VOLUME = "25",
YEAR = "2023",
PAGES = "8408--8417",
BIBSOURCE = "http://www.visionbib.com/bibliography/applicat803vgr2.html#TT236068"}
@article{bb241153,
AUTHOR = "Ma, G.Q. and Bai, Y. and Zhang, W. and Yao, T. and Shihada, B. and Mei, T.",
TITLE = "Boosting Generic Visual-Linguistic Representation With Dynamic
Contexts",
JOURNAL = MultMed,
VOLUME = "25",
YEAR = "2023",
PAGES = "8445--8457",
BIBSOURCE = "http://www.visionbib.com/bibliography/applicat803vgr2.html#TT236069"}
@article{bb241154,
AUTHOR = "Su, C. and Li, Z. and Lei, T.Y. and Peng, D.Z. and Wang, X.",
TITLE = "{MetaVG}: A Meta-Learning Framework for Visual Grounding",
JOURNAL = SPLetters,
VOLUME = "31",
YEAR = "2024",
PAGES = "236--240",
BIBSOURCE = "http://www.visionbib.com/bibliography/applicat803vgr2.html#TT236070"}
@article{bb241155,
AUTHOR = "Fang, X. and Liu, D. and Zhou, P. and Xu, Z.C. and Li, R.X.",
TITLE = "Hierarchical Local-Global Transformer for Temporal Sentence Grounding",
JOURNAL = MultMed,
VOLUME = "26",
YEAR = "2024",
PAGES = "3263--3277",
BIBSOURCE = "http://www.visionbib.com/bibliography/applicat803vgr2.html#TT236071"}
@article{bb241156,
AUTHOR = "Wang, Z.Y. and Yang, C. and Jiang, B. and Yuan, J.S.",
TITLE = "A Dual Reinforcement Learning Framework for Weakly Supervised Phrase
Grounding",
JOURNAL = MultMed,
VOLUME = "26",
YEAR = "2024",
PAGES = "394--405",
BIBSOURCE = "http://www.visionbib.com/bibliography/applicat803vgr2.html#TT236072"}
@article{bb241157,
AUTHOR = "Lu, Y. and Quan, R.J. and Zhu, L.C. and Yang, Y.",
TITLE = "Zero-Shot Video Grounding With Pseudo Query Lookup and Verification",
JOURNAL = IP,
VOLUME = "33",
YEAR = "2024",
PAGES = "1643--1654",
BIBSOURCE = "http://www.visionbib.com/bibliography/applicat803vgr2.html#TT236073"}
@article{bb241158,
AUTHOR = "Wang, W.K. and Su, Y.T. and Liu, J. and Jing, P.G.",
TITLE = "Adaptive proposal network based on generative adversarial learning
for weakly supervised temporal sentence grounding",
JOURNAL = PRL,
VOLUME = "179",
YEAR = "2024",
PAGES = "9--16",
BIBSOURCE = "http://www.visionbib.com/bibliography/applicat803vgr2.html#TT236074"}
% NOTE(review): this page range is identical to the one in entry bb241140
% (same journal, different volume); verify it against the publisher record.
@article{bb241159,
AUTHOR = "Liu, M. and Zhou, D. and Guo, J. and Luo, X. and Gao, Z. and Nie, L.Q.",
TITLE = "Semantic-Aware Contrastive Learning With Proposal Suppression for
Video Semantic Role Grounding",
JOURNAL = CirSysVideo,
VOLUME = "34",
YEAR = "2024",
NUMBER = "4",
MONTH = "April",
PAGES = "3003--3016",
BIBSOURCE = "http://www.visionbib.com/bibliography/applicat803vgr2.html#TT236075"}
@article{bb241160,
AUTHOR = "Tang, W. and Li, L. and Liu, X.J. and Jin, L. and Tang, J.H. and Li, Z.C.",
TITLE = "Context Disentangling and Prototype Inheriting for Robust Visual
Grounding",
JOURNAL = PAMI,
VOLUME = "46",
YEAR = "2024",
NUMBER = "5",
MONTH = "May",
PAGES = "3213--3229",
BIBSOURCE = "http://www.visionbib.com/bibliography/applicat803vgr2.html#TT236076"}
@article{bb241161,
  author    = {Shi, F.Y. and Huang, W.L. and Wang, L.M.},
  title     = {End-to-end dense video grounding via parallel regression},
  journal   = CVIU,
  volume    = {242},
  year      = {2024},
  pages     = {103980},
  bibsource = {http://www.visionbib.com/bibliography/applicat803vgr2.html#TT236077}
}
@article{bb241162,
AUTHOR = "Shao, R. and Wu, T.X. and Wu, J.L. and Nie, L.Q. and Liu, Z.W.",
TITLE = "Detecting and Grounding Multi-Modal Media Manipulation and Beyond",
JOURNAL = PAMI,
VOLUME = "46",
YEAR = "2024",
NUMBER = "8",
MONTH = "August",
PAGES = "5556--5574",
BIBSOURCE = "http://www.visionbib.com/bibliography/applicat803vgr2.html#TT236078"}
@inproceedings{bb241163,
AUTHOR = "Shao, R. and Wu, T.X. and Liu, Z.W.",
TITLE = "Detecting and Grounding Multi-Modal Media Manipulation",
BOOKTITLE = CVPR23,
YEAR = "2023",
PAGES = "6904--6913",
BIBSOURCE = "http://www.visionbib.com/bibliography/applicat803vgr2.html#TT236079"}
@article{bb241164,
AUTHOR = "Chen, L. and Deng, Z. and Liu, L.B. and Yin, S.",
TITLE = "Multilevel Semantic Interaction Alignment for Video-Text Cross-Modal
Retrieval",
JOURNAL = CirSysVideo,
VOLUME = "34",
YEAR = "2024",
NUMBER = "7",
MONTH = "July",
PAGES = "6559--6575",
BIBSOURCE = "http://www.visionbib.com/bibliography/applicat803vgr2.html#TT236080"}
@article{bb241165,
AUTHOR = "Wu, Q.Q. and Guo, L.J. and Zhang, R. and Qian, J.B. and Gao, S.",
TITLE = "{QSMT-net}: A query-sensitive proposal and multi-temporal-span matching
network for video grounding",
JOURNAL = IVC,
VOLUME = "149",
YEAR = "2024",
PAGES = "105188",
BIBSOURCE = "http://www.visionbib.com/bibliography/applicat803vgr2.html#TT236081"}
@article{bb241166,
AUTHOR = "Wu, W. and Cao, M. and Hu, Y. and Peng, Y. and Qin, L. and Yin, Q.",
TITLE = "Visual Grounding With Dual Knowledge Distillation",
JOURNAL = CirSysVideo,
VOLUME = "34",
YEAR = "2024",
NUMBER = "10",
MONTH = "October",
PAGES = "10399--10410",
BIBSOURCE = "http://www.visionbib.com/bibliography/applicat803vgr2.html#TT236082"}
@article{bb241167,
AUTHOR = "Li, S.T. and Li, B. and Sun, B. and Weng, Y.X.",
TITLE = "Towards Visual-Prompt Temporal Answer Grounding in Instructional
Video",
JOURNAL = PAMI,
VOLUME = "46",
YEAR = "2024",
NUMBER = "12",
MONTH = "December",
PAGES = "8836--8853",
BIBSOURCE = "http://www.visionbib.com/bibliography/applicat803vgr2.html#TT236083"}
@inproceedings{bb241168,
AUTHOR = "Fang, X. and Xiong, Z. and Fang, W.L. and Qu, X.Y. and Chen, C. and Dong, J.F. and Tang, K. and Zhou, P. and Cheng, Y. and Liu, D.Z.",
TITLE = "Rethinking Weakly-supervised Video Temporal Grounding From a Game
Perspective",
BOOKTITLE = ECCV24,
YEAR = "2024",
PAGES = "XLV: 290--311",
BIBSOURCE = "http://www.visionbib.com/bibliography/applicat803vgr2.html#TT236084"}
@article{bb241169,
AUTHOR = "Xiong, Z. and Liu, D.Z. and Fang, X. and Qu, X.Y. and Dong, J.F. and Zhu, J.H. and Tang, K. and Zhou, P.",
TITLE = "Rethinking Video Sentence Grounding from a Tracking Perspective With
Memory Network and Masked Attention",
JOURNAL = MultMed,
VOLUME = "26",
YEAR = "2024",
PAGES = "11204--11218",
BIBSOURCE = "http://www.visionbib.com/bibliography/applicat803vgr2.html#TT236085"}
@article{bb241170,
AUTHOR = "Qi, Z.B. and Yuan, Y. and Ruan, X.W. and Wang, S.H. and Zhang, W.G. and Huang, Q.M.",
TITLE = "Collaborative Debias Strategy for Temporal Sentence Grounding in
Video",
JOURNAL = CirSysVideo,
VOLUME = "34",
YEAR = "2024",
NUMBER = "11",
MONTH = "November",
PAGES = "10972--10986",
BIBSOURCE = "http://www.visionbib.com/bibliography/applicat803vgr2.html#TT236086"}
@article{bb241171,
  author    = {Dong, J.X. and Yin, Z.Z.},
  title     = {Graph-based Dense Event Grounding with relative positional encoding},
  journal   = CVIU,
  volume    = {251},
  year      = {2025},
  pages     = {104257},
  bibsource = {http://www.visionbib.com/bibliography/applicat803vgr2.html#TT236087}
}
@article{bb241172,
AUTHOR = "Tang, K.F. and He, L.H. and Wang, N.N. and Gao, X.B.",
TITLE = "Dual Semantic Reconstruction Network for Weakly Supervised Temporal
Sentence Grounding",
JOURNAL = MultMed,
VOLUME = "27",
YEAR = "2025",
PAGES = "95--107",
BIBSOURCE = "http://www.visionbib.com/bibliography/applicat803vgr2.html#TT236088"}
@article{bb241173,
AUTHOR = "Wang, C.L. and Feng, W.Q. and Lyu, S.C. and Cheng, G.L. and Li, X.T. and Liu, B.H. and Zhao, Q.",
TITLE = "A Masked Reference Token Supervision-Based Iterative Visual-Language
Framework for Robust Visual Grounding",
JOURNAL = CirSysVideo,
VOLUME = "35",
YEAR = "2025",
NUMBER = "1",
MONTH = "January",
PAGES = "75--90",
BIBSOURCE = "http://www.visionbib.com/bibliography/applicat803vgr2.html#TT236089"}
@inproceedings{bb241174,
AUTHOR = "Li, M.H. and Wang, C.L. and Feng, W.Q. and Lyu, S.C. and Cheng, G.L. and Li, X.T. and Liu, B.H. and Zhao, Q.",
TITLE = "Iterative Robust Visual Grounding with Masked Reference based
Centerpoint Supervision",
BOOKTITLE = VLAR23,
YEAR = "2023",
PAGES = "4653--4658",
BIBSOURCE = "http://www.visionbib.com/bibliography/applicat803vgr2.html#TT236090"}
@article{bb241175,
AUTHOR = "Liu, H. and Tan, Z.C. and Chen, Q. and Wei, Y.C. and Zhao, Y. and Wang, J.D.",
TITLE = "Unified Frequency-Assisted Transformer Framework for Detecting and
Grounding Multi-modal Manipulation",
JOURNAL = IJCV,
VOLUME = "133",
YEAR = "2025",
NUMBER = "3",
MONTH = "March",
PAGES = "1392--1409",
BIBSOURCE = "http://www.visionbib.com/bibliography/applicat803vgr2.html#TT236091"}
@article{bb241176,
AUTHOR = "Ding, Y. and Wang, D. and Li, K. and Zhao, X.H. and Wang, Y.F.",
TITLE = "Visual grounding of remote sensing images with multi-dimensional
semantic-guidance",
JOURNAL = PRL,
VOLUME = "189",
YEAR = "2025",
PAGES = "85--91",
BIBSOURCE = "http://www.visionbib.com/bibliography/applicat803vgr2.html#TT236092"}
@article{bb241177,
AUTHOR = "Li, T.Y. and Wang, C. and Tian, S. and Zhang, B. and Wu, F. and Tang, Y.X. and Zhang, H.",
TITLE = "{TACMT}: Text-aware cross-modal transformer for visual grounding on
high-resolution {SAR} images",
JOURNAL = PandRS,
VOLUME = "222",
YEAR = "2025",
PAGES = "152--166",
BIBSOURCE = "http://www.visionbib.com/bibliography/applicat803vgr2.html#TT236093"}
@article{bb241178,
  author    = {Han, T.T. and Wang, K. and Yu, J. and Zhao, S.C. and Fan, J.P.},
  title     = {Adversarial temporal sentence grounding by learning from external data},
  journal   = PR,
  volume    = {165},
  year      = {2025},
  pages     = {111621},
  bibsource = {http://www.visionbib.com/bibliography/applicat803vgr2.html#TT236094}
}
@article{bb241179,
AUTHOR = "Guan, R.W. and Jia, L. and Yao, S. and Yang, F.Y.F. and Xu, S. and Purwanto, E. and Zhu, X.H. and Man, K.L. and Lim, E.G. and Smith, J. and Hu, X.M. and Yue, Y.T.",
TITLE = "{WaterVG}: Waterway Visual Grounding Based on Text-Guided Vision and
{mmWave} Radar",
JOURNAL = ITS,
VOLUME = "26",
YEAR = "2025",
NUMBER = "5",
MONTH = "May",
PAGES = "7275--7291",
BIBSOURCE = "http://www.visionbib.com/bibliography/applicat803vgr2.html#TT236095"}
@article{bb241180,
AUTHOR = "Choudhury, S. and Kurkure, P. and Banerjee, B.",
TITLE = "Improving visual grounding in remote sensing images with adaptive
modality guidance",
JOURNAL = PandRS,
VOLUME = "224",
YEAR = "2025",
PAGES = "42--58",
BIBSOURCE = "http://www.visionbib.com/bibliography/applicat803vgr2.html#TT236096"}
@article{bb241181,
AUTHOR = "Liu, K. and Qu, M.X. and Liu, Y. and Wei, Y.C. and Zhe, W.M. and Zhao, Y. and Liu, W.",
TITLE = "Single-Frame Supervision for Spatio-Temporal Video Grounding",
JOURNAL = PAMI,
VOLUME = "47",
YEAR = "2025",
NUMBER = "7",
MONTH = "July",
PAGES = "5177--5191",
BIBSOURCE = "http://www.visionbib.com/bibliography/applicat803vgr2.html#TT236097"}
@article{bb241182,
AUTHOR = "Li, Y.X. and Wang, Z. and Liang, W.",
TITLE = "{R2G}: Reasoning to ground in {3D} scenes",
JOURNAL = PR,
VOLUME = "168",
YEAR = "2025",
PAGES = "111728",
BIBSOURCE = "http://www.visionbib.com/bibliography/applicat803vgr2.html#TT236098"}
@article{bb241183,
AUTHOR = "Hu, J.J. and Guo, D. and Li, K. and Si, Z. and Yang, X. and Chang, X.J. and Wang, M.",
TITLE = "Unified Static and Dynamic Network: Efficient Temporal Filtering for
Video Grounding",
JOURNAL = PAMI,
VOLUME = "47",
YEAR = "2025",
NUMBER = "8",
MONTH = "August",
PAGES = "6445--6462",
BIBSOURCE = "http://www.visionbib.com/bibliography/applicat803vgr2.html#TT236099"}
@article{bb241184,
AUTHOR = "Xie, M.H. and Wang, M.Z. and Li, H.F. and Zhang, Y.F. and Tao, D.P. and Yu, Z.T.",
TITLE = "Phrase Decoupling Cross-Modal Hierarchical Matching and Progressive
Position Correction for Visual Grounding",
JOURNAL = MultMed,
VOLUME = "27",
YEAR = "2025",
PAGES = "3979--3991",
BIBSOURCE = "http://www.visionbib.com/bibliography/applicat803vgr2.html#TT236100"}
@article{bb241185,
AUTHOR = "Geng, L. and Yin, J.Q. and Chen, G. and Jia, Q.X.",
TITLE = "{Pseudo-EV}: Enhancing {3D} Visual Grounding With Pseudo Embodied
Viewpoint",
JOURNAL = CirSysVideo,
VOLUME = "35",
YEAR = "2025",
NUMBER = "8",
MONTH = "August",
PAGES = "8031--8044",
BIBSOURCE = "http://www.visionbib.com/bibliography/applicat803vgr2.html#TT236101"}
@article{bb241186,
  author    = {Zhu, H. and Gao, T.Q. and Li, Z.X. and Chen, Z.P. and Li, Q. and Miao, K. and Hou, B. and Jiao, L.C.},
  title     = {Cascaded Hierarchical Attention with Adaptive Fusion for Visual Grounding in Remote Sensing},
  journal   = RS,
  volume    = {17},
  year      = {2025},
  number    = {17},
  pages     = {2930},
  bibsource = {http://www.visionbib.com/bibliography/applicat803vgr2.html#TT236102}
}
@article{bb241187,
AUTHOR = "Chi, H. and Qin, W.W. and Chen, X.Y. and Guo, W.X. and An, B.",
TITLE = "{TVI-MFAN}: A Text-Visual Interaction Multilevel Feature Alignment
Network for Visual Grounding in Remote Sensing",
JOURNAL = RS,
VOLUME = "17",
YEAR = "2025",
NUMBER = "17",
PAGES = "2993",
BIBSOURCE = "http://www.visionbib.com/bibliography/applicat803vgr2.html#TT236103"}
@article{bb241188,
AUTHOR = "Liu, D. and Hu, W.",
TITLE = "Imperceptible Backdoor Attacks on Text-Guided {3D} Scene Grounding",
JOURNAL = MultMed,
VOLUME = "27",
YEAR = "2025",
PAGES = "5466--5479",
BIBSOURCE = "http://www.visionbib.com/bibliography/applicat803vgr2.html#TT236104"}
@article{bb241189,
AUTHOR = "Bu, Y.Q. and Wu, X. and Cai, Y. and Liu, Q. and Wang, T. and Huang, Q.",
TITLE = "Error-Aware Generative Reasoning for Zero-Shot Visual Grounding",
JOURNAL = MultMed,
VOLUME = "27",
YEAR = "2025",
PAGES = "4844--4855",
BIBSOURCE = "http://www.visionbib.com/bibliography/applicat803vgr2.html#TT236105"}
@article{bb241190,
AUTHOR = "Qiao, G. and Yi, D. and Wu, L.X. and Wu, H.X. and Wang, J.Q.",
TITLE = "Enhancing Visual Aligning and Grounding for Aerial Vision-and-Dialog
Navigation",
JOURNAL = SPLetters,
VOLUME = "32",
YEAR = "2025",
PAGES = "2853--2857",
BIBSOURCE = "http://www.visionbib.com/bibliography/applicat803vgr2.html#TT236106"}
@article{bb241191,
AUTHOR = "Ran, R. and Wei, J. and Zhou, Y.Y. and Guan, X. and Yang, Y. and Shen, H.T.",
TITLE = "{HCFMN}: Hierarchical Cross-Modal Fine-Grained Mining Network for
Temporal Sentence Grounding",
JOURNAL = MultMed,
VOLUME = "27",
YEAR = "2025",
PAGES = "6462--6474",
BIBSOURCE = "http://www.visionbib.com/bibliography/applicat803vgr2.html#TT236107"}
@article{bb241192,
AUTHOR = "Wang, M.Z. and Li, H.F. and Zhang, Y.F. and Li, J.X. and Xie, M.H. and Tao, D.P.",
TITLE = "Dual-Task Mutual Reinforcing Embedded Joint Video Paragraph Retrieval
and Grounding",
JOURNAL = MultMed,
VOLUME = "27",
YEAR = "2025",
PAGES = "5879--5894",
BIBSOURCE = "http://www.visionbib.com/bibliography/applicat803vgr2.html#TT236108"}
@article{bb241193,
AUTHOR = "Dong, L. and Zhang, H. and Zhang, H.J. and Huang, Y.F. and Ling, Z.H. and Qiao, Y. and Wang, L.M. and Wang, Y.",
TITLE = "Weakly Supervised Temporal Sentence Grounding via Positive Sample
Mining",
JOURNAL = CirSysVideo,
VOLUME = "35",
YEAR = "2025",
NUMBER = "10",
MONTH = "October",
PAGES = "10396--10409",
BIBSOURCE = "http://www.visionbib.com/bibliography/applicat803vgr2.html#TT236109"}
@article{bb241194,
AUTHOR = "Zhu, Z.H. and Huang, Y.F. and Zhang, M.F. and Ouyang, L.Y. and Sato, Y.",
TITLE = "Prompt-Augmented Boundary Attentive Learning for Weakly Supervised
Temporal Sentence Grounding",
JOURNAL = CirSysVideo,
VOLUME = "35",
YEAR = "2025",
NUMBER = "11",
MONTH = "November",
PAGES = "11404--11415",
BIBSOURCE = "http://www.visionbib.com/bibliography/applicat803vgr2.html#TT236110"}
@inproceedings{bb241195,
AUTHOR = "Huang, Y.F. and Yang, L. and Sato, Y.",
TITLE = "Weakly Supervised Temporal Sentence Grounding with Uncertainty-Guided
Self-training",
BOOKTITLE = CVPR23,
YEAR = "2023",
PAGES = "18908--18918",
BIBSOURCE = "http://www.visionbib.com/bibliography/applicat803vgr2.html#TT236111"}
@article{bb241196,
AUTHOR = "Xu, X.X. and Yuan, Y.T. and Zhang, Q.D. and Wu, W.H. and Jie, Z.Q. and Ma, L. and Wang, X.",
TITLE = "Weakly-Supervised {3D} Visual Grounding Based on Visual Language
Alignment",
JOURNAL = MultMed,
VOLUME = "27",
YEAR = "2025",
PAGES = "7662--7674",
BIBSOURCE = "http://www.visionbib.com/bibliography/applicat803vgr2.html#TT236112"}
@inproceedings{bb241197,
AUTHOR = "Liu, Y.F. and Wan, B. and Ma, L. and He, X.M.",
TITLE = "Relation-aware Instance Refinement for Weakly Supervised Visual
Grounding",
BOOKTITLE = CVPR21,
YEAR = "2021",
PAGES = "5608--5617",
BIBSOURCE = "http://www.visionbib.com/bibliography/applicat803vgr2.html#TT236113"}
@article{bb241198,
AUTHOR = "Ran, R. and Wei, J. and He, S.Y. and Zhou, Y.Y. and Wang, P. and Yang, Y. and Shen, H.T.",
TITLE = "Fine-Grained Alignment and Interaction for Video Grounding With
Cross-Modal Semantic Hierarchical Graph",
JOURNAL = CirSysVideo,
VOLUME = "35",
YEAR = "2025",
NUMBER = "11",
MONTH = "November",
PAGES = "11641--11654",
BIBSOURCE = "http://www.visionbib.com/bibliography/applicat803vgr2.html#TT236114"}
@article{bb241199,
AUTHOR = "Wang, M.Z. and Li, H.F. and Zhang, Y.F. and Li, J.X. and Tao, D.P. and Yu, Z.T.",
TITLE = "Disentangling Inter- and Intra-Video Relations for Multi-Event
Video-Text Retrieval and Grounding",
JOURNAL = IP,
VOLUME = "34",
YEAR = "2025",
PAGES = "7558--7571",
BIBSOURCE = "http://www.visionbib.com/bibliography/applicat803vgr2.html#TT236115"}
Last update: Feb 26, 2026 at 10:58:24