@comment{
  Entries bb129600 through bb129699, one entry per block, one field per line.
  Bare identifiers used as JOURNAL / BOOKTITLE values (RS, IP, IET-CV,
  CirSysVideo, CVIU, IVC, PRL, PAMI, IJCV, PR, ITS, SPLetters, PandRS,
  MultMed, CVPR22, ECCV22, ...) are string macros; their definitions are not
  part of this span and must be provided elsewhere.
  For inproceedings entries, a roman-numeral prefix in PAGES (for example
  "III: 185-203") appears to be the proceedings volume -- confirm before
  normalizing.
}

@comment{
  NOTE(review) bb129600: PAGES holds the placeholder "xx-yy". The other RS
  entry in this span (bb129664) stores an article number in PAGES; look up
  the real value and fill it in.
}
@article{bb129600,
  AUTHOR    = "Ren, Z.H. and Gou, S.P. and Guo, Z. and Mao, S.S. and Li, R.M.",
  TITLE     = "A Mask-Guided Transformer Network with Topic Token for Remote Sensing Image Captioning",
  JOURNAL   = RS,
  VOLUME    = "14",
  YEAR      = "2022",
  NUMBER    = "12",
  PAGES     = "xx-yy",
  BIBSOURCE = "http://www.visionbib.com/bibliography/match607tic2.html#TT125643"
}

@article{bb129601,
  AUTHOR    = "Ji, J.Y. and Ma, Y.W. and Sun, X.S. and Zhou, Y. and Wu, Y.J. and Ji, R.R.",
  TITLE     = "Knowing What to Learn: A Metric-Oriented Focal Mechanism for Image Captioning",
  JOURNAL   = IP,
  VOLUME    = "31",
  YEAR      = "2022",
  PAGES     = "4321-4335",
  BIBSOURCE = "http://www.visionbib.com/bibliography/match607tic2.html#TT125644"
}

@article{bb129602,
  AUTHOR    = "Li, X. and Zhang, W.K. and Sun, X. and Gao, X.",
  TITLE     = "Semantic-meshed and content-guided transformer for image captioning",
  JOURNAL   = IET-CV,
  VOLUME    = "16",
  YEAR      = "2022",
  NUMBER    = "5",
  PAGES     = "431-444",
  BIBSOURCE = "http://www.visionbib.com/bibliography/match607tic2.html#TT125645"
}

@article{bb129603,
  AUTHOR    = "Xian, T.T. and Li, Z.X. and Tang, Z.J. and Ma, H.F.",
  TITLE     = "Adaptive Path Selection for Dynamic Image Captioning",
  JOURNAL   = CirSysVideo,
  VOLUME    = "32",
  YEAR      = "2022",
  NUMBER    = "9",
  MONTH     = "September",
  PAGES     = "5762-5775",
  BIBSOURCE = "http://www.visionbib.com/bibliography/match607tic2.html#TT125646"
}

@article{bb129604,
  AUTHOR    = "Cao, S. and An, G. and Zheng, Z.X. and Wang, Z.Y.",
  TITLE     = "Vision-Enhanced and Consensus-Aware Transformer for Image Captioning",
  JOURNAL   = CirSysVideo,
  VOLUME    = "32",
  YEAR      = "2022",
  NUMBER    = "10",
  MONTH     = "October",
  PAGES     = "7005-7018",
  BIBSOURCE = "http://www.visionbib.com/bibliography/match607tic2.html#TT125647"
}

@article{bb129605,
  AUTHOR    = "Jiang, W.T. and Zhou, W. and Hu, H.F.",
  TITLE     = "Double-Stream Position Learning Transformer Network for Image Captioning",
  JOURNAL   = CirSysVideo,
  VOLUME    = "32",
  YEAR      = "2022",
  NUMBER    = "11",
  MONTH     = "November",
  PAGES     = "7706-7718",
  BIBSOURCE = "http://www.visionbib.com/bibliography/match607tic2.html#TT125648"
}

@article{bb129606,
  AUTHOR    = "Li, J.C. and Zhou, W. and Wang, K. and Hu, H.F.",
  TITLE     = "Triple-Stream Commonsense Circulation Transformer Network for Image Captioning",
  JOURNAL   = CVIU,
  VOLUME    = "249",
  YEAR      = "2024",
  PAGES     = "104165",
  BIBSOURCE = "http://www.visionbib.com/bibliography/match607tic2.html#TT125649"
}

@article{bb129607,
  AUTHOR    = "Hu, J.T. and Yang, Y. and Yao, L. and An, Y.Z. and Pan, L.",
  TITLE     = "Position-guided transformer for image captioning",
  JOURNAL   = IVC,
  VOLUME    = "128",
  YEAR      = "2022",
  PAGES     = "104575",
  BIBSOURCE = "http://www.visionbib.com/bibliography/match607tic2.html#TT125650"
}

@article{bb129608,
  AUTHOR    = "Wang, Z.G. and Shi, S. and Zhai, Z.R. and Wu, Y. and Yang, R.",
  TITLE     = "ArCo: Attention-reinforced transformer with contrastive learning for image captioning",
  JOURNAL   = IVC,
  VOLUME    = "128",
  YEAR      = "2022",
  PAGES     = "104570",
  BIBSOURCE = "http://www.visionbib.com/bibliography/match607tic2.html#TT125651"
}

@article{bb129609,
  AUTHOR    = "Li, Z.X. and Wei, J. and Huang, F.C. and Ma, H.F.",
  TITLE     = "Modeling graph-structured contexts for image captioning",
  JOURNAL   = IVC,
  VOLUME    = "129",
  YEAR      = "2023",
  PAGES     = "104591",
  BIBSOURCE = "http://www.visionbib.com/bibliography/match607tic2.html#TT125652"
}

@article{bb129610,
  AUTHOR    = "Zhang, J. and Xie, Y.S. and Ding, W.C. and Wang, Z.",
  TITLE     = "Cross on Cross Attention: Deep Fusion Transformer for Image Captioning",
  JOURNAL   = CirSysVideo,
  VOLUME    = "33",
  YEAR      = "2023",
  NUMBER    = "8",
  MONTH     = "August",
  PAGES     = "4257-4268",
  BIBSOURCE = "http://www.visionbib.com/bibliography/match607tic2.html#TT125653"
}

@article{bb129611,
  AUTHOR    = "Lim, J.H. and Chan, C.S.",
  TITLE     = "Mask-guided network for image captioning",
  JOURNAL   = PRL,
  VOLUME    = "173",
  YEAR      = "2023",
  PAGES     = "79-86",
  BIBSOURCE = "http://www.visionbib.com/bibliography/match607tic2.html#TT125654"
}

@article{bb129612,
  AUTHOR    = "Li, Z.X. and Su, Q. and Chen, T.Y.",
  TITLE     = "External knowledge-assisted Transformer for image captioning",
  JOURNAL   = IVC,
  VOLUME    = "140",
  YEAR      = "2023",
  PAGES     = "104864",
  BIBSOURCE = "http://www.visionbib.com/bibliography/match607tic2.html#TT125655"
}

@article{bb129613,
  AUTHOR    = "Chen, J.Q.",
  TITLE     = "Transform, contrast and tell: Coherent entity-aware multi-image captioning",
  JOURNAL   = CVIU,
  VOLUME    = "238",
  YEAR      = "2024",
  PAGES     = "103878",
  BIBSOURCE = "http://www.visionbib.com/bibliography/match607tic2.html#TT125656"
}

@article{bb129614,
  AUTHOR    = "Yang, X.B. and Tian, X. and Wu, J.S. and Yang, X.C. and Ma, S. and Qi, X. and Hou, Z.Q.",
  TITLE     = "LLAFN-Generator: Learnable linear-attention with fast-normalization for large-scale image captioning",
  JOURNAL   = CVIU,
  VOLUME    = "248",
  YEAR      = "2024",
  PAGES     = "104088",
  BIBSOURCE = "http://www.visionbib.com/bibliography/match607tic2.html#TT125657"
}

@article{bb129615,
  AUTHOR    = "Yi, Y. and Liang, Y. and Kong, D. and Tang, Z.W. and Peng, J.B.",
  TITLE     = "Tag-inferring and tag-guided Transformer for image captioning",
  JOURNAL   = IET-CV,
  VOLUME    = "18",
  YEAR      = "2024",
  NUMBER    = "6",
  PAGES     = "801-812",
  BIBSOURCE = "http://www.visionbib.com/bibliography/match607tic2.html#TT125658"
}

@inproceedings{bb129616,
  AUTHOR    = "Song, J.Y. and Pan, R.J. and Zhou, J. and Yang, H.",
  TITLE     = "M-rat: a Multi-grained Retrieval Augmentation Transformer for Image Captioning",
  BOOKTITLE = ACCV24,
  YEAR      = "2024",
  PAGES     = "III: 185-203",
  BIBSOURCE = "http://www.visionbib.com/bibliography/match607tic2.html#TT125659"
}

@inproceedings{bb129617,
  AUTHOR    = "Caffagni, D. and Barraco, M. and Cornia, M. and Baraldi, L. and Cucchiara, R.",
  TITLE     = "Synthcap: Augmenting Transformers with Synthetic Data for Image Captioning",
  BOOKTITLE = CIAP23,
  YEAR      = "2023",
  PAGES     = "I:112-123",
  BIBSOURCE = "http://www.visionbib.com/bibliography/match607tic2.html#TT125660"
}

@comment{
  NOTE(review) bb129618, bb129619: BOOKTITLE is the quoted literal "ICPR22",
  whereas sibling entries reference venues through bare macros (for example
  ICPR16). Presumably no ICPR22 macro is defined; confirm, then either define
  the macro or keep the literal.
}
@inproceedings{bb129618,
  AUTHOR    = "Lou, L.S. and Lu, K. and Xue, J.",
  TITLE     = "Improved Transformer with Parallel Encoders for Image Captioning",
  BOOKTITLE = "ICPR22",
  YEAR      = "2022",
  PAGES     = "4072-4075",
  BIBSOURCE = "http://www.visionbib.com/bibliography/match607tic2.html#TT125661"
}

@inproceedings{bb129619,
  AUTHOR    = "Wang, Y.H. and Shang, L.",
  TITLE     = "Generating Spatial-aware Captions for TextCaps",
  BOOKTITLE = "ICPR22",
  YEAR      = "2022",
  PAGES     = "379-385",
  BIBSOURCE = "http://www.visionbib.com/bibliography/match607tic2.html#TT125662"
}

@inproceedings{bb129620,
  AUTHOR    = "Feng, Y. and Maeda, K. and Ogawa, T. and Haseyama, M.",
  TITLE     = "Human-Centric Image Retrieval with Gaze-Based Image Captioning",
  BOOKTITLE = ICIP22,
  YEAR      = "2022",
  PAGES     = "3828-3832",
  BIBSOURCE = "http://www.visionbib.com/bibliography/match607tic2.html#TT125663"
}

@inproceedings{bb129621,
  AUTHOR    = "Yang, X. and Wang, Y. and Chen, H. and Li, J.",
  TITLE     = "CSTNET: Enhancing Global-To-Local Interactions for Image Captioning",
  BOOKTITLE = ICIP22,
  YEAR      = "2022",
  PAGES     = "1861-1865",
  BIBSOURCE = "http://www.visionbib.com/bibliography/match607tic2.html#TT125664"
}

@inproceedings{bb129622,
  AUTHOR    = "Nguyen, V.Q. and Suganuma, M. and Okatani, T.",
  TITLE     = "GRIT: Faster and Better Image Captioning Transformer Using Dual Visual Features",
  BOOKTITLE = ECCV22,
  YEAR      = "2022",
  PAGES     = "XXXVI:167-184",
  BIBSOURCE = "http://www.visionbib.com/bibliography/match607tic2.html#TT125665"
}

@inproceedings{bb129623,
  AUTHOR    = "Vo, D.M. and Chen, H. and Sugimoto, A. and Nakayama, H.",
  TITLE     = "NOC-REK: Novel Object Captioning with Retrieved Vocabulary from External Knowledge",
  BOOKTITLE = CVPR22,
  YEAR      = "2022",
  PAGES     = "17979-17987",
  BIBSOURCE = "http://www.visionbib.com/bibliography/match607tic2.html#TT125666"
}

@inproceedings{bb129624,
  AUTHOR    = "Yuan, Z.H. and Yan, X. and Liao, Y.H. and Guo, Y. and Li, G.B. and Cui, S.G. and Li, Z.",
  TITLE     = "X-Trans2Cap: Cross-Modal Knowledge Transfer using Transformer for 3D Dense Captioning",
  BOOKTITLE = CVPR22,
  YEAR      = "2022",
  PAGES     = "8553-8563",
  BIBSOURCE = "http://www.visionbib.com/bibliography/match607tic2.html#TT125667"
}

@inproceedings{bb129625,
  AUTHOR    = "Liu, B. and Wang, D. and Yang, X. and Zhou, Y. and Yao, R. and Shao, Z.W. and Zhao, J.Q.",
  TITLE     = "Show, Deconfound and Tell: Image Captioning with Causal Inference",
  BOOKTITLE = CVPR22,
  YEAR      = "2022",
  PAGES     = "18020-18029",
  BIBSOURCE = "http://www.visionbib.com/bibliography/match607tic2.html#TT125668"
}

@inproceedings{bb129626,
  AUTHOR    = "Fang, Z.Y. and Wang, J.F. and Hu, X.W. and Liang, L. and Gan, Z. and Wang, L.J. and Yang, Y.Z. and Liu, Z.C.",
  TITLE     = "Injecting Semantic Concepts into End-to-End Image Captioning",
  BOOKTITLE = CVPR22,
  YEAR      = "2022",
  PAGES     = "17988-17998",
  BIBSOURCE = "http://www.visionbib.com/bibliography/match607tic2.html#TT125669"
}

@inproceedings{bb129627,
  AUTHOR    = "Li, Y. and Pan, Y.W. and Yao, T. and Mei, T.",
  TITLE     = "Comprehending and Ordering Semantics for Image Captioning",
  BOOKTITLE = CVPR22,
  YEAR      = "2022",
  PAGES     = "17969-17978",
  BIBSOURCE = "http://www.visionbib.com/bibliography/match607tic2.html#TT125670"
}

@inproceedings{bb129628,
  AUTHOR    = "Fei, Z.C. and Yan, X. and Wang, S.H. and Tian, Q.",
  TITLE     = "DeeCap: Dynamic Early Exiting for Efficient Image Captioning",
  BOOKTITLE = CVPR22,
  YEAR      = "2022",
  PAGES     = "12206-12216",
  BIBSOURCE = "http://www.visionbib.com/bibliography/match607tic2.html#TT125671"
}

@inproceedings{bb129629,
  AUTHOR    = "Wu, M.R. and Zhang, X.Y. and Sun, X.S. and Zhou, Y. and Chen, C. and Gu, J.X. and Sun, X. and Ji, R.R.",
  TITLE     = "DIFNet: Boosting Visual Information Flow for Image Captioning",
  BOOKTITLE = CVPR22,
  YEAR      = "2022",
  PAGES     = "17999-18008",
  BIBSOURCE = "http://www.visionbib.com/bibliography/match607tic2.html#TT125672"
}

@inproceedings{bb129630,
  AUTHOR    = "Rio Torto, I. and Cardoso, J.S. and Teixeira, L.F.",
  TITLE     = "From Captions to Explanations: A Multimodal Transformer-based Architecture for Natural Language Explanation Generation",
  BOOKTITLE = IbPRIA22,
  YEAR      = "2022",
  PAGES     = "54-65",
  BIBSOURCE = "http://www.visionbib.com/bibliography/match607tic2.html#TT125673"
}

@inproceedings{bb129631,
  AUTHOR    = "Chen, H.S. and Wang, Y. and Yang, X. and Li, J.",
  TITLE     = "Captioning Transformer With Scene Graph Guiding",
  BOOKTITLE = ICIP21,
  YEAR      = "2021",
  PAGES     = "2538-2542",
  BIBSOURCE = "http://www.visionbib.com/bibliography/match607tic2.html#TT125674"
}

@inproceedings{bb129632,
  AUTHOR    = "Zhang, X.Y. and Sun, X.S. and Luo, Y.P. and Ji, J.Y. and Zhou, Y. and Wu, Y.J. and Huang, F.Y. and Ji, R.R.",
  TITLE     = "RSTNet: Captioning with Adaptive Attention on Visual and Non-Visual Words",
  BOOKTITLE = CVPR21,
  YEAR      = "2021",
  PAGES     = "15460-15469",
  BIBSOURCE = "http://www.visionbib.com/bibliography/match607tic2.html#TT125675"
}

@inproceedings{bb129633,
  AUTHOR    = "He, S. and Liao, W.T. and Tavakoli, H.R. and Yang, M. and Rosenhahn, B. and Pugeault, N.",
  TITLE     = "Image Captioning Through Image Transformer",
  BOOKTITLE = ACCV20,
  YEAR      = "2020",
  PAGES     = "IV:153-169",
  BIBSOURCE = "http://www.visionbib.com/bibliography/match607tic2.html#TT125676"
}

@inproceedings{bb129634,
  AUTHOR    = "Cornia, M. and Stefanini, M. and Baraldi, L. and Cucchiara, R.",
  TITLE     = "Meshed-Memory Transformer for Image Captioning",
  BOOKTITLE = CVPR20,
  YEAR      = "2020",
  PAGES     = "10575-10584",
  BIBSOURCE = "http://www.visionbib.com/bibliography/match607tic2.html#TT125677"
}

@inproceedings{bb129635,
  AUTHOR    = "Tran, A. and Mathews, A. and Xie, L.",
  TITLE     = "Transform and Tell: Entity-Aware News Image Captioning",
  BOOKTITLE = CVPR20,
  YEAR      = "2020",
  PAGES     = "13032-13042",
  BIBSOURCE = "http://www.visionbib.com/bibliography/match607tic2.html#TT125678"
}

@inproceedings{bb129636,
  AUTHOR    = "Li, G. and Zhu, L. and Liu, P. and Yang, Y.",
  TITLE     = "Entangled Transformer for Image Captioning",
  BOOKTITLE = ICCV19,
  YEAR      = "2019",
  PAGES     = "8927-8936",
  BIBSOURCE = "http://www.visionbib.com/bibliography/match607tic2.html#TT125679"
}

@article{bb129637,
  AUTHOR    = "Sharma, D. and Chattopadhyay, C.",
  TITLE     = "High-level feature aggregation for fine-grained architectural floor plan retrieval",
  JOURNAL   = IET-CV,
  VOLUME    = "12",
  YEAR      = "2018",
  NUMBER    = "5",
  MONTH     = "August",
  PAGES     = "702-709",
  BIBSOURCE = "http://www.visionbib.com/bibliography/match607seco3.html#TT125680"
}

@inproceedings{bb129638,
  AUTHOR    = "Sharma, D. and Chattopadhyay, C. and Harit, G.",
  TITLE     = "A unified framework for semantic matching of architectural floorplans",
  BOOKTITLE = ICPR16,
  YEAR      = "2016",
  PAGES     = "2422-2427",
  BIBSOURCE = "http://www.visionbib.com/bibliography/match607seco3.html#TT125681"
}

@article{bb129639,
  AUTHOR    = "Ham, B. and Cho, M.S. and Schmid, C. and Ponce, J.",
  TITLE     = "Proposal Flow: Semantic Correspondences from Object Proposals",
  JOURNAL   = PAMI,
  VOLUME    = "40",
  YEAR      = "2018",
  NUMBER    = "7",
  MONTH     = "July",
  PAGES     = "1711-1725",
  BIBSOURCE = "http://www.visionbib.com/bibliography/match607seco3.html#TT125682"
}

@inproceedings{bb129640,
  AUTHOR    = "Ham, B. and Cho, M.S. and Schmid, C. and Ponce, J.",
  TITLE     = "Proposal Flow",
  BOOKTITLE = CVPR16,
  YEAR      = "2016",
  PAGES     = "3475-3484",
  BIBSOURCE = "http://www.visionbib.com/bibliography/match607seco3.html#TT125683"
}

@article{bb129641,
  AUTHOR    = "Xiao, T.H. and Liu, S.F. and de Mello, S. and Yu, Z.D. and Kautz, J. and Yang, M.H.",
  TITLE     = "Learning Contrastive Representation for Semantic Correspondence",
  JOURNAL   = IJCV,
  VOLUME    = "130",
  YEAR      = "2022",
  NUMBER    = "5",
  MONTH     = "May",
  PAGES     = "1293-1309",
  BIBSOURCE = "http://www.visionbib.com/bibliography/match607seco3.html#TT125684"
}

@comment{
  NOTE(review) bb129642: same TITLE, JOURNAL, VOLUME and BIBSOURCE anchor as
  bb129641, a single page (1607-1607) in the following issue, and the AUTHOR
  list is bb129641's in exactly reversed order. Presumably this is the
  published correction to bb129641 -- verify, and confirm the intended author
  order, before citing.
}
@article{bb129642,
  AUTHOR    = "Yang, M.H. and Kautz, J. and Yu, Z.D. and de Mello, S. and Liu, S.F. and Xiao, T.H.",
  TITLE     = "Learning Contrastive Representation for Semantic Correspondence",
  JOURNAL   = IJCV,
  VOLUME    = "130",
  YEAR      = "2022",
  NUMBER    = "6",
  MONTH     = "June",
  PAGES     = "1607-1607",
  BIBSOURCE = "http://www.visionbib.com/bibliography/match607seco3.html#TT125684"
}

@inproceedings{bb129643,
  AUTHOR    = "Yuan, W.T. and Eckart, B. and Kim, K. and Jampani, V. and Fox, D. and Kautz, J.",
  TITLE     = "DeepGMR: Learning Latent Gaussian Mixture Models for Registration",
  BOOKTITLE = ECCV20,
  YEAR      = "2020",
  PAGES     = "V:733-750",
  BIBSOURCE = "http://www.visionbib.com/bibliography/match607seco3.html#TT125685"
}

@inproceedings{bb129644,
  AUTHOR    = "Eckart, B. and Kim, K. and Kautz, J.",
  TITLE     = "HGMR: Hierarchical Gaussian Mixtures for Adaptive 3D Registration",
  BOOKTITLE = ECCV18,
  YEAR      = "2018",
  PAGES     = "XV: 730-746",
  BIBSOURCE = "http://www.visionbib.com/bibliography/match607seco3.html#TT125686"
}

@article{bb129645,
  AUTHOR    = "He, J.F. and Zhang, T.Z. and Zheng, Y.H. and Xu, M.L. and Zhang, Y.D. and Wu, F.",
  TITLE     = "Consistency Graph Modeling for Semantic Correspondence",
  JOURNAL   = IP,
  VOLUME    = "30",
  YEAR      = "2021",
  PAGES     = "4932-4946",
  BIBSOURCE = "http://www.visionbib.com/bibliography/match607seco3.html#TT125687"
}

@article{bb129646,
  AUTHOR    = "Jeon, S. and Kim, S. and Min, D.B. and Sohn, K.H.",
  TITLE     = "Pyramidal Semantic Correspondence Networks",
  JOURNAL   = PAMI,
  VOLUME    = "44",
  YEAR      = "2022",
  NUMBER    = "12",
  MONTH     = "December",
  PAGES     = "9102-9118",
  BIBSOURCE = "http://www.visionbib.com/bibliography/match607seco3.html#TT125688"
}

@article{bb129647,
  AUTHOR    = "Cao, C.Q. and Zhang, Y.N.",
  TITLE     = "Learning to Compare Relation: Semantic Alignment for Few-Shot Learning",
  JOURNAL   = IP,
  VOLUME    = "31",
  YEAR      = "2022",
  PAGES     = "1462-1474",
  BIBSOURCE = "http://www.visionbib.com/bibliography/match607seco3.html#TT125689"
}

@article{bb129648,
  AUTHOR    = "Cheng, J. and Hao, F.S. and Liu, L. and Tao, D.C.",
  TITLE     = "Imposing Semantic Consistency of Local Descriptors for Few-Shot Learning",
  JOURNAL   = IP,
  VOLUME    = "31",
  YEAR      = "2022",
  PAGES     = "1587-1600",
  BIBSOURCE = "http://www.visionbib.com/bibliography/match607seco3.html#TT125690"
}

@article{bb129649,
  AUTHOR    = "Hao, F.S. and He, F.X. and Cheng, J. and Tao, D.C.",
  TITLE     = "Global-Local Interplay in Semantic Alignment for Few-Shot Learning",
  JOURNAL   = CirSysVideo,
  VOLUME    = "32",
  YEAR      = "2022",
  NUMBER    = "7",
  MONTH     = "July",
  PAGES     = "4351-4363",
  BIBSOURCE = "http://www.visionbib.com/bibliography/match607seco3.html#TT125691"
}

@inproceedings{bb129650,
  AUTHOR    = "Hao, F.S. and He, F.X. and Cheng, J. and Wang, L. and Cao, J. and Tao, D.C.",
  TITLE     = "Collect and Select: Semantic Alignment Metric Learning for Few-Shot Learning",
  BOOKTITLE = ICCV19,
  YEAR      = "2019",
  PAGES     = "8459-8468",
  BIBSOURCE = "http://www.visionbib.com/bibliography/match607seco3.html#TT125692"
}

@article{bb129651,
  AUTHOR    = "Liu, H. and Wang, T. and Li, Y.D. and Lang, C. and Jin, Y. and Ling, H.B.",
  TITLE     = "Joint Graph Learning and Matching for Semantic Feature Correspondence",
  JOURNAL   = PR,
  VOLUME    = "134",
  YEAR      = "2023",
  PAGES     = "109059",
  BIBSOURCE = "http://www.visionbib.com/bibliography/match607seco3.html#TT125693"
}

@article{bb129652,
  AUTHOR    = "Sachdeva, R. and Cordeiro, F.R. and Belagiannis, V. and Reid, I.D. and Carneiro, G.",
  TITLE     = "ScanMix: Learning from Severe Label Noise via Semantic Clustering and Semi-Supervised Learning",
  JOURNAL   = PR,
  VOLUME    = "134",
  YEAR      = "2023",
  PAGES     = "109121",
  BIBSOURCE = "http://www.visionbib.com/bibliography/match607seco3.html#TT125694"
}

@article{bb129653,
  AUTHOR    = "Xu, X. and Xu, X. and Shen, F.M. and Li, Y.J.",
  TITLE     = "Semantic-Aligned Attention With Refining Feature Embedding for Few-Shot Image Classification",
  JOURNAL   = ITS,
  VOLUME    = "23",
  YEAR      = "2022",
  NUMBER    = "12",
  MONTH     = "December",
  PAGES     = "25458-25468",
  BIBSOURCE = "http://www.visionbib.com/bibliography/match607seco3.html#TT125695"
}

@article{bb129654,
  AUTHOR    = "Yang, Z.Q. and Zhang, Y.Q. and Du, Y.X. and Tong, C.",
  TITLE     = "Semantic-aligned reinforced attention model for zero-shot learning",
  JOURNAL   = IVC,
  VOLUME    = "128",
  YEAR      = "2022",
  PAGES     = "104586",
  BIBSOURCE = "http://www.visionbib.com/bibliography/match607seco3.html#TT125696"
}

@article{bb129655,
  AUTHOR    = "Wang, J. and Zhang, Z.Q. and Shi, Z.H. and Cai, J.Y. and Ji, S.W. and Wu, F.",
  TITLE     = "Duality-Induced Regularizer for Semantic Matching Knowledge Graph Embeddings",
  JOURNAL   = PAMI,
  VOLUME    = "45",
  YEAR      = "2023",
  NUMBER    = "2",
  MONTH     = "February",
  PAGES     = "1652-1667",
  BIBSOURCE = "http://www.visionbib.com/bibliography/match607seco3.html#TT125697"
}

@article{bb129656,
  AUTHOR    = "Liu, W.X. and Zhong, X. and Jia, X.M. and Jiang, K. and Lin, C.W.",
  TITLE     = "Actor-Aware Alignment Network for Action Recognition",
  JOURNAL   = SPLetters,
  VOLUME    = "29",
  YEAR      = "2022",
  PAGES     = "2597-2601",
  BIBSOURCE = "http://www.visionbib.com/bibliography/match607seco3.html#TT125698"
}

@article{bb129657,
  AUTHOR    = "Wang, Z. and Fu, Z.H. and Guo, Y.L. and Li, Z. and Yu, Q.F.",
  TITLE     = "Local-to-Global Cost Aggregation for Semantic Correspondence",
  JOURNAL   = CirSysVideo,
  VOLUME    = "33",
  YEAR      = "2023",
  NUMBER    = "3",
  MONTH     = "March",
  PAGES     = "1209-1222",
  BIBSOURCE = "http://www.visionbib.com/bibliography/match607seco3.html#TT125699"
}

@article{bb129658,
  AUTHOR    = "Xu, W.J. and Wang, J.N. and Wei, Z.W. and Peng, M. and Wu, Y.R.",
  TITLE     = "Deep Semantic-Visual Alignment for zero-shot remote sensing image scene classification",
  JOURNAL   = PandRS,
  VOLUME    = "198",
  YEAR      = "2023",
  PAGES     = "140-152",
  BIBSOURCE = "http://www.visionbib.com/bibliography/match607seco3.html#TT125700"
}

@article{bb129659,
  AUTHOR    = "Yang, J.Q. and Shen, Q. and Xie, C.",
  TITLE     = "Generation-based contrastive model with semantic alignment for generalized zero-shot learning",
  JOURNAL   = IVC,
  VOLUME    = "137",
  YEAR      = "2023",
  PAGES     = "104758",
  BIBSOURCE = "http://www.visionbib.com/bibliography/match607seco3.html#TT125701"
}

@article{bb129660,
  AUTHOR    = "Duan, Z.H. and Ma, Z. and Zhu, F.Q.",
  TITLE     = "Unified Architecture Adaptation for Compressed Domain Semantic Inference",
  JOURNAL   = CirSysVideo,
  VOLUME    = "33",
  YEAR      = "2023",
  NUMBER    = "8",
  MONTH     = "August",
  PAGES     = "4108-4121",
  BIBSOURCE = "http://www.visionbib.com/bibliography/match607seco3.html#TT125702"
}

@article{bb129661,
  AUTHOR    = "Xu, H.Y. and Liao, J. and Liu, H.P. and Sun, Y.X.",
  TITLE     = "Learning Semantic Alignment Using Global Features and Multi-Scale Confidence",
  JOURNAL   = CirSysVideo,
  VOLUME    = "34",
  YEAR      = "2024",
  NUMBER    = "2",
  MONTH     = "February",
  PAGES     = "897-910",
  BIBSOURCE = "http://www.visionbib.com/bibliography/match607seco3.html#TT125703"
}

@article{bb129662,
  AUTHOR    = "Liu, J. and Xie, J.L. and Zhou, F.Y. and He, S.F.",
  TITLE     = "Triadic temporal-semantic alignment for weakly-supervised video moment retrieval",
  JOURNAL   = PR,
  VOLUME    = "156",
  YEAR      = "2024",
  PAGES     = "110819",
  BIBSOURCE = "http://www.visionbib.com/bibliography/match607seco3.html#TT125704"
}

@article{bb129663,
  AUTHOR    = "Zhang, T. and Fang, H. and Zhang, H. and Gao, J.L. and Lu, X. and Nie, X. and Yin, Y.L.",
  TITLE     = "Learning Feature Semantic Matching for Spatio-Temporal Video Grounding",
  JOURNAL   = MultMed,
  VOLUME    = "26",
  YEAR      = "2024",
  PAGES     = "9268-9279",
  BIBSOURCE = "http://www.visionbib.com/bibliography/match607seco3.html#TT125705"
}

@article{bb129664,
  AUTHOR    = "Wu, R.J. and Guo, W. and Liu, Y. and Sun, C.H.",
  TITLE     = "High-Precision Heterogeneous Satellite Image Manipulation Localization: Feature Point Rules and Semantic Similarity Measurement",
  JOURNAL   = RS,
  VOLUME    = "16",
  YEAR      = "2024",
  NUMBER    = "19",
  PAGES     = "3719",
  BIBSOURCE = "http://www.visionbib.com/bibliography/match607seco3.html#TT125706"
}

@article{bb129665,
  AUTHOR    = "Giang, K.T. and Song, S. and Jo, S.",
  TITLE     = "TopicFM+: Boosting Accuracy and Efficiency of Topic-Assisted Feature Matching",
  JOURNAL   = IP,
  VOLUME    = "33",
  YEAR      = "2024",
  PAGES     = "6016-6028",
  BIBSOURCE = "http://www.visionbib.com/bibliography/match607seco3.html#TT125707"
}

@article{bb129666,
  AUTHOR    = "Liao, G. and Zhou, K. and Bao, Z.Y. and Liu, K.L. and Li, Q.",
  TITLE     = "OV-NeRF: Open-Vocabulary Neural Radiance Fields With Vision and Language Foundation Models for 3D Semantic Understanding",
  JOURNAL   = CirSysVideo,
  VOLUME    = "34",
  YEAR      = "2024",
  NUMBER    = "12",
  MONTH     = "December",
  PAGES     = "12923-12936",
  BIBSOURCE = "http://www.visionbib.com/bibliography/match607seco3.html#TT125708"
}

@article{bb129667,
  AUTHOR    = "Shi, W. and Zhu, R.H. and Li, S.",
  TITLE     = "Unsupervised Class-Imbalanced Domain Adaptation With Pairwise Adversarial Training and Semantic Alignment",
  JOURNAL   = CirSysVideo,
  VOLUME    = "34",
  YEAR      = "2024",
  NUMBER    = "12",
  MONTH     = "December",
  PAGES     = "12411-12424",
  BIBSOURCE = "http://www.visionbib.com/bibliography/match607seco3.html#TT125709"
}

@article{bb129668,
  AUTHOR    = "Zhang, H. and Xu, L.M. and Lai, S.Q. and Shao, W.Q. and Zheng, N.N. and Luo, P. and Qiao, Y. and Zhang, K.P.",
  TITLE     = "Open-Vocabulary Animal Keypoint Detection with Semantic-Feature Matching",
  JOURNAL   = IJCV,
  VOLUME    = "132",
  YEAR      = "2024",
  NUMBER    = "12",
  MONTH     = "December",
  PAGES     = "5741-5758",
  BIBSOURCE = "http://www.visionbib.com/bibliography/match607seco3.html#TT125710"
}

@article{bb129669,
  AUTHOR    = "Xu, L.M. and Li, H.Q. and Zheng, B. and Li, W.S. and Lv, J.C.",
  TITLE     = "Deep Lifelong Cross-Modal Hashing",
  JOURNAL   = CirSysVideo,
  VOLUME    = "34",
  YEAR      = "2024",
  NUMBER    = "12",
  MONTH     = "December",
  PAGES     = "13478-13493",
  BIBSOURCE = "http://www.visionbib.com/bibliography/match607seco3.html#TT125711"
}

@article{bb129670,
  AUTHOR    = "Dong, M.P. and Li, F. and Li, Z.B. and Liu, X.",
  TITLE     = "PRSN: Prototype resynthesis network with cross-image semantic alignment for few-shot image classification",
  JOURNAL   = PR,
  VOLUME    = "159",
  YEAR      = "2025",
  PAGES     = "111122",
  BIBSOURCE = "http://www.visionbib.com/bibliography/match607seco3.html#TT125712"
}

@article{bb129671,
  AUTHOR    = "Gonzalez, L.H.R. and Florez, S.L. and Gonzalez Briones, A. and de la Prieta, F.",
  TITLE     = "Semantic scene understanding through advanced object context analysis in image",
  JOURNAL   = CVIU,
  VOLUME    = "252",
  YEAR      = "2025",
  PAGES     = "104299",
  BIBSOURCE = "http://www.visionbib.com/bibliography/match607seco3.html#TT125713"
}

@article{bb129672,
  AUTHOR    = "Shi, Y. and Li, R.X. and Gan, L. and Zhan, D.C. and Ye, H.J.",
  TITLE     = "Generalized Conditional Similarity Learning via Semantic Matching",
  JOURNAL   = PAMI,
  VOLUME    = "47",
  YEAR      = "2025",
  NUMBER    = "5",
  MONTH     = "May",
  PAGES     = "3847-3862",
  BIBSOURCE = "http://www.visionbib.com/bibliography/match607seco3.html#TT125714"
}

@inproceedings{bb129673,
  AUTHOR    = "Ju, Y.C. and Hu, K.Z. and Zhang, G. and Zhang, G. and Jiang, M. and Xu, H.Z.",
  TITLE     = "Robo-abc: Affordance Generalization Beyond Categories via Semantic Correspondence for Robot Manipulation",
  BOOKTITLE = ECCV24,
  YEAR      = "2024",
  PAGES     = "XLI: 222-239",
  BIBSOURCE = "http://www.visionbib.com/bibliography/match607seco3.html#TT125715"
}

@inproceedings{bb129674,
  AUTHOR    = "Wang, P.Y. and Ikeda, T. and Lee, R. and Nishiwaki, K.",
  TITLE     = "GS-Pose: Category-level Object Pose Estimation via Geometric and Semantic Correspondence",
  BOOKTITLE = ECCV24,
  YEAR      = "2024",
  PAGES     = "XXVII: 108-126",
  BIBSOURCE = "http://www.visionbib.com/bibliography/match607seco3.html#TT125716"
}

@inproceedings{bb129675,
  AUTHOR    = "Park, C. and Kim, S. and Park, J. and Cho, M.",
  TITLE     = "Learning SO(3)-Invariant Semantic Correspondence via Local Shape Transform",
  BOOKTITLE = CVPR24,
  YEAR      = "2024",
  PAGES     = "22978-22987",
  BIBSOURCE = "http://www.visionbib.com/bibliography/match607seco3.html#TT125717"
}

@inproceedings{bb129676,
  AUTHOR    = "Mariotti, O. and Aodha, O.M. and Bilen, H.",
  TITLE     = "Improving Semantic Correspondence with Viewpoint-Guided Spherical Maps",
  BOOKTITLE = CVPR24,
  YEAR      = "2024",
  PAGES     = "19521-19530",
  BIBSOURCE = "http://www.visionbib.com/bibliography/match607seco3.html#TT125718"
}

@inproceedings{bb129677,
  AUTHOR    = "Sun, Y.X. and Yin, Z.Y. and Wang, H.B. and Wang, Y. and Qiu, X.P. and Ge, W.F. and Zhang, W.Q.",
  TITLE     = "Pixel-Level Semantic Correspondence Through Layout-Aware Representation Learning and Multi-Scale Matching Integration",
  BOOKTITLE = CVPR24,
  YEAR      = "2024",
  PAGES     = "17047-17056",
  BIBSOURCE = "http://www.visionbib.com/bibliography/match607seco3.html#TT125719"
}

@inproceedings{bb129678,
  AUTHOR    = "Park, J.H. and Lee, G. and Park, S. and Cho, S.I.",
  TITLE     = "Not All Classes Stand on Same Embeddings: Calibrating a Semantic Distance with Metric Tensor",
  BOOKTITLE = CVPR24,
  YEAR      = "2024",
  PAGES     = "17722-17731",
  BIBSOURCE = "http://www.visionbib.com/bibliography/match607seco3.html#TT125720"
}

@inproceedings{bb129679,
  AUTHOR    = "Gu, Y.C. and Zhou, Y. and Wu, B. and Yu, L.C. and Liu, J.W. and Zhao, R. and Wu, J.Z.J. and Zhang, D.J.H. and Shou, M.Z. and Tang, K.",
  TITLE     = "VideoSwap: Customized Video Subject Swapping with Interactive Semantic Point Correspondence",
  BOOKTITLE = CVPR24,
  YEAR      = "2024",
  PAGES     = "7621-7630",
  BIBSOURCE = "http://www.visionbib.com/bibliography/match607seco3.html#TT125721"
}

@inproceedings{bb129680,
  AUTHOR    = "Kim, S. and Min, J. and Cho, M.",
  TITLE     = "Efficient Semantic Matching with Hypercolumn Correlation",
  BOOKTITLE = WACV24,
  YEAR      = "2024",
  PAGES     = "138-147",
  BIBSOURCE = "http://www.visionbib.com/bibliography/match607seco3.html#TT125722"
}

@inproceedings{bb129681,
  AUTHOR    = "Xie, X.J. and Liu, F. and Gai, S. and Huang, Z. and Hu, M.H. and Wang, A.",
  TITLE     = "Hss: A Hierarchical Semantic Similarity Hard Negative Sampling Method for Dense Retrievers",
  BOOKTITLE = MMMod23,
  YEAR      = "2023",
  PAGES     = "II: 301-312",
  BIBSOURCE = "http://www.visionbib.com/bibliography/match607seco3.html#TT125723"
}

@inproceedings{bb129682,
  AUTHOR    = "Cai, R. and Tung, J. and Wang, Q.Q. and Averbuch Elor, H. and Hariharan, B. and Snavely, N.",
  TITLE     = "Doppelgangers: Learning to Disambiguate Images of Similar Structures",
  BOOKTITLE = ICCV23,
  YEAR      = "2023",
  PAGES     = "34-44",
  BIBSOURCE = "http://www.visionbib.com/bibliography/match607seco3.html#TT125724"
}

@inproceedings{bb129683,
  AUTHOR    = "Huang, Y.W. and Sun, Y.X. and Lai, C.H. and Xu, Q. and Wang, X.M. and Shen, X.L. and Ge, W.F.",
  TITLE     = "Weakly Supervised Learning of Semantic Correspondence through Cascaded Online Correspondence Refinement",
  BOOKTITLE = ICCV23,
  YEAR      = "2023",
  PAGES     = "16208-16217",
  BIBSOURCE = "http://www.visionbib.com/bibliography/match607seco3.html#TT125725"
}

@inproceedings{bb129684,
  AUTHOR    = "Shtedritski, A. and Vedaldi, A. and Rupprecht, C.",
  TITLE     = "Learning Universal Semantic Correspondences with No Supervision and Automatic Data Curation",
  BOOKTITLE = LIMIT23,
  YEAR      = "2023",
  PAGES     = "933-943",
  BIBSOURCE = "http://www.visionbib.com/bibliography/match607seco3.html#TT125726"
}

@inproceedings{bb129685,
  AUTHOR    = "Tang, C.F. and Xie, L.X. and Zhang, X.P. and Hu, X.L. and Tian, Q.",
  TITLE     = "Visual Recognition by Request",
  BOOKTITLE = CVPR23,
  YEAR      = "2023",
  PAGES     = "15265-15274",
  BIBSOURCE = "http://www.visionbib.com/bibliography/match607seco3.html#TT125727"
}

@inproceedings{bb129686,
  AUTHOR    = "Sun, Y.X. and Huang, Y.W. and Guo, H.J. and Zhao, Y.Z. and Wu, R.M. and Yu, Y.Z. and Ge, W.F. and Zhang, W.Q.",
  TITLE     = "MISC210K: A Large-Scale Dataset for Multi-Instance Semantic Correspondence",
  BOOKTITLE = CVPR23,
  YEAR      = "2023",
  PAGES     = "7121-7130",
  BIBSOURCE = "http://www.visionbib.com/bibliography/match607seco3.html#TT125728"
}

@inproceedings{bb129687,
  AUTHOR    = "Sabir, A. and Moreno Noguer, F. and Padro, L.",
  TITLE     = "Visual Semantic Relatedness Dataset for Image Captioning",
  BOOKTITLE = ODRUM23,
  YEAR      = "2023",
  PAGES     = "5598-5606",
  BIBSOURCE = "http://www.visionbib.com/bibliography/match607seco3.html#TT125729"
}

@inproceedings{bb129688,
  AUTHOR    = "Zeng, Z.Q. and Zhang, H. and Lu, R.Y. and Wang, D.S. and Chen, B. and Wang, Z.J.",
  TITLE     = "ConZIC: Controllable Zero-shot Image Captioning by Sampling-Based Polishing",
  BOOKTITLE = CVPR23,
  YEAR      = "2023",
  PAGES     = "23465-23476",
  BIBSOURCE = "http://www.visionbib.com/bibliography/match607seco3.html#TT125730"
}

@inproceedings{bb129689,
  AUTHOR    = "Luo, J.J. and Li, Y. and Pan, Y.W. and Yao, T. and Feng, J.L. and Chao, H.Y. and Mei, T.",
  TITLE     = "Semantic-Conditional Diffusion Networks for Image Captioning",
  BOOKTITLE = CVPR23,
  YEAR      = "2023",
  PAGES     = "23359-23368",
  BIBSOURCE = "http://www.visionbib.com/bibliography/match607seco3.html#TT125731"
}

@inproceedings{bb129690,
  AUTHOR    = "Bachard, T. and Tom, A.J. and Maugey, T.",
  TITLE     = "Semantic Alignment for Multi-Item Compression",
  BOOKTITLE = ICIP22,
  YEAR      = "2022",
  PAGES     = "2841-2845",
  BIBSOURCE = "http://www.visionbib.com/bibliography/match607seco3.html#TT125732"
}

@inproceedings{bb129691,
  AUTHOR    = "Hu, Y.D. and Wang, R. and Zhang, K. and Gao, Y.",
  TITLE     = "Semantic-Aware Fine-Grained Correspondence",
  BOOKTITLE = ECCV22,
  YEAR      = "2022",
  PAGES     = "XXXI:97-115",
  BIBSOURCE = "http://www.visionbib.com/bibliography/match607seco3.html#TT125733"
}

@inproceedings{bb129692,
  AUTHOR    = "Kim, J. and Heo, B. and Yun, S. and Kim, S. and Han, D.Y.",
  TITLE     = "Match Me If You Can: Semi-supervised Semantic Correspondence Learning with Unpaired Images",
  BOOKTITLE = ACCV24,
  YEAR      = "2024",
  PAGES     = "VI: 462-479",
  BIBSOURCE = "http://www.visionbib.com/bibliography/match607seco3.html#TT125734"
}

@inproceedings{bb129693,
  AUTHOR    = "Kim, J. and Ryoo, K. and Seo, J.Y. and Lee, G. and Kim, D. and Cho, H.S. and Kim, S.",
  TITLE     = "Semi-Supervised Learning of Semantic Correspondence with Pseudo-Labels",
  BOOKTITLE = CVPR22,
  YEAR      = "2022",
  PAGES     = "19667-19677",
  BIBSOURCE = "http://www.visionbib.com/bibliography/match607seco3.html#TT125735"
}

@inproceedings{bb129694,
  AUTHOR    = "Kim, S. and Min, J. and Cho, M.",
  TITLE     = "TransforMatcher: Match-to-Match Attention for Semantic Correspondence",
  BOOKTITLE = CVPR22,
  YEAR      = "2022",
  PAGES     = "8687-8697",
  BIBSOURCE = "http://www.visionbib.com/bibliography/match607seco3.html#TT125736"
}

@inproceedings{bb129695,
  AUTHOR    = "Ye, H.J. and Shi, Y. and Zhan, D.C.",
  TITLE     = "Identifying Ambiguous Similarity Conditions via Semantic Matching",
  BOOKTITLE = CVPR22,
  YEAR      = "2022",
  PAGES     = "16589-16598",
  BIBSOURCE = "http://www.visionbib.com/bibliography/match607seco3.html#TT125737"
}

@inproceedings{bb129696,
  AUTHOR    = "Huang, S. and Yang, L. and He, B. and Zhang, S.Y. and He, X.M. and Shrivastava, A.",
  TITLE     = "Learning Semantic Correspondence with Sparse Annotations",
  BOOKTITLE = ECCV22,
  YEAR      = "2022",
  PAGES     = "XIV:267-284",
  BIBSOURCE = "http://www.visionbib.com/bibliography/match607seco3.html#TT125738"
}

@inproceedings{bb129697,
  AUTHOR    = "Aygun, M. and Aodha, O.M.",
  TITLE     = "Demystifying Unsupervised Semantic Correspondence Estimation",
  BOOKTITLE = ECCV22,
  YEAR      = "2022",
  PAGES     = "XXX:125-142",
  BIBSOURCE = "http://www.visionbib.com/bibliography/match607seco3.html#TT125739"
}

@inproceedings{bb129698,
  AUTHOR    = "Li, X. and Fan, D.P. and Yang, F. and Luo, A. and Cheng, H. and Liu, Z.C.",
  TITLE     = "Probabilistic Model Distillation for Semantic Correspondence",
  BOOKTITLE = CVPR21,
  YEAR      = "2021",
  PAGES     = "7501-7510",
  BIBSOURCE = "http://www.visionbib.com/bibliography/match607seco3.html#TT125740"
}

@inproceedings{bb129699,
  AUTHOR    = "Zhao, D.Y. and Song, Z.Y. and Ji, Z.H. and Zhao, G.M. and Ge, W.F. and Yu, Y.Z.",
  TITLE     = "Multi-scale Matching Networks for Semantic Correspondence",
  BOOKTITLE = ICCV21,
  YEAR      = "2021",
  PAGES     = "3334-3344",
  BIBSOURCE = "http://www.visionbib.com/bibliography/match607seco3.html#TT125741"
}