% Image-captioning and image-annotation references, keys bb133000 .. bb133099.
% JOURNAL and BOOKTITLE values are bare macro names (e.g. IET-IPR, CVPR20); no
% string macro is defined in this span, so they are presumably defined elsewhere.
% BIBSOURCE is a non-standard field (standard styles ignore unknown fields).
% Conventions used below: initials are space-separated so that abbreviating
% styles keep every initial, page ranges use "--", months use the standard
% three-letter macros, and acronyms/proper names in titles are brace-protected.

@article{bb133000,
  AUTHOR    = "Shao, X. J. and Xiang, Z. L. and Li, Y. X. and Zhang, M. J.",
  TITLE     = "Variational joint self-attention for image captioning",
  JOURNAL   = IET-IPR,
  VOLUME    = "16",
  YEAR      = "2022",
  NUMBER    = "8",
  PAGES     = "2075--2086",
  BIBSOURCE = "http://www.visionbib.com/bibliography/match607attic3.html#TT129040"
}

@article{bb133001,
  AUTHOR    = "Ma, Y. W. and Ji, J. Y. and Sun, X. S. and Zhou, Y. and Ji, R. R.",
  TITLE     = "Towards local visual modeling for image captioning",
  JOURNAL   = PR,
  VOLUME    = "138",
  YEAR      = "2023",
  PAGES     = "109420",
  BIBSOURCE = "http://www.visionbib.com/bibliography/match607attic3.html#TT129041"
}

@article{bb133002,
  AUTHOR    = "Barati, A. and Farsi, H. and Mohamadzadeh, S.",
  TITLE     = "Integration of the latent variable knowledge into deep image captioning with {Bayesian} modeling",
  JOURNAL   = IET-IPR,
  VOLUME    = "17",
  YEAR      = "2023",
  NUMBER    = "7",
  PAGES     = "2256--2271",
  BIBSOURCE = "http://www.visionbib.com/bibliography/match607attic3.html#TT129042"
}

@article{bb133003,
  AUTHOR    = "Ji, J. Y. and Huang, X. Y. and Sun, X. S. and Zhou, Y. and Luo, G. and Cao, L. J. and Liu, J. Z. and Shao, L. and Ji, R. R.",
  TITLE     = "Multi-Branch Distance-Sensitive Self-Attention Network for Image Captioning",
  JOURNAL   = MultMed,
  VOLUME    = "25",
  YEAR      = "2023",
  PAGES     = "3962--3974",
  BIBSOURCE = "http://www.visionbib.com/bibliography/match607attic3.html#TT129043"
}

@article{bb133004,
  AUTHOR    = "Cornia, M. and Baraldi, L. and Tal, A. and Cucchiara, R.",
  TITLE     = "Fully-attentive iterative networks for region-based controllable image and video captioning",
  JOURNAL   = CVIU,
  VOLUME    = "237",
  YEAR      = "2023",
  PAGES     = "103857",
  BIBSOURCE = "http://www.visionbib.com/bibliography/match607attic3.html#TT129044"
}

@article{bb133005,
  AUTHOR    = "Song, L. F. and Li, F. and Wang, Y. and Liu, Y. and Wang, Y. H. and Xiang, S. M.",
  TITLE     = "Image captioning: Semantic selection unit with stacked residual attention",
  JOURNAL   = IVC,
  VOLUME    = "144",
  YEAR      = "2024",
  PAGES     = "104965",
  BIBSOURCE = "http://www.visionbib.com/bibliography/match607attic3.html#TT129045"
}

@article{bb133006,
  AUTHOR    = "Du, R. and Zhang, W. K. and Li, S. and Chen, J. L. and Guo, Z.",
  TITLE     = "Spatial guided image captioning: Guiding attention with object's spatial interaction",
  JOURNAL   = IET-IPR,
  VOLUME    = "18",
  YEAR      = "2024",
  NUMBER    = "12",
  PAGES     = "3368--3380",
  BIBSOURCE = "http://www.visionbib.com/bibliography/match607attic3.html#TT129046"
}

@article{bb133007,
  AUTHOR    = "Zhang, X. D. and Jia, A. and Ji, J. Z. and Qu, L. Q. and Ye, Q. X.",
  TITLE     = "Intra- and Inter-Head Orthogonal Attention for Image Captioning",
  JOURNAL   = IP,
  VOLUME    = "34",
  YEAR      = "2025",
  PAGES     = "594--607",
  BIBSOURCE = "http://www.visionbib.com/bibliography/match607attic3.html#TT129047"
}

@article{bb133008,
  AUTHOR    = "Song, L. F. and Wang, Y. and Shi, L. and Yu, J. Z. and Li, F. and Xiang, S. M.",
  TITLE     = "Transformer with token attention and attribute prediction for image captioning",
  JOURNAL   = PRL,
  VOLUME    = "188",
  YEAR      = "2025",
  PAGES     = "74--80",
  BIBSOURCE = "http://www.visionbib.com/bibliography/match607attic3.html#TT129048"
}

@article{bb133009,
  AUTHOR    = "Parseh, M. J. and Ghadiri, S.",
  TITLE     = "Graph-based image captioning with semantic and spatial features",
  JOURNAL   = SP:IC,
  VOLUME    = "133",
  YEAR      = "2025",
  PAGES     = "117273",
  BIBSOURCE = "http://www.visionbib.com/bibliography/match607attic3.html#TT129049"
}

@inproceedings{bb133010,
  AUTHOR    = "Sui, J. H. and Yu, H. M. and Liang, X. Y. and Ping, P.",
  TITLE     = "Image Caption Method Based on Graph Attention Network with Global Context",
  BOOKTITLE = ICIVC22,
  YEAR      = "2022",
  PAGES     = "480--487",
  BIBSOURCE = "http://www.visionbib.com/bibliography/match607attic3.html#TT129050"
}

@inproceedings{bb133011,
  AUTHOR    = "Popattia, M. and Rafi, M. and Qureshi, R. and Nawaz, S.",
  TITLE     = "Guiding Attention using Partial-Order Relationships for Image Captioning",
  BOOKTITLE = MULA22,
  YEAR      = "2022",
  PAGES     = "4670--4679",
  BIBSOURCE = "http://www.visionbib.com/bibliography/match607attic3.html#TT129051"
}

@inproceedings{bb133012,
  AUTHOR    = "Deb, T. and Sadmanee, A. and Bhaumik, K. K. and Ali, A. A. and Amin, M. A. and Rahman, A. K. M. M.",
  TITLE     = "Variational Stacked Local Attention Networks for Diverse Video Captioning",
  BOOKTITLE = WACV22,
  YEAR      = "2022",
  PAGES     = "2493--2502",
  BIBSOURCE = "http://www.visionbib.com/bibliography/match607attic3.html#TT129052"
}

@inproceedings{bb133013,
  AUTHOR    = "Li, Z. and Tran, Q. and Mai, L. and Lin, Z. and Yuille, A. L.",
  TITLE     = "Context-Aware Group Captioning via Self-Attention and Contrastive Features",
  BOOKTITLE = CVPR20,
  YEAR      = "2020",
  PAGES     = "3437--3447",
  BIBSOURCE = "http://www.visionbib.com/bibliography/match607attic3.html#TT129053"
}

@inproceedings{bb133014,
  AUTHOR    = "Guo, L. and Liu, J. and Zhu, X. and Yao, P. and Lu, S. and Lu, H.",
  TITLE     = "Normalized and Geometry-Aware Self-Attention Network for Image Captioning",
  BOOKTITLE = CVPR20,
  YEAR      = "2020",
  PAGES     = "10324--10333",
  BIBSOURCE = "http://www.visionbib.com/bibliography/match607attic3.html#TT129054"
}

@inproceedings{bb133015,
  AUTHOR    = "Pan, Y. and Yao, T. and Li, Y. and Mei, T.",
  TITLE     = "{X-Linear} Attention Networks for Image Captioning",
  BOOKTITLE = CVPR20,
  YEAR      = "2020",
  PAGES     = "10968--10977",
  BIBSOURCE = "http://www.visionbib.com/bibliography/match607attic3.html#TT129055"
}

@inproceedings{bb133016,
  AUTHOR    = "Park, G. and Han, C. and Kim, D. and Yoon, W. J.",
  TITLE     = "{MHSAN}: Multi-Head Self-Attention Network for Visual Semantic Embedding",
  BOOKTITLE = WACV20,
  YEAR      = "2020",
  PAGES     = "1507--1515",
  BIBSOURCE = "http://www.visionbib.com/bibliography/match607attic3.html#TT129056"
}

@inproceedings{bb133017,
  AUTHOR    = "He, S. and Tavakoli, H. R. and Borji, A. and Pugeault, N.",
  TITLE     = "Human Attention in Image Captioning: Dataset and Analysis",
  BOOKTITLE = ICCV19,
  YEAR      = "2019",
  PAGES     = "8528--8537",
  BIBSOURCE = "http://www.visionbib.com/bibliography/match607attic3.html#TT129057"
}

@inproceedings{bb133018,
  AUTHOR    = "Huang, L. and Wang, W. and Chen, J. and Wei, X.",
  TITLE     = "Attention on Attention for Image Captioning",
  BOOKTITLE = ICCV19,
  YEAR      = "2019",
  PAGES     = "4633--4642",
  BIBSOURCE = "http://www.visionbib.com/bibliography/match607attic3.html#TT129058"
}

@inproceedings{bb133019,
  AUTHOR    = "Wei, H. Y. and Li, Z. X. and Zhang, C. L.",
  TITLE     = "Image Captioning Based on Visual and Semantic Attention",
  BOOKTITLE = MMMod20,
  YEAR      = "2020",
  PAGES     = "I:151--162",
  BIBSOURCE = "http://www.visionbib.com/bibliography/match607attic3.html#TT129059"
}

@inproceedings{bb133020,
  AUTHOR    = "Fukui, H. and Hirakawa, T. and Yamashita, T. and Fujiyoshi, H.",
  TITLE     = "Attention Branch Network: Learning of Attention Mechanism for Visual Explanation",
  BOOKTITLE = CVPR19,
  YEAR      = "2019",
  PAGES     = "10697--10706",
  BIBSOURCE = "http://www.visionbib.com/bibliography/match607attic3.html#TT129060"
}

@inproceedings{bb133021,
  AUTHOR    = "Huang, Y. and Li, C. and Li, T. and Wan, W. and Chen, J.",
  TITLE     = "Image Captioning with Attribute Refinement",
  BOOKTITLE = ICIP19,
  YEAR      = "2019",
  PAGES     = "1820--1824",
  BIBSOURCE = "http://www.visionbib.com/bibliography/match607attic3.html#TT129061"
}

@inproceedings{bb133022,
  AUTHOR    = "Shi, J. and Li, Y. and Wang, S.",
  TITLE     = "Cascade Attention: Multiple Feature Based Learning for Image Captioning",
  BOOKTITLE = ICIP19,
  YEAR      = "2019",
  PAGES     = "1970--1974",
  BIBSOURCE = "http://www.visionbib.com/bibliography/match607attic3.html#TT129062"
}

@inproceedings{bb133023,
  AUTHOR    = "Xiao, H. and Shi, J.",
  TITLE     = "A Novel Attribute Selection Mechanism for Video Captioning",
  BOOKTITLE = ICIP19,
  YEAR      = "2019",
  PAGES     = "619--623",
  BIBSOURCE = "http://www.visionbib.com/bibliography/match607attic3.html#TT129063"
}

@inproceedings{bb133024,
  AUTHOR    = "Wang, Q. Z. and Chan, A. B.",
  TITLE     = "Gated Hierarchical Attention for Image Captioning",
  BOOKTITLE = ACCV18,
  YEAR      = "2018",
  PAGES     = "IV:21--37",
  BIBSOURCE = "http://www.visionbib.com/bibliography/match607attic3.html#TT129064"
}

@inproceedings{bb133025,
  AUTHOR    = "Wang, W. X. and Chen, Z. H. and Hu, H. F.",
  TITLE     = "Multivariate Attention Network for Image Captioning",
  BOOKTITLE = ACCV18,
  YEAR      = "2018",
  PAGES     = "VI:587--602",
  BIBSOURCE = "http://www.visionbib.com/bibliography/match607attic3.html#TT129065"
}

@inproceedings{bb133026,
  AUTHOR    = "Ghanimifard, M. and Dobnik, S.",
  TITLE     = "Knowing When to Look for What and Where: Evaluating Generation of Spatial Descriptions with Adaptive Attention",
  BOOKTITLE = VL18,
  YEAR      = "2018",
  PAGES     = "IV:153--161",
  BIBSOURCE = "http://www.visionbib.com/bibliography/match607attic3.html#TT129066"
}

% NOTE(review): the end page 20248 looks like a typo (range 2024--20248);
% value kept as given -- TODO confirm against the proceedings.
@inproceedings{bb133027,
  AUTHOR    = "Khademi, M. and Schulte, O.",
  TITLE     = "Image Caption Generation with Hierarchical Contextual Visual Spatial Attention",
  BOOKTITLE = Cognitive18,
  YEAR      = "2018",
  PAGES     = "2024--20248",
  BIBSOURCE = "http://www.visionbib.com/bibliography/match607attic3.html#TT129067"
}

@inproceedings{bb133028,
  AUTHOR    = "Wang, F. and Gong, X. and Huang, L.",
  TITLE     = "Time-Dependent Pre-attention Model for Image Captioning",
  BOOKTITLE = ICPR18,
  YEAR      = "2018",
  PAGES     = "3297--3302",
  BIBSOURCE = "http://www.visionbib.com/bibliography/match607attic3.html#TT129068"
}

@inproceedings{bb133029,
  AUTHOR    = "Chen, S. and Zhao, Q.",
  TITLE     = "Boosted Attention: Leveraging Human Attention for Image Captioning",
  BOOKTITLE = ECCV18,
  YEAR      = "2018",
  PAGES     = "XI: 72--88",
  BIBSOURCE = "http://www.visionbib.com/bibliography/match607attic3.html#TT129069"
}

@inproceedings{bb133030,
  AUTHOR    = "Fang, F. and Wang, H. and Tang, P.",
  TITLE     = "Image Captioning with Word Level Attention",
  BOOKTITLE = ICIP18,
  YEAR      = "2018",
  PAGES     = "1278--1282",
  BIBSOURCE = "http://www.visionbib.com/bibliography/match607attic3.html#TT129070"
}

@inproceedings{bb133031,
  AUTHOR    = "Zhu, Z. and Xue, Z. and Yuan, Z.",
  TITLE     = "Topic-Guided Attention for Image Captioning",
  BOOKTITLE = ICIP18,
  YEAR      = "2018",
  PAGES     = "2615--2619",
  BIBSOURCE = "http://www.visionbib.com/bibliography/match607attic3.html#TT129071"
}

@inproceedings{bb133032,
  AUTHOR    = "Pedersoli, M. and Lucas, T. and Schmid, C. and Verbeek, J.",
  TITLE     = "Areas of Attention for Image Captioning",
  BOOKTITLE = ICCV17,
  YEAR      = "2017",
  PAGES     = "1251--1259",
  BIBSOURCE = "http://www.visionbib.com/bibliography/match607attic3.html#TT129072"
}

% NOTE(review): first author corrected from "Tavakoliy" to "Tavakoli"
% (cf. "Tavakoli, H. R." with co-author Borji in bb133017) -- confirm.
@inproceedings{bb133033,
  AUTHOR    = "Tavakoli, H. R. and Shetty, R. and Borji, A. and Laaksonen, J.",
  TITLE     = "Paying Attention to Descriptions Generated by Image Captioning Models",
  BOOKTITLE = ICCV17,
  YEAR      = "2017",
  PAGES     = "2506--2515",
  BIBSOURCE = "http://www.visionbib.com/bibliography/match607attic3.html#TT129073"
}

@inproceedings{bb133034,
  AUTHOR    = "Lu, J. and Xiong, C. and Parikh, D. and Socher, R.",
  TITLE     = "Knowing When to Look: Adaptive Attention via a Visual Sentinel for Image Captioning",
  BOOKTITLE = CVPR17,
  YEAR      = "2017",
  PAGES     = "3242--3250",
  BIBSOURCE = "http://www.visionbib.com/bibliography/match607attic3.html#TT129074"
}

@inproceedings{bb133035,
  AUTHOR    = "Chen, L. and Zhang, H. and Xiao, J. and Nie, L. and Shao, J. and Liu, W. and Chua, T. S.",
  TITLE     = "{SCA-CNN}: Spatial and Channel-Wise Attention in Convolutional Networks for Image Captioning",
  BOOKTITLE = CVPR17,
  YEAR      = "2017",
  PAGES     = "6298--6306",
  BIBSOURCE = "http://www.visionbib.com/bibliography/match607attic3.html#TT129075"
}

@inproceedings{bb133036,
  AUTHOR    = "Zanfir, M. and Marinoiu, E. and Sminchisescu, C.",
  TITLE     = "Spatio-Temporal Attention Models for Grounded Video Captioning",
  BOOKTITLE = ACCV16,
  YEAR      = "2016",
  PAGES     = "IV: 104--119",
  BIBSOURCE = "http://www.visionbib.com/bibliography/match607attic3.html#TT129076"
}

@inproceedings{bb133037,
  AUTHOR    = "Chen, T. H. and Zeng, K. H. and Hsu, W. T. and Sun, M.",
  TITLE     = "Video Captioning via Sentence Augmentation and Spatio-Temporal Attention",
  BOOKTITLE = Assist16,
  YEAR      = "2016",
  PAGES     = "I: 269--286",
  BIBSOURCE = "http://www.visionbib.com/bibliography/match607attic3.html#TT129077"
}

@inproceedings{bb133038,
  AUTHOR    = "Chen, T. L. and Zhang, Z. P. and You, Q. Z. and Fang, C. and Wang, Z. W. and Jin, H. L. and Luo, J. B.",
  TITLE     = "'Factual' or 'Emotional': Stylized Image Captioning with Adaptive Learning and Attention",
  BOOKTITLE = ECCV18,
  YEAR      = "2018",
  PAGES     = "X: 527--543",
  BIBSOURCE = "http://www.visionbib.com/bibliography/match607attic3.html#TT129078"
}

@inproceedings{bb133039,
  AUTHOR    = "You, Q. Z. and Jin, H. L. and Wang, Z. W. and Fang, C. and Luo, J. B.",
  TITLE     = "Image Captioning with Semantic Attention",
  BOOKTITLE = CVPR16,
  YEAR      = "2016",
  PAGES     = "4651--4659",
  BIBSOURCE = "http://www.visionbib.com/bibliography/match607attic3.html#TT129079"
}

@article{bb133040,
  AUTHOR    = "Lu, X. and Wang, B. and Zheng, X. and Li, X.",
  TITLE     = "Exploring Models and Data for Remote Sensing Image Caption Generation",
  JOURNAL   = GeoRS,
  VOLUME    = "56",
  YEAR      = "2018",
  NUMBER    = "4",
  MONTH     = apr,
  PAGES     = "2183--2195",
  BIBSOURCE = "http://www.visionbib.com/bibliography/match607rsic2.html#TT129080"
}

% NOTE(review): PAGES was the placeholder "xx-yy"; omitted until the real
% pages/article number is confirmed.
@article{bb133041,
  AUTHOR    = "Zhang, X. R. and Wang, X. and Tang, X. and Zhou, H. Y. and Li, C.",
  TITLE     = "Description Generation for Remote Sensing Images Using Attribute Attention Mechanism",
  JOURNAL   = RS,
  VOLUME    = "11",
  YEAR      = "2019",
  NUMBER    = "6",
  BIBSOURCE = "http://www.visionbib.com/bibliography/match607rsic2.html#TT129081"
}

% NOTE(review): PAGES was the placeholder "xx-yy"; omitted until the real
% pages/article number is confirmed.
@article{bb133042,
  AUTHOR    = "Zhang, Z. Y. and Diao, W. H. and Zhang, W. K. and Yan, M. L. and Gao, X. and Sun, X.",
  TITLE     = "{LAM}: Remote Sensing Image Captioning with Label-Attention Mechanism",
  JOURNAL   = RS,
  VOLUME    = "11",
  YEAR      = "2019",
  NUMBER    = "20",
  BIBSOURCE = "http://www.visionbib.com/bibliography/match607rsic2.html#TT129082"
}

% NOTE(review): PAGES was the placeholder "xx-yy"; omitted until the real
% pages/article number is confirmed.
@article{bb133043,
  AUTHOR    = "Fu, K. and Li, Y. and Zhang, W. K. and Yu, H. F. and Sun, X.",
  TITLE     = "Boosting Memory with a Persistent Memory Mechanism for Remote Sensing Image Captioning",
  JOURNAL   = RS,
  VOLUME    = "12",
  YEAR      = "2020",
  NUMBER    = "11",
  BIBSOURCE = "http://www.visionbib.com/bibliography/match607rsic2.html#TT129083"
}

@article{bb133044,
  AUTHOR    = "Lu, X. and Wang, B. and Zheng, X.",
  TITLE     = "Sound Active Attention Framework for Remote Sensing Image Captioning",
  JOURNAL   = GeoRS,
  VOLUME    = "58",
  YEAR      = "2020",
  NUMBER    = "3",
  MONTH     = mar,
  PAGES     = "1985--2000",
  BIBSOURCE = "http://www.visionbib.com/bibliography/match607rsic2.html#TT129084"
}

% NOTE(review): PAGES was the placeholder "xx-yy"; omitted until the real
% pages/article number is confirmed.
@article{bb133045,
  AUTHOR    = "Li, Y. Y. and Fang, S. K. and Jiao, L. C. and Liu, R. J. and Shang, R. H.",
  TITLE     = "A Multi-Level Attention Model for Remote Sensing Image Captions",
  JOURNAL   = RS,
  VOLUME    = "12",
  YEAR      = "2020",
  NUMBER    = "6",
  BIBSOURCE = "http://www.visionbib.com/bibliography/match607rsic2.html#TT129085"
}

@article{bb133046,
  AUTHOR    = "Li, X. L. and Zhang, X. T. and Huang, W. and Wang, Q.",
  TITLE     = "Truncation Cross Entropy Loss for Remote Sensing Image Captioning",
  JOURNAL   = GeoRS,
  VOLUME    = "59",
  YEAR      = "2021",
  NUMBER    = "6",
  MONTH     = jun,
  PAGES     = "5246--5257",
  BIBSOURCE = "http://www.visionbib.com/bibliography/match607rsic2.html#TT129086"
}

@article{bb133047,
  AUTHOR    = "Sumbul, G. and Nayak, S. and Demir, B.",
  TITLE     = "{SD-RSIC}: Summarization-Driven Deep Remote Sensing Image Captioning",
  JOURNAL   = GeoRS,
  VOLUME    = "59",
  YEAR      = "2021",
  NUMBER    = "8",
  MONTH     = aug,
  PAGES     = "6922--6934",
  BIBSOURCE = "http://www.visionbib.com/bibliography/match607rsic2.html#TT129087"
}

@article{bb133048,
  AUTHOR    = "Wang, Q. and Huang, W. and Zhang, X. T. and Li, X. L.",
  TITLE     = "Word-Sentence Framework for Remote Sensing Image Captioning",
  JOURNAL   = GeoRS,
  VOLUME    = "59",
  YEAR      = "2021",
  NUMBER    = "12",
  MONTH     = dec,
  PAGES     = "10532--10543",
  BIBSOURCE = "http://www.visionbib.com/bibliography/match607rsic2.html#TT129088"
}

@article{bb133049,
  AUTHOR    = "Yang, Q. Q. and Ni, Z. H. and Ren, P.",
  TITLE     = "Meta captioning: A meta learning based remote sensing image captioning framework",
  JOURNAL   = PandRS,
  VOLUME    = "186",
  YEAR      = "2022",
  PAGES     = "190--200",
  BIBSOURCE = "http://www.visionbib.com/bibliography/match607rsic2.html#TT129089"
}

@article{bb133050,
  AUTHOR    = "Liu, Z. Y. and Dong, A. M. and Yu, J. G. and Han, Y. B. and Zhou, Y. and Zhao, K.",
  TITLE     = "Scene classification for remote sensing images with self-attention augmented {CNN}",
  JOURNAL   = IET-IPR,
  VOLUME    = "16",
  YEAR      = "2022",
  NUMBER    = "11",
  PAGES     = "3085--3096",
  BIBSOURCE = "http://www.visionbib.com/bibliography/match607rsic2.html#TT129090"
}

% NOTE(review): PAGES was the placeholder "xx-yy"; omitted until the real
% pages/article number is confirmed.
@article{bb133051,
  AUTHOR    = "Zhou, H. and Du, X. P. and Xia, L. and Li, S.",
  TITLE     = "Self-Learning for Few-Shot Remote Sensing Image Captioning",
  JOURNAL   = RS,
  VOLUME    = "14",
  YEAR      = "2022",
  NUMBER    = "18",
  BIBSOURCE = "http://www.visionbib.com/bibliography/match607rsic2.html#TT129091"
}

@article{bb133052,
  AUTHOR    = "Wang, Q. and Huang, W. and Zhang, X. T. and Li, X. L.",
  TITLE     = "{GLCM}: Global-Local Captioning Model for Remote Sensing Image Captioning",
  JOURNAL   = Cyber,
  VOLUME    = "53",
  YEAR      = "2023",
  NUMBER    = "11",
  MONTH     = nov,
  PAGES     = "6910--6922",
  BIBSOURCE = "http://www.visionbib.com/bibliography/match607rsic2.html#TT129092"
}

@article{bb133053,
  AUTHOR    = "Cheng, Q. and Xu, Y. Q. and Huang, Z. Y.",
  TITLE     = "{VCC-DiffNet}: Visual Conditional Control Diffusion Network for Remote Sensing Image Captioning",
  JOURNAL   = RS,
  VOLUME    = "16",
  YEAR      = "2024",
  NUMBER    = "16",
  PAGES     = "2961",
  BIBSOURCE = "http://www.visionbib.com/bibliography/match607rsic2.html#TT129093"
}

@article{bb133054,
  AUTHOR    = "Li, Y. P. and Zhang, X. R. and Zhang, T. Y. and Wang, G. C. and Wang, X. L. and Li, S.",
  TITLE     = "A Patch-Level Region-Aware Module with a Multi-Label Framework for Remote Sensing Image Captioning",
  JOURNAL   = RS,
  VOLUME    = "16",
  YEAR      = "2024",
  NUMBER    = "21",
  PAGES     = "3987",
  BIBSOURCE = "http://www.visionbib.com/bibliography/match607rsic2.html#TT129094"
}

@article{bb133055,
  AUTHOR    = "Zhang, K. and Li, P. and Wang, J. Q.",
  TITLE     = "A Review of Deep Learning-Based Remote Sensing Image Caption: Methods, Models, Comparisons and Future Directions",
  JOURNAL   = RS,
  VOLUME    = "16",
  YEAR      = "2024",
  NUMBER    = "21",
  PAGES     = "4113",
  BIBSOURCE = "http://www.visionbib.com/bibliography/match607rsic2.html#TT129095"
}

@article{bb133056,
  AUTHOR    = "Leng, G. and Xiong, Y. J. and Qiu, C. P. and Guo, C. Z.",
  TITLE     = "Discrete diffusion models with Refined Language-Image Pre-trained representations for remote sensing image captioning",
  JOURNAL   = PRL,
  VOLUME    = "186",
  YEAR      = "2024",
  PAGES     = "164--169",
  BIBSOURCE = "http://www.visionbib.com/bibliography/match607rsic2.html#TT129096"
}

@article{bb133057,
  AUTHOR    = "Guo, Z. and Liu, H. M. and Ren, Z. and Jiao, L. C. and Gou, S. P. and Li, R. M.",
  TITLE     = "Attribute-Based Learning for Remote Sensing Image Captioning in Unseen Scenes",
  JOURNAL   = RS,
  VOLUME    = "17",
  YEAR      = "2025",
  NUMBER    = "7",
  PAGES     = "1237",
  BIBSOURCE = "http://www.visionbib.com/bibliography/match607rsic2.html#TT129097"
}

@inproceedings{bb133058,
  AUTHOR    = "Wei, Y. C. and Li, L. and Geng, S. L.",
  TITLE     = "Remote Sensing Image Captioning Using {Hire-MLP}",
  BOOKTITLE = CVIDL23,
  YEAR      = "2023",
  PAGES     = "109--112",
  BIBSOURCE = "http://www.visionbib.com/bibliography/match607rsic2.html#TT129098"
}

@inproceedings{bb133059,
  AUTHOR    = "Chavhan, R. and Banerjee, B. and Zhu, X. X. and Chaudhuri, S.",
  TITLE     = "A Novel Actor Dual-Critic Model for Remote Sensing Image Captioning",
  BOOKTITLE = ICPR21,
  YEAR      = "2021",
  PAGES     = "4918--4925",
  BIBSOURCE = "http://www.visionbib.com/bibliography/match607rsic2.html#TT129099"
}

@article{bb133060,
  AUTHOR    = "Nakayama, H. and Harada, T. and Kuniyoshi, Y.",
  TITLE     = "Dense Sampling Low-Level Statistics of Local Features",
  JOURNAL   = IEICE,
  VOLUME    = "E93-D",
  YEAR      = "2010",
  NUMBER    = "7",
  MONTH     = jul,
  PAGES     = "1727--1736",
  BIBSOURCE = "http://www.visionbib.com/bibliography/match607ian2.html#TT129100"
}

@inproceedings{bb133061,
  AUTHOR    = "Kuniyoshi, Y. and Harada, T. and Nakayama, H.",
  TITLE     = "Dense Sampling Low-Level Statistics of Local Features",
  BOOKTITLE = CIVR09,
  YEAR      = "2009",
  PAGES     = "Article No 17",
  BIBSOURCE = "http://www.visionbib.com/bibliography/match607ian2.html#TT129100"
}

@inproceedings{bb133062,
  AUTHOR    = "Nakayama, H. and Harada, T. and Kuniyoshi, Y.",
  TITLE     = "Global {Gaussian} approach for scene categorization using information geometry",
  BOOKTITLE = CVPR10,
  YEAR      = "2010",
  PAGES     = "2336--2343",
  BIBSOURCE = "http://www.visionbib.com/bibliography/match607ian2.html#TT129101"
}

@inproceedings{bb133063,
  AUTHOR    = "Nakayama, H. and Harada, T. and Kuniyoshi, Y.",
  TITLE     = "{AI Goggles}: Real-time Description and Retrieval in the Real World with Online Learning",
  BOOKTITLE = CRV09,
  YEAR      = "2009",
  PAGES     = "184--191",
  BIBSOURCE = "http://www.visionbib.com/bibliography/match607ian2.html#TT129102"
}

@inproceedings{bb133064,
  AUTHOR    = "Ushiku, Y. and Yamaguchi, M. and Mukuta, Y. and Harada, T.",
  TITLE     = "Common Subspace for Model and Similarity: Phrase Learning for Caption Generation from Images",
  BOOKTITLE = ICCV15,
  YEAR      = "2015",
  PAGES     = "2668--2676",
  BIBSOURCE = "http://www.visionbib.com/bibliography/match607ian2.html#TT129103"
}

@inproceedings{bb133065,
  AUTHOR    = "Harada, T. and Nakayama, H. and Kuniyoshi, Y.",
  TITLE     = "Improving Local Descriptors by Embedding Global and Local Spatial Information",
  BOOKTITLE = ECCV10,
  YEAR      = "2010",
  PAGES     = "IV: 736--749",
  BIBSOURCE = "http://www.visionbib.com/bibliography/match607ian2.html#TT129104"
}

% NOTE(review): PAGES was the placeholder "xx-yy"; omitted until the real
% page range is confirmed.
@inproceedings{bb133066,
  AUTHOR    = "Nakayama, H. and Harada, T. and Kuniyoshi, Y.",
  TITLE     = "Evaluation of dimensionality reduction methods for image auto-annotation",
  BOOKTITLE = BMVC10,
  YEAR      = "2010",
  BIBSOURCE = "http://www.visionbib.com/bibliography/match607ian2.html#TT129105"
}

@inproceedings{bb133067,
  AUTHOR    = "Jin, J. and Nakayama, H.",
  TITLE     = "Annotation order matters: Recurrent Image Annotator for arbitrary length image tagging",
  BOOKTITLE = ICPR16,
  YEAR      = "2016",
  PAGES     = "2452--2457",
  BIBSOURCE = "http://www.visionbib.com/bibliography/match607ian2.html#TT129106"
}

@article{bb133068,
  AUTHOR    = "Tariq, A. and Foroosh, H.",
  TITLE     = "A Context-Driven Extractive Framework for Generating Realistic Image Descriptions",
  JOURNAL   = IP,
  VOLUME    = "26",
  YEAR      = "2017",
  NUMBER    = "2",
  MONTH     = feb,
  PAGES     = "619--632",
  BIBSOURCE = "http://www.visionbib.com/bibliography/match607ian2.html#TT129107"
}

@article{bb133069,
  AUTHOR    = "Cheng, Q. and Zhang, Q. and Fu, P. and Tu, C. H. and Li, S.",
  TITLE     = "A survey and analysis on automatic image annotation",
  JOURNAL   = PR,
  VOLUME    = "79",
  YEAR      = "2018",
  PAGES     = "242--259",
  BIBSOURCE = "http://www.visionbib.com/bibliography/match607ian2.html#TT129108"
}

@article{bb133070,
  AUTHOR    = "Ben Rejeb, I. and Ouni, S. and Barhoumi, W. and Zagrouba, E.",
  TITLE     = "Fuzzy {VA-Files} for multi-label image annotation based on visual content of regions",
  JOURNAL   = SIViP,
  VOLUME    = "12",
  YEAR      = "2018",
  NUMBER    = "5",
  MONTH     = jul,
  PAGES     = "877--884",
  BIBSOURCE = "http://www.visionbib.com/bibliography/match607ian2.html#TT129109"
}

@article{bb133071,
  AUTHOR    = "Helmy, T.",
  TITLE     = "A Generic Framework for Semantic Annotation of Images",
  JOURNAL   = IJIG,
  VOLUME    = "18",
  YEAR      = "2018",
  NUMBER    = "3",
  MONTH     = jul,
  PAGES     = "Article 1850013",
  BIBSOURCE = "http://www.visionbib.com/bibliography/match607ian2.html#TT129110"
}

@article{bb133072,
  AUTHOR    = "Hu, J. and Lam, K. M. and Lou, P. and Liu, Q. and Deng, W. P.",
  TITLE     = "Can a machine have two systems for recognition, like human beings?",
  JOURNAL   = JVCIR,
  VOLUME    = "56",
  YEAR      = "2018",
  PAGES     = "275--286",
  BIBSOURCE = "http://www.visionbib.com/bibliography/match607ian2.html#TT129111"
}

@article{bb133073,
  AUTHOR    = "Bhagat, P. K. and Choudhary, P.",
  TITLE     = "Image annotation: Then and now",
  JOURNAL   = IVC,
  VOLUME    = "80",
  YEAR      = "2018",
  PAGES     = "1--23",
  BIBSOURCE = "http://www.visionbib.com/bibliography/match607ian2.html#TT129112"
}

@article{bb133074,
  AUTHOR    = "Bazrafkan, S. and Javidnia, H. and Corcoran, P.",
  TITLE     = "Latent space mapping for generation of object elements with corresponding data annotation",
  JOURNAL   = PRL,
  VOLUME    = "116",
  YEAR      = "2018",
  PAGES     = "179--186",
  BIBSOURCE = "http://www.visionbib.com/bibliography/match607ian2.html#TT129113"
}

@article{bb133075,
  AUTHOR    = "Jiu, M. Y. and Sahbi, H.",
  TITLE     = "Deep representation design from deep kernel networks",
  JOURNAL   = PR,
  VOLUME    = "88",
  YEAR      = "2019",
  PAGES     = "447--457",
  BIBSOURCE = "http://www.visionbib.com/bibliography/match607ian2.html#TT129114"
}

@article{bb133076,
  AUTHOR    = "Foumani, S. N. M. and Nickabadi, A.",
  TITLE     = "A probabilistic topic model using deep visual word representation for simultaneous image classification and annotation",
  JOURNAL   = JVCIR,
  VOLUME    = "59",
  YEAR      = "2019",
  PAGES     = "195--203",
  BIBSOURCE = "http://www.visionbib.com/bibliography/match607ian2.html#TT129115"
}

@article{bb133077,
  AUTHOR    = "Zhang, J. J. and Wu, Q. and Zhang, J. and Shen, C. H. and Lu, J. F. and Wu, Q. A.",
  TITLE     = "Heritage image annotation via collective knowledge",
  JOURNAL   = PR,
  VOLUME    = "93",
  YEAR      = "2019",
  PAGES     = "204--214",
  BIBSOURCE = "http://www.visionbib.com/bibliography/match607ian2.html#TT129116"
}

@article{bb133078,
  AUTHOR    = "Verma, Y.",
  TITLE     = "Diverse image annotation with missing labels",
  JOURNAL   = PR,
  VOLUME    = "93",
  YEAR      = "2019",
  PAGES     = "470--484",
  BIBSOURCE = "http://www.visionbib.com/bibliography/match607ian2.html#TT129117"
}

@article{bb133079,
  AUTHOR    = "Markatopoulou, F. and Mezaris, V. and Patras, I.",
  TITLE     = "Implicit and Explicit Concept Relations in Deep Neural Networks for Multi-Label Video/Image Annotation",
  JOURNAL   = CirSysVideo,
  VOLUME    = "29",
  YEAR      = "2019",
  NUMBER    = "6",
  MONTH     = jun,
  PAGES     = "1631--1644",
  BIBSOURCE = "http://www.visionbib.com/bibliography/match607ian2.html#TT129118"
}

@article{bb133080,
  AUTHOR    = "Laib, L. and Allili, M. S. and Ait Aoudia, S.",
  TITLE     = "A probabilistic topic model for event-based image classification and multi-label annotation",
  JOURNAL   = SP:IC,
  VOLUME    = "76",
  YEAR      = "2019",
  PAGES     = "283--294",
  BIBSOURCE = "http://www.visionbib.com/bibliography/match607ian2.html#TT129119"
}

@article{bb133081,
  AUTHOR    = "Olaode, A. and Naghdy, G.",
  TITLE     = "Review of the application of machine learning to the automatic semantic annotation of images",
  JOURNAL   = IET-IPR,
  VOLUME    = "13",
  YEAR      = "2019",
  NUMBER    = "8",
  MONTH     = jun,
  PAGES     = "1232--1245",
  BIBSOURCE = "http://www.visionbib.com/bibliography/match607ian2.html#TT129120"
}

@article{bb133082,
  AUTHOR    = "Zhang, C. J. and Cheng, J. and Tian, Q.",
  TITLE     = "Multiview, Few-Labeled Object Categorization by Predicting Labels With View Consistency",
  JOURNAL   = Cyber,
  VOLUME    = "49",
  YEAR      = "2019",
  NUMBER    = "11",
  MONTH     = nov,
  PAGES     = "3834--3843",
  BIBSOURCE = "http://www.visionbib.com/bibliography/match607ian2.html#TT129121"
}

@article{bb133083,
  AUTHOR    = "Tang, C. and Liu, X. W. and Wang, P. C. and Zhang, C. Q. and Li, M. M. and Wang, L. Z.",
  TITLE     = "Adaptive Hypergraph Embedded Semi-Supervised Multi-Label Image Annotation",
  JOURNAL   = MultMed,
  VOLUME    = "21",
  YEAR      = "2019",
  NUMBER    = "11",
  MONTH     = nov,
  PAGES     = "2837--2849",
  BIBSOURCE = "http://www.visionbib.com/bibliography/match607ian2.html#TT129122"
}

@article{bb133084,
  AUTHOR    = "Mundnich, K. and Booth, B. M. and Girault, B. and Narayanan, S.",
  TITLE     = "Generating labels for regression of subjective constructs using triplet embeddings",
  JOURNAL   = PRL,
  VOLUME    = "128",
  YEAR      = "2019",
  PAGES     = "385--392",
  BIBSOURCE = "http://www.visionbib.com/bibliography/match607ian2.html#TT129123"
}

@article{bb133085,
  AUTHOR    = "Chaudhary, C. and Goyal, P. and Prasad, D. N. and Chen, Y. P.",
  TITLE     = "Enhancing the Quality of Image Tagging Using a Visio-Textual Knowledge Base",
  JOURNAL   = MultMed,
  VOLUME    = "22",
  YEAR      = "2020",
  NUMBER    = "4",
  MONTH     = apr,
  PAGES     = "897--911",
  BIBSOURCE = "http://www.visionbib.com/bibliography/match607ian2.html#TT129124"
}

@article{bb133086,
  AUTHOR    = "Khatchatoorian, A. G. and Jamzad, M.",
  TITLE     = "Architecture to improve the accuracy of automatic image annotation systems",
  JOURNAL   = IET-CV,
  VOLUME    = "14",
  YEAR      = "2020",
  NUMBER    = "5",
  MONTH     = aug,
  PAGES     = "214--223",
  BIBSOURCE = "http://www.visionbib.com/bibliography/match607ian2.html#TT129125"
}

@article{bb133087,
  AUTHOR    = "Theodosiou, Z. and Tsapatsoulis, N.",
  TITLE     = "Image annotation: the effects of content, lexicon and annotation method",
  JOURNAL   = MultInfoRetr,
  VOLUME    = "9",
  YEAR      = "2020",
  NUMBER    = "3",
  MONTH     = sep,
  PAGES     = "191--203",
  BIBSOURCE = "http://www.visionbib.com/bibliography/match607ian2.html#TT129126"
}

@article{bb133088,
  AUTHOR    = "Haghighi, F. and Taher, M. R. H. and Zhou, Z. W. and Gotway, M. B. and Liang, J. M.",
  TITLE     = "Transferable Visual Words: Exploiting the Semantics of Anatomical Patterns for Self-Supervised Learning",
  JOURNAL   = MedImg,
  VOLUME    = "40",
  YEAR      = "2021",
  NUMBER    = "10",
  MONTH     = oct,
  PAGES     = "2857--2868",
  BIBSOURCE = "http://www.visionbib.com/bibliography/match607ian2.html#TT129127"
}

@article{bb133089,
  AUTHOR    = "Hochberg, D. C. and Greenspan, H. and Giryes, R.",
  TITLE     = "A Self Supervised {StyleGAN} for Image Annotation and Classification With Extremely Limited Labels",
  JOURNAL   = MedImg,
  VOLUME    = "41",
  YEAR      = "2022",
  NUMBER    = "12",
  MONTH     = dec,
  PAGES     = "3509--3519",
  BIBSOURCE = "http://www.visionbib.com/bibliography/match607ian2.html#TT129128"
}

@inproceedings{bb133090,
  AUTHOR    = "Lahtinen, T. and Turtiainen, H. and Costin, A.",
  TITLE     = "Brima: Low-Overhead Browser-Only Image Annotation Tool (Preprint)",
  BOOKTITLE = ICIP21,
  YEAR      = "2021",
  PAGES     = "2633--2637",
  BIBSOURCE = "http://www.visionbib.com/bibliography/match607ian2.html#TT129129"
}

@inproceedings{bb133091,
  AUTHOR    = "Lotfi, F. and Jamzad, M. and Beigy, H.",
  TITLE     = "Automatic Image Annotation using Tag Relations and Graph Convolutional Networks",
  BOOKTITLE = IPRIA21,
  YEAR      = "2021",
  PAGES     = "1--6",
  BIBSOURCE = "http://www.visionbib.com/bibliography/match607ian2.html#TT129130"
}

@inproceedings{bb133092,
  AUTHOR    = "Chen, X. Y. and Jiang, M. and Zhao, Q.",
  TITLE     = "Self-Distillation for Few-Shot Image Captioning",
  BOOKTITLE = WACV21,
  YEAR      = "2021",
  PAGES     = "545--555",
  BIBSOURCE = "http://www.visionbib.com/bibliography/match607ian2.html#TT129131"
}

@inproceedings{bb133093,
  AUTHOR    = "Jiu, M. and Sahbi, H.",
  TITLE     = "End-to-End Deep Kernel Map Design for Image Annotation",
  BOOKTITLE = ICIP20,
  YEAR      = "2020",
  PAGES     = "1546--1550",
  BIBSOURCE = "http://www.visionbib.com/bibliography/match607ian2.html#TT129132"
}

@inproceedings{bb133094,
  AUTHOR    = "Hu, H. and Misra, I. and van der Maaten, L.",
  TITLE     = "Evaluating Text-to-Image Matching using Binary Image Selection ({BISON})",
  BOOKTITLE = CLVL19,
  YEAR      = "2019",
  PAGES     = "1887--1890",
  BIBSOURCE = "http://www.visionbib.com/bibliography/match607ian2.html#TT129133"
}

@inproceedings{bb133095,
  AUTHOR    = "Gupta, T. and Schwing, A. G. and Hoiem, D.",
  TITLE     = "{ViCo}: Word Embeddings From Visual Co-Occurrences",
  BOOKTITLE = ICCV19,
  YEAR      = "2019",
  PAGES     = "7424--7433",
  BIBSOURCE = "http://www.visionbib.com/bibliography/match607ian2.html#TT129134"
}

@inproceedings{bb133096,
  AUTHOR    = "Bracha, L. and Chechik, G.",
  TITLE     = "Informative Object Annotations: Tell Me Something I Don't Know",
  BOOKTITLE = CVPR19,
  YEAR      = "2019",
  PAGES     = "12499--12507",
  BIBSOURCE = "http://www.visionbib.com/bibliography/match607ian2.html#TT129135"
}

@inproceedings{bb133097,
  AUTHOR    = "Rapson, C. J. and Seet, B. and Naeem, M. A. and Lee, J. E. and Al Sarayreh, M. and Klette, R.",
  TITLE     = "Reducing the Pain: A Novel Tool for Efficient Ground-Truth Labelling in Images",
  BOOKTITLE = IVCNZ18,
  YEAR      = "2018",
  PAGES     = "1--9",
  BIBSOURCE = "http://www.visionbib.com/bibliography/match607ian2.html#TT129136"
}

@inproceedings{bb133098,
  AUTHOR    = "Wu, B. Y. and Chen, W. D. and Sun, P. and Liu, W. and Ghanem, B. and Lyu, S. W.",
  TITLE     = "Tagging Like Humans: Diverse and Distinct Image Annotation",
  BOOKTITLE = CVPR18,
  YEAR      = "2018",
  PAGES     = "7967--7975",
  BIBSOURCE = "http://www.visionbib.com/bibliography/match607ian2.html#TT129137"
}

@inproceedings{bb133099,
  AUTHOR    = "Wu, X. J. and Zhang, L. and Li, F. Z. and Wang, B. J.",
  TITLE     = "A Novel Model for Multi-label Image Annotation",
  BOOKTITLE = ICPR18,
  YEAR      = "2018",
  PAGES     = "1953--1958",
  BIBSOURCE = "http://www.visionbib.com/bibliography/match607ian2.html#TT129138"
}