@article{bb133000,
  author    = {Shao, X. J. and Xiang, Z. L. and Li, Y. X. and Zhang, M. J.},
  title     = {Variational joint self-attention for image captioning},
  journal   = IET-IPR,
  volume    = {16},
  year      = {2022},
  number    = {8},
  pages     = {2075--2086},
  bibsource = {http://www.visionbib.com/bibliography/match607attic3.html#TT129040}
}

@article{bb133001,
  author    = {Ma, Y. W. and Ji, J. Y. and Sun, X. S. and Zhou, Y. and Ji, R. R.},
  title     = {Towards local visual modeling for image captioning},
  journal   = PR,
  volume    = {138},
  year      = {2023},
  pages     = {109420},
  bibsource = {http://www.visionbib.com/bibliography/match607attic3.html#TT129041}
}

@article{bb133002,
  author    = {Barati, A. and Farsi, H. and Mohamadzadeh, S.},
  title     = {Integration of the latent variable knowledge into deep image captioning with {Bayesian} modeling},
  journal   = IET-IPR,
  volume    = {17},
  year      = {2023},
  number    = {7},
  pages     = {2256--2271},
  bibsource = {http://www.visionbib.com/bibliography/match607attic3.html#TT129042}
}

@article{bb133003,
  author    = {Ji, J. Y. and Huang, X. Y. and Sun, X. S. and Zhou, Y. and Luo, G. and Cao, L. J. and Liu, J. Z. and Shao, L. and Ji, R. R.},
  title     = {Multi-Branch Distance-Sensitive Self-Attention Network for Image Captioning},
  journal   = MultMed,
  volume    = {25},
  year      = {2023},
  pages     = {3962--3974},
  bibsource = {http://www.visionbib.com/bibliography/match607attic3.html#TT129043}
}

@article{bb133004,
  author    = {Cornia, M. and Baraldi, L. and Tal, A. and Cucchiara, R.},
  title     = {Fully-attentive iterative networks for region-based controllable image and video captioning},
  journal   = CVIU,
  volume    = {237},
  year      = {2023},
  pages     = {103857},
  bibsource = {http://www.visionbib.com/bibliography/match607attic3.html#TT129044}
}

@article{bb133005,
  author    = {Song, L. F. and Li, F. and Wang, Y. and Liu, Y. and Wang, Y. H. and Xiang, S. M.},
  title     = {Image captioning: Semantic selection unit with stacked residual attention},
  journal   = IVC,
  volume    = {144},
  year      = {2024},
  pages     = {104965},
  bibsource = {http://www.visionbib.com/bibliography/match607attic3.html#TT129045}
}

@article{bb133006,
  author    = {Du, R. and Zhang, W. K. and Li, S. and Chen, J. L. and Guo, Z.},
  title     = {Spatial guided image captioning: Guiding attention with object's spatial interaction},
  journal   = IET-IPR,
  volume    = {18},
  year      = {2024},
  number    = {12},
  pages     = {3368--3380},
  bibsource = {http://www.visionbib.com/bibliography/match607attic3.html#TT129046}
}

@article{bb133007,
  author    = {Zhang, X. D. and Jia, A. and Ji, J. Z. and Qu, L. Q. and Ye, Q. X.},
  title     = {Intra- and Inter-Head Orthogonal Attention for Image Captioning},
  journal   = IP,
  volume    = {34},
  year      = {2025},
  pages     = {594--607},
  bibsource = {http://www.visionbib.com/bibliography/match607attic3.html#TT129047}
}

@article{bb133008,
  author    = {Song, L. F. and Wang, Y. and Shi, L. and Yu, J. Z. and Li, F. and Xiang, S. M.},
  title     = {Transformer with token attention and attribute prediction for image captioning},
  journal   = PRL,
  volume    = {188},
  year      = {2025},
  pages     = {74--80},
  bibsource = {http://www.visionbib.com/bibliography/match607attic3.html#TT129048}
}

@article{bb133009,
  author    = {Parseh, M. J. and Ghadiri, S.},
  title     = {Graph-based image captioning with semantic and spatial features},
  journal   = SP:IC,
  volume    = {133},
  year      = {2025},
  pages     = {117273},
  bibsource = {http://www.visionbib.com/bibliography/match607attic3.html#TT129049}
}

@inproceedings{bb133010,
  author    = {Sui, J. H. and Yu, H. M. and Liang, X. Y. and Ping, P.},
  title     = {Image Caption Method Based on Graph Attention Network with Global Context},
  booktitle = ICIVC22,
  year      = {2022},
  pages     = {480--487},
  bibsource = {http://www.visionbib.com/bibliography/match607attic3.html#TT129050}
}

@inproceedings{bb133011,
  author    = {Popattia, M. and Rafi, M. and Qureshi, R. and Nawaz, S.},
  title     = {Guiding Attention using Partial-Order Relationships for Image Captioning},
  booktitle = MULA22,
  year      = {2022},
  pages     = {4670--4679},
  bibsource = {http://www.visionbib.com/bibliography/match607attic3.html#TT129051}
}

@inproceedings{bb133012,
  author    = {Deb, T. and Sadmanee, A. and Bhaumik, K. K. and Ali, A. A. and Amin, M. A. and Rahman, A. K. M. M.},
  title     = {Variational Stacked Local Attention Networks for Diverse Video Captioning},
  booktitle = WACV22,
  year      = {2022},
  pages     = {2493--2502},
  bibsource = {http://www.visionbib.com/bibliography/match607attic3.html#TT129052}
}

@inproceedings{bb133013,
  author    = {Li, Z. and Tran, Q. and Mai, L. and Lin, Z. and Yuille, A. L.},
  title     = {Context-Aware Group Captioning via Self-Attention and Contrastive Features},
  booktitle = CVPR20,
  year      = {2020},
  pages     = {3437--3447},
  bibsource = {http://www.visionbib.com/bibliography/match607attic3.html#TT129053}
}

@inproceedings{bb133014,
  author    = {Guo, L. and Liu, J. and Zhu, X. and Yao, P. and Lu, S. and Lu, H.},
  title     = {Normalized and Geometry-Aware Self-Attention Network for Image Captioning},
  booktitle = CVPR20,
  year      = {2020},
  pages     = {10324--10333},
  bibsource = {http://www.visionbib.com/bibliography/match607attic3.html#TT129054}
}

@inproceedings{bb133015,
  author    = {Pan, Y. and Yao, T. and Li, Y. and Mei, T.},
  title     = {{X-Linear} Attention Networks for Image Captioning},
  booktitle = CVPR20,
  year      = {2020},
  pages     = {10968--10977},
  bibsource = {http://www.visionbib.com/bibliography/match607attic3.html#TT129055}
}

@inproceedings{bb133016,
  author    = {Park, G. and Han, C. and Kim, D. and Yoon, W. J.},
  title     = {{MHSAN}: Multi-Head Self-Attention Network for Visual Semantic Embedding},
  booktitle = WACV20,
  year      = {2020},
  pages     = {1507--1515},
  bibsource = {http://www.visionbib.com/bibliography/match607attic3.html#TT129056}
}

@inproceedings{bb133017,
  author    = {He, S. and Tavakoli, H. R. and Borji, A. and Pugeault, N.},
  title     = {Human Attention in Image Captioning: Dataset and Analysis},
  booktitle = ICCV19,
  year      = {2019},
  pages     = {8528--8537},
  bibsource = {http://www.visionbib.com/bibliography/match607attic3.html#TT129057}
}

@inproceedings{bb133018,
  author    = {Huang, L. and Wang, W. and Chen, J. and Wei, X.},
  title     = {Attention on Attention for Image Captioning},
  booktitle = ICCV19,
  year      = {2019},
  pages     = {4633--4642},
  bibsource = {http://www.visionbib.com/bibliography/match607attic3.html#TT129058}
}

@inproceedings{bb133019,
  author    = {Wei, H. Y. and Li, Z. X. and Zhang, C. L.},
  title     = {Image Captioning Based on Visual and Semantic Attention},
  booktitle = MMMod20,
  year      = {2020},
  pages     = {I:151--162},
  bibsource = {http://www.visionbib.com/bibliography/match607attic3.html#TT129059}
}

@inproceedings{bb133020,
  author    = {Fukui, H. and Hirakawa, T. and Yamashita, T. and Fujiyoshi, H.},
  title     = {Attention Branch Network: Learning of Attention Mechanism for Visual Explanation},
  booktitle = CVPR19,
  year      = {2019},
  pages     = {10697--10706},
  bibsource = {http://www.visionbib.com/bibliography/match607attic3.html#TT129060}
}

@inproceedings{bb133021,
  author    = {Huang, Y. and Li, C. and Li, T. and Wan, W. and Chen, J.},
  title     = {Image Captioning with Attribute Refinement},
  booktitle = ICIP19,
  year      = {2019},
  pages     = {1820--1824},
  bibsource = {http://www.visionbib.com/bibliography/match607attic3.html#TT129061}
}

@inproceedings{bb133022,
  author    = {Shi, J. and Li, Y. and Wang, S.},
  title     = {Cascade Attention: Multiple Feature Based Learning for Image Captioning},
  booktitle = ICIP19,
  year      = {2019},
  pages     = {1970--1974},
  bibsource = {http://www.visionbib.com/bibliography/match607attic3.html#TT129062}
}

@inproceedings{bb133023,
  author    = {Xiao, H. and Shi, J.},
  title     = {A Novel Attribute Selection Mechanism for Video Captioning},
  booktitle = ICIP19,
  year      = {2019},
  pages     = {619--623},
  bibsource = {http://www.visionbib.com/bibliography/match607attic3.html#TT129063}
}

@inproceedings{bb133024,
  author    = {Wang, Q. Z. and Chan, A. B.},
  title     = {Gated Hierarchical Attention for Image Captioning},
  booktitle = ACCV18,
  year      = {2018},
  pages     = {IV:21--37},
  bibsource = {http://www.visionbib.com/bibliography/match607attic3.html#TT129064}
}

@inproceedings{bb133025,
  author    = {Wang, W. X. and Chen, Z. H. and Hu, H. F.},
  title     = {Multivariate Attention Network for Image Captioning},
  booktitle = ACCV18,
  year      = {2018},
  pages     = {VI:587--602},
  bibsource = {http://www.visionbib.com/bibliography/match607attic3.html#TT129065}
}

@inproceedings{bb133026,
  author    = {Ghanimifard, M. and Dobnik, S.},
  title     = {Knowing When to Look for What and Where: Evaluating Generation of Spatial Descriptions with Adaptive Attention},
  booktitle = VL18,
  year      = {2018},
  pages     = {IV:153--161},
  bibsource = {http://www.visionbib.com/bibliography/match607attic3.html#TT129066}
}

% NOTE(review): the page range below (2024 to 20248) is implausible and looks
% like a typo carried over from the source data; the end page was left as found
% because the correct value cannot be determined from this file. Please verify.
@inproceedings{bb133027,
  author    = {Khademi, M. and Schulte, O.},
  title     = {Image Caption Generation with Hierarchical Contextual Visual Spatial Attention},
  booktitle = Cognitive18,
  year      = {2018},
  pages     = {2024--20248},
  bibsource = {http://www.visionbib.com/bibliography/match607attic3.html#TT129067}
}

@inproceedings{bb133028,
  author    = {Wang, F. and Gong, X. and Huang, L.},
  title     = {Time-Dependent Pre-attention Model for Image Captioning},
  booktitle = ICPR18,
  year      = {2018},
  pages     = {3297--3302},
  bibsource = {http://www.visionbib.com/bibliography/match607attic3.html#TT129068}
}

@inproceedings{bb133029,
  author    = {Chen, S. and Zhao, Q.},
  title     = {Boosted Attention: Leveraging Human Attention for Image Captioning},
  booktitle = ECCV18,
  year      = {2018},
  pages     = {XI: 72--88},
  bibsource = {http://www.visionbib.com/bibliography/match607attic3.html#TT129069}
}

@inproceedings{bb133030,
  author    = {Fang, F. and Wang, H. and Tang, P.},
  title     = {Image Captioning with Word Level Attention},
  booktitle = ICIP18,
  year      = {2018},
  pages     = {1278--1282},
  bibsource = {http://www.visionbib.com/bibliography/match607attic3.html#TT129070}
}

@inproceedings{bb133031,
  author    = {Zhu, Z. and Xue, Z. and Yuan, Z.},
  title     = {Topic-Guided Attention for Image Captioning},
  booktitle = ICIP18,
  year      = {2018},
  pages     = {2615--2619},
  bibsource = {http://www.visionbib.com/bibliography/match607attic3.html#TT129071}
}

@inproceedings{bb133032,
  author    = {Pedersoli, M. and Lucas, T. and Schmid, C. and Verbeek, J.},
  title     = {Areas of Attention for Image Captioning},
  booktitle = ICCV17,
  year      = {2017},
  pages     = {1251--1259},
  bibsource = {http://www.visionbib.com/bibliography/match607attic3.html#TT129072}
}

% First author's surname corrected from "Tavakoliy" to "Tavakoli", matching the
% spelling used for the same author (Tavakoli, H.R.) in entry bb133017.
@inproceedings{bb133033,
  author    = {Tavakoli, H. R. and Shetty, R. and Borji, A. and Laaksonen, J.},
  title     = {Paying Attention to Descriptions Generated by Image Captioning Models},
  booktitle = ICCV17,
  year      = {2017},
  pages     = {2506--2515},
  bibsource = {http://www.visionbib.com/bibliography/match607attic3.html#TT129073}
}

@inproceedings{bb133034,
  author    = {Lu, J. and Xiong, C. and Parikh, D. and Socher, R.},
  title     = {Knowing When to Look: Adaptive Attention via a Visual Sentinel for Image Captioning},
  booktitle = CVPR17,
  year      = {2017},
  pages     = {3242--3250},
  bibsource = {http://www.visionbib.com/bibliography/match607attic3.html#TT129074}
}

@inproceedings{bb133035,
  author    = {Chen, L. and Zhang, H. and Xiao, J. and Nie, L. and Shao, J. and Liu, W. and Chua, T. S.},
  title     = {{SCA-CNN}: Spatial and Channel-Wise Attention in Convolutional Networks for Image Captioning},
  booktitle = CVPR17,
  year      = {2017},
  pages     = {6298--6306},
  bibsource = {http://www.visionbib.com/bibliography/match607attic3.html#TT129075}
}

@inproceedings{bb133036,
  author    = {Zanfir, M. and Marinoiu, E. and Sminchisescu, C.},
  title     = {Spatio-Temporal Attention Models for Grounded Video Captioning},
  booktitle = ACCV16,
  year      = {2016},
  pages     = {IV: 104--119},
  bibsource = {http://www.visionbib.com/bibliography/match607attic3.html#TT129076}
}

@inproceedings{bb133037,
  author    = {Chen, T. H. and Zeng, K. H. and Hsu, W. T. and Sun, M.},
  title     = {Video Captioning via Sentence Augmentation and Spatio-Temporal Attention},
  booktitle = Assist16,
  year      = {2016},
  pages     = {I: 269--286},
  bibsource = {http://www.visionbib.com/bibliography/match607attic3.html#TT129077}
}

% Opening quotes use the LaTeX backtick form so they typeset as opening quotes;
% the quoted words are brace-protected so sentence-casing styles keep their capitals.
@inproceedings{bb133038,
  author    = {Chen, T. L. and Zhang, Z. P. and You, Q. Z. and Fang, C. and Wang, Z. W. and Jin, H. L. and Luo, J. B.},
  title     = {`{Factual}' or `{Emotional}': Stylized Image Captioning with Adaptive Learning and Attention},
  booktitle = ECCV18,
  year      = {2018},
  pages     = {X: 527--543},
  bibsource = {http://www.visionbib.com/bibliography/match607attic3.html#TT129078}
}

@inproceedings{bb133039,
  author    = {You, Q. Z. and Jin, H. L. and Wang, Z. W. and Fang, C. and Luo, J. B.},
  title     = {Image Captioning with Semantic Attention},
  booktitle = CVPR16,
  year      = {2016},
  pages     = {4651--4659},
  bibsource = {http://www.visionbib.com/bibliography/match607attic3.html#TT129079}
}

@article{bb133040,
  author    = {Lu, X. and Wang, B. and Zheng, X. and Li, X.},
  title     = {Exploring Models and Data for Remote Sensing Image Caption Generation},
  journal   = GeoRS,
  volume    = {56},
  year      = {2018},
  number    = {4},
  month     = apr,
  pages     = {2183--2195},
  bibsource = {http://www.visionbib.com/bibliography/match607rsic2.html#TT129080}
}

% NOTE(review): the source data carried the placeholder pages "xx-yy", which
% would print literally in a bibliography; the field is omitted until the real
% article number or page range is known.
@article{bb133041,
  author    = {Zhang, X. R. and Wang, X. and Tang, X. and Zhou, H. Y. and Li, C.},
  title     = {Description Generation for Remote Sensing Images Using Attribute Attention Mechanism},
  journal   = RS,
  volume    = {11},
  year      = {2019},
  number    = {6},
  bibsource = {http://www.visionbib.com/bibliography/match607rsic2.html#TT129081}
}

% NOTE(review): the source data carried the placeholder pages "xx-yy", which
% would print literally in a bibliography; the field is omitted until the real
% article number or page range is known.
@article{bb133042,
  author    = {Zhang, Z. Y. and Diao, W. H. and Zhang, W. K. and Yan, M. L. and Gao, X. and Sun, X.},
  title     = {{LAM}: Remote Sensing Image Captioning with Label-Attention Mechanism},
  journal   = RS,
  volume    = {11},
  year      = {2019},
  number    = {20},
  bibsource = {http://www.visionbib.com/bibliography/match607rsic2.html#TT129082}
}

% NOTE(review): the source data carried the placeholder pages "xx-yy", which
% would print literally in a bibliography; the field is omitted until the real
% article number or page range is known.
@article{bb133043,
  author    = {Fu, K. and Li, Y. and Zhang, W. K. and Yu, H. F. and Sun, X.},
  title     = {Boosting Memory with a Persistent Memory Mechanism for Remote Sensing Image Captioning},
  journal   = RS,
  volume    = {12},
  year      = {2020},
  number    = {11},
  bibsource = {http://www.visionbib.com/bibliography/match607rsic2.html#TT129083}
}

@article{bb133044,
  author    = {Lu, X. and Wang, B. and Zheng, X.},
  title     = {Sound Active Attention Framework for Remote Sensing Image Captioning},
  journal   = GeoRS,
  volume    = {58},
  year      = {2020},
  number    = {3},
  month     = mar,
  pages     = {1985--2000},
  bibsource = {http://www.visionbib.com/bibliography/match607rsic2.html#TT129084}
}

% NOTE(review): the source data carried the placeholder pages "xx-yy", which
% would print literally in a bibliography; the field is omitted until the real
% article number or page range is known.
@article{bb133045,
  author    = {Li, Y. Y. and Fang, S. K. and Jiao, L. C. and Liu, R. J. and Shang, R. H.},
  title     = {A Multi-Level Attention Model for Remote Sensing Image Captions},
  journal   = RS,
  volume    = {12},
  year      = {2020},
  number    = {6},
  bibsource = {http://www.visionbib.com/bibliography/match607rsic2.html#TT129085}
}

@article{bb133046,
  author    = {Li, X. L. and Zhang, X. T. and Huang, W. and Wang, Q.},
  title     = {Truncation Cross Entropy Loss for Remote Sensing Image Captioning},
  journal   = GeoRS,
  volume    = {59},
  year      = {2021},
  number    = {6},
  month     = jun,
  pages     = {5246--5257},
  bibsource = {http://www.visionbib.com/bibliography/match607rsic2.html#TT129086}
}

@article{bb133047,
  author    = {Sumbul, G. and Nayak, S. and Demir, B.},
  title     = {{SD-RSIC}: Summarization-Driven Deep Remote Sensing Image Captioning},
  journal   = GeoRS,
  volume    = {59},
  year      = {2021},
  number    = {8},
  month     = aug,
  pages     = {6922--6934},
  bibsource = {http://www.visionbib.com/bibliography/match607rsic2.html#TT129087}
}

@article{bb133048,
  author    = {Wang, Q. and Huang, W. and Zhang, X. T. and Li, X. L.},
  title     = {Word-Sentence Framework for Remote Sensing Image Captioning},
  journal   = GeoRS,
  volume    = {59},
  year      = {2021},
  number    = {12},
  month     = dec,
  pages     = {10532--10543},
  bibsource = {http://www.visionbib.com/bibliography/match607rsic2.html#TT129088}
}

@article{bb133049,
  author    = {Yang, Q. Q. and Ni, Z. H. and Ren, P.},
  title     = {Meta captioning: A meta learning based remote sensing image captioning framework},
  journal   = PandRS,
  volume    = {186},
  year      = {2022},
  pages     = {190--200},
  bibsource = {http://www.visionbib.com/bibliography/match607rsic2.html#TT129089}
}

@article{bb133050,
  author    = {Liu, Z. Y. and Dong, A. M. and Yu, J. G. and Han, Y. B. and Zhou, Y. and Zhao, K.},
  title     = {Scene classification for remote sensing images with self-attention augmented {CNN}},
  journal   = IET-IPR,
  volume    = {16},
  year      = {2022},
  number    = {11},
  pages     = {3085--3096},
  bibsource = {http://www.visionbib.com/bibliography/match607rsic2.html#TT129090}
}

% NOTE(review): the source data carried the placeholder pages "xx-yy", which
% would print literally in a bibliography; the field is omitted until the real
% article number or page range is known.
@article{bb133051,
  author    = {Zhou, H. and Du, X. P. and Xia, L. and Li, S.},
  title     = {Self-Learning for Few-Shot Remote Sensing Image Captioning},
  journal   = RS,
  volume    = {14},
  year      = {2022},
  number    = {18},
  bibsource = {http://www.visionbib.com/bibliography/match607rsic2.html#TT129091}
}

@article{bb133052,
  author    = {Wang, Q. and Huang, W. and Zhang, X. T. and Li, X. L.},
  title     = {{GLCM}: Global-Local Captioning Model for Remote Sensing Image Captioning},
  journal   = Cyber,
  volume    = {53},
  year      = {2023},
  number    = {11},
  month     = nov,
  pages     = {6910--6922},
  bibsource = {http://www.visionbib.com/bibliography/match607rsic2.html#TT129092}
}

@article{bb133053,
  author    = {Cheng, Q. and Xu, Y. Q. and Huang, Z. Y.},
  title     = {{VCC-DiffNet}: Visual Conditional Control Diffusion Network for Remote Sensing Image Captioning},
  journal   = RS,
  volume    = {16},
  year      = {2024},
  number    = {16},
  pages     = {2961},
  bibsource = {http://www.visionbib.com/bibliography/match607rsic2.html#TT129093}
}

@article{bb133054,
  author    = {Li, Y. P. and Zhang, X. R. and Zhang, T. Y. and Wang, G. C. and Wang, X. L. and Li, S.},
  title     = {A Patch-Level Region-Aware Module with a Multi-Label Framework for Remote Sensing Image Captioning},
  journal   = RS,
  volume    = {16},
  year      = {2024},
  number    = {21},
  pages     = {3987},
  bibsource = {http://www.visionbib.com/bibliography/match607rsic2.html#TT129094}
}

@article{bb133055,
  author    = {Zhang, K. and Li, P. and Wang, J. Q.},
  title     = {A Review of Deep Learning-Based Remote Sensing Image Caption: Methods, Models, Comparisons and Future Directions},
  journal   = RS,
  volume    = {16},
  year      = {2024},
  number    = {21},
  pages     = {4113},
  bibsource = {http://www.visionbib.com/bibliography/match607rsic2.html#TT129095}
}

@article{bb133056,
  author    = {Leng, G. and Xiong, Y. J. and Qiu, C. P. and Guo, C. Z.},
  title     = {Discrete diffusion models with Refined Language-Image Pre-trained representations for remote sensing image captioning},
  journal   = PRL,
  volume    = {186},
  year      = {2024},
  pages     = {164--169},
  bibsource = {http://www.visionbib.com/bibliography/match607rsic2.html#TT129096}
}

@article{bb133057,
  author    = {Guo, Z. and Liu, H. M. and Ren, Z. and Jiao, L. C. and Gou, S. P. and Li, R. M.},
  title     = {Attribute-Based Learning for Remote Sensing Image Captioning in Unseen Scenes},
  journal   = RS,
  volume    = {17},
  year      = {2025},
  number    = {7},
  pages     = {1237},
  bibsource = {http://www.visionbib.com/bibliography/match607rsic2.html#TT129097}
}

@inproceedings{bb133058,
  author    = {Wei, Y. C. and Li, L. and Geng, S. L.},
  title     = {Remote Sensing Image Captioning Using {Hire-MLP}},
  booktitle = CVIDL23,
  year      = {2023},
  pages     = {109--112},
  bibsource = {http://www.visionbib.com/bibliography/match607rsic2.html#TT129098}
}

@inproceedings{bb133059,
  author    = {Chavhan, R. and Banerjee, B. and Zhu, X. X. and Chaudhuri, S.},
  title     = {A Novel Actor Dual-Critic Model for Remote Sensing Image Captioning},
  booktitle = ICPR21,
  year      = {2021},
  pages     = {4918--4925},
  bibsource = {http://www.visionbib.com/bibliography/match607rsic2.html#TT129099}
}

@article{bb133060,
  author    = {Nakayama, H. and Harada, T. and Kuniyoshi, Y.},
  title     = {Dense Sampling Low-Level Statistics of Local Features},
  journal   = IEICE,
  volume    = {E93-D},
  year      = {2010},
  number    = {7},
  month     = jul,
  pages     = {1727--1736},
  bibsource = {http://www.visionbib.com/bibliography/match607ian2.html#TT129100}
}

% NOTE(review): this entry has the same title and the same bibsource anchor
% (TT129100) as bb133060 but lists the authors in reverse order; presumably it
% is the earlier conference version of that article. Confirm the author order.
@inproceedings{bb133061,
  author    = {Kuniyoshi, Y. and Harada, T. and Nakayama, H.},
  title     = {Dense Sampling Low-Level Statistics of Local Features},
  booktitle = CIVR09,
  year      = {2009},
  pages     = {Article No 17},
  bibsource = {http://www.visionbib.com/bibliography/match607ian2.html#TT129100}
}

@inproceedings{bb133062,
  author    = {Nakayama, H. and Harada, T. and Kuniyoshi, Y.},
  title     = {Global {Gaussian} approach for scene categorization using information geometry},
  booktitle = CVPR10,
  year      = {2010},
  pages     = {2336--2343},
  bibsource = {http://www.visionbib.com/bibliography/match607ian2.html#TT129101}
}

@inproceedings{bb133063,
  author    = {Nakayama, H. and Harada, T. and Kuniyoshi, Y.},
  title     = {{AI Goggles}: Real-time Description and Retrieval in the Real World with Online Learning},
  booktitle = CRV09,
  year      = {2009},
  pages     = {184--191},
  bibsource = {http://www.visionbib.com/bibliography/match607ian2.html#TT129102}
}

@inproceedings{bb133064,
  author    = {Ushiku, Y. and Yamaguchi, M. and Mukuta, Y. and Harada, T.},
  title     = {Common Subspace for Model and Similarity: Phrase Learning for Caption Generation from Images},
  booktitle = ICCV15,
  year      = {2015},
  pages     = {2668--2676},
  bibsource = {http://www.visionbib.com/bibliography/match607ian2.html#TT129103}
}

@inproceedings{bb133065,
  author    = {Harada, T. and Nakayama, H. and Kuniyoshi, Y.},
  title     = {Improving Local Descriptors by Embedding Global and Local Spatial Information},
  booktitle = ECCV10,
  year      = {2010},
  pages     = {IV: 736--749},
  bibsource = {http://www.visionbib.com/bibliography/match607ian2.html#TT129104}
}

% NOTE(review): the source data carried the placeholder pages "xx-yy", which
% would print literally in a bibliography; the field is omitted until the real
% page range is known.
@inproceedings{bb133066,
  author    = {Nakayama, H. and Harada, T. and Kuniyoshi, Y.},
  title     = {Evaluation of dimensionality reduction methods for image auto-annotation},
  booktitle = BMVC10,
  year      = {2010},
  bibsource = {http://www.visionbib.com/bibliography/match607ian2.html#TT129105}
}

@inproceedings{bb133067,
  author    = {Jin, J. and Nakayama, H.},
  title     = {Annotation order matters: Recurrent Image Annotator for arbitrary length image tagging},
  booktitle = ICPR16,
  year      = {2016},
  pages     = {2452--2457},
  bibsource = {http://www.visionbib.com/bibliography/match607ian2.html#TT129106}
}

@article{bb133068,
  author    = {Tariq, A. and Foroosh, H.},
  title     = {A Context-Driven Extractive Framework for Generating Realistic Image Descriptions},
  journal   = IP,
  volume    = {26},
  year      = {2017},
  number    = {2},
  month     = feb,
  pages     = {619--632},
  bibsource = {http://www.visionbib.com/bibliography/match607ian2.html#TT129107}
}

@article{bb133069,
  author    = {Cheng, Q. and Zhang, Q. and Fu, P. and Tu, C. H. and Li, S.},
  title     = {A survey and analysis on automatic image annotation},
  journal   = PR,
  volume    = {79},
  year      = {2018},
  pages     = {242--259},
  bibsource = {http://www.visionbib.com/bibliography/match607ian2.html#TT129108}
}

@article{bb133070,
  author    = {Ben Rejeb, I. and Ouni, S. and Barhoumi, W. and Zagrouba, E.},
  title     = {Fuzzy {VA-Files} for multi-label image annotation based on visual content of regions},
  journal   = SIViP,
  volume    = {12},
  year      = {2018},
  number    = {5},
  month     = jul,
  pages     = {877--884},
  bibsource = {http://www.visionbib.com/bibliography/match607ian2.html#TT129109}
}

@article{bb133071,
  author    = {Helmy, T.},
  title     = {A Generic Framework for Semantic Annotation of Images},
  journal   = IJIG,
  volume    = {18},
  year      = {2018},
  number    = {3},
  month     = jul,
  pages     = {Article 1850013},
  bibsource = {http://www.visionbib.com/bibliography/match607ian2.html#TT129110}
}

@article{bb133072,
  author    = {Hu, J. and Lam, K. M. and Lou, P. and Liu, Q. and Deng, W. P.},
  title     = {Can a machine have two systems for recognition, like human beings?},
  journal   = JVCIR,
  volume    = {56},
  year      = {2018},
  pages     = {275--286},
  bibsource = {http://www.visionbib.com/bibliography/match607ian2.html#TT129111}
}

@article{bb133073,
  author    = {Bhagat, P. K. and Choudhary, P.},
  title     = {Image annotation: Then and now},
  journal   = IVC,
  volume    = {80},
  year      = {2018},
  pages     = {1--23},
  bibsource = {http://www.visionbib.com/bibliography/match607ian2.html#TT129112}
}

@article{bb133074,
  author    = {Bazrafkan, S. and Javidnia, H. and Corcoran, P.},
  title     = {Latent space mapping for generation of object elements with corresponding data annotation},
  journal   = PRL,
  volume    = {116},
  year      = {2018},
  pages     = {179--186},
  bibsource = {http://www.visionbib.com/bibliography/match607ian2.html#TT129113}
}

@article{bb133075,
  author    = {Jiu, M. Y. and Sahbi, H.},
  title     = {Deep representation design from deep kernel networks},
  journal   = PR,
  volume    = {88},
  year      = {2019},
  pages     = {447--457},
  bibsource = {http://www.visionbib.com/bibliography/match607ian2.html#TT129114}
}

@article{bb133076,
  author    = {Foumani, S. N. M. and Nickabadi, A.},
  title     = {A probabilistic topic model using deep visual word representation for simultaneous image classification and annotation},
  journal   = JVCIR,
  volume    = {59},
  year      = {2019},
  pages     = {195--203},
  bibsource = {http://www.visionbib.com/bibliography/match607ian2.html#TT129115}
}

@article{bb133077,
  author    = {Zhang, J. J. and Wu, Q. and Zhang, J. and Shen, C. H. and Lu, J. F. and Wu, Q. A.},
  title     = {Heritage image annotation via collective knowledge},
  journal   = PR,
  volume    = {93},
  year      = {2019},
  pages     = {204--214},
  bibsource = {http://www.visionbib.com/bibliography/match607ian2.html#TT129116}
}

@article{bb133078,
  author    = {Verma, Y.},
  title     = {Diverse image annotation with missing labels},
  journal   = PR,
  volume    = {93},
  year      = {2019},
  pages     = {470--484},
  bibsource = {http://www.visionbib.com/bibliography/match607ian2.html#TT129117}
}

@article{bb133079,
  author    = {Markatopoulou, F. and Mezaris, V. and Patras, I.},
  title     = {Implicit and Explicit Concept Relations in Deep Neural Networks for Multi-Label Video/Image Annotation},
  journal   = CirSysVideo,
  volume    = {29},
  year      = {2019},
  number    = {6},
  month     = jun,
  pages     = {1631--1644},
  bibsource = {http://www.visionbib.com/bibliography/match607ian2.html#TT129118}
}

@article{bb133080,
  author    = {Laib, L. and Allili, M. S. and Ait Aoudia, S.},
  title     = {A probabilistic topic model for event-based image classification and multi-label annotation},
  journal   = SP:IC,
  volume    = {76},
  year      = {2019},
  pages     = {283--294},
  bibsource = {http://www.visionbib.com/bibliography/match607ian2.html#TT129119}
}

@article{bb133081,
  author    = {Olaode, A. and Naghdy, G.},
  title     = {Review of the application of machine learning to the automatic semantic annotation of images},
  journal   = IET-IPR,
  volume    = {13},
  year      = {2019},
  number    = {8},
  month     = jun,
  pages     = {1232--1245},
  bibsource = {http://www.visionbib.com/bibliography/match607ian2.html#TT129120}
}

@article{bb133082,
  author    = {Zhang, C. J. and Cheng, J. and Tian, Q.},
  title     = {Multiview, Few-Labeled Object Categorization by Predicting Labels With View Consistency},
  journal   = Cyber,
  volume    = {49},
  year      = {2019},
  number    = {11},
  month     = nov,
  pages     = {3834--3843},
  bibsource = {http://www.visionbib.com/bibliography/match607ian2.html#TT129121}
}

@article{bb133083,
  author    = {Tang, C. and Liu, X. W. and Wang, P. C. and Zhang, C. Q. and Li, M. M. and Wang, L. Z.},
  title     = {Adaptive Hypergraph Embedded Semi-Supervised Multi-Label Image Annotation},
  journal   = MultMed,
  volume    = {21},
  year      = {2019},
  number    = {11},
  month     = nov,
  pages     = {2837--2849},
  bibsource = {http://www.visionbib.com/bibliography/match607ian2.html#TT129122}
}

@article{bb133084,
  author    = {Mundnich, K. and Booth, B. M. and Girault, B. and Narayanan, S.},
  title     = {Generating labels for regression of subjective constructs using triplet embeddings},
  journal   = PRL,
  volume    = {128},
  year      = {2019},
  pages     = {385--392},
  bibsource = {http://www.visionbib.com/bibliography/match607ian2.html#TT129123}
}

@article{bb133085,
        AUTHOR = "Chaudhary, C. and Goyal, P. and Prasad, D.N. and Chen, Y.P.",
        TITLE = "Enhancing the Quality of Image Tagging Using a Visio-Textual
Knowledge Base",
        JOURNAL = MultMed,
        VOLUME = "22",
        YEAR = "2020",
        NUMBER = "4",
        MONTH = apr,
        PAGES = "897--911",
        BIBSOURCE = "http://www.visionbib.com/bibliography/match607ian2.html#TT129124"}

@article{bb133086,
        AUTHOR = "Khatchatoorian, A.G. and Jamzad, M.",
        TITLE = "Architecture to improve the accuracy of automatic image annotation
systems",
        JOURNAL = IET-CV,
        VOLUME = "14",
        YEAR = "2020",
        NUMBER = "5",
        MONTH = aug,
        PAGES = "214--223",
        BIBSOURCE = "http://www.visionbib.com/bibliography/match607ian2.html#TT129125"}

@article{bb133087,
        AUTHOR = "Theodosiou, Z. and Tsapatsoulis, N.",
        TITLE = "Image annotation: the effects of content, lexicon and annotation method",
        JOURNAL = MultInfoRetr,
        VOLUME = "9",
        YEAR = "2020",
        NUMBER = "3",
        MONTH = sep,
        PAGES = "191--203",
        BIBSOURCE = "http://www.visionbib.com/bibliography/match607ian2.html#TT129126"}

@article{bb133088,
        AUTHOR = "Haghighi, F. and Taher, M.R.H. and Zhou, Z.W. and Gotway, M.B. and Liang, J.M.",
        TITLE = "Transferable Visual Words: Exploiting the Semantics of Anatomical
Patterns for Self-Supervised Learning",
        JOURNAL = MedImg,
        VOLUME = "40",
        YEAR = "2021",
        NUMBER = "10",
        MONTH = oct,
        PAGES = "2857--2868",
        BIBSOURCE = "http://www.visionbib.com/bibliography/match607ian2.html#TT129127"}

% Braces around StyleGAN keep its mixed-case spelling when a style sentence-cases the title.
@article{bb133089,
        AUTHOR = "Hochberg, D.C. and Greenspan, H. and Giryes, R.",
        TITLE = "A Self Supervised {StyleGAN} for Image Annotation and Classification
With Extremely Limited Labels",
        JOURNAL = MedImg,
        VOLUME = "41",
        YEAR = "2022",
        NUMBER = "12",
        MONTH = dec,
        PAGES = "3509--3519",
        BIBSOURCE = "http://www.visionbib.com/bibliography/match607ian2.html#TT129128"}

@inproceedings{bb133090,
        AUTHOR = "Lahtinen, T. and Turtiainen, H. and Costin, A.",
        TITLE = "Brima: Low-Overhead Browser-Only Image Annotation Tool (Preprint)",
        BOOKTITLE = ICIP21,
        YEAR = "2021",
        PAGES = "2633--2637",
        BIBSOURCE = "http://www.visionbib.com/bibliography/match607ian2.html#TT129129"}

@inproceedings{bb133091,
        AUTHOR = "Lotfi, F. and Jamzad, M. and Beigy, H.",
        TITLE = "Automatic Image Annotation using Tag Relations and Graph
Convolutional Networks",
        BOOKTITLE = IPRIA21,
        YEAR = "2021",
        PAGES = "1--6",
        BIBSOURCE = "http://www.visionbib.com/bibliography/match607ian2.html#TT129130"}

@inproceedings{bb133092,
        AUTHOR = "Chen, X.Y. and Jiang, M. and Zhao, Q.",
        TITLE = "Self-Distillation for Few-Shot Image Captioning",
        BOOKTITLE = WACV21,
        YEAR = "2021",
        PAGES = "545--555",
        BIBSOURCE = "http://www.visionbib.com/bibliography/match607ian2.html#TT129131"}

@inproceedings{bb133093,
        AUTHOR = "Jiu, M. and Sahbi, H.",
        TITLE = "End-to-End Deep Kernel Map Design for Image Annotation",
        BOOKTITLE = ICIP20,
        YEAR = "2020",
        PAGES = "1546--1550",
        BIBSOURCE = "http://www.visionbib.com/bibliography/match607ian2.html#TT129132"}

% Braces around BISON keep the acronym uppercase when a style sentence-cases the title.
@inproceedings{bb133094,
        AUTHOR = "Hu, H. and Misra, I. and van der Maaten, L.",
        TITLE = "Evaluating Text-to-Image Matching using Binary Image Selection
({BISON})",
        BOOKTITLE = CLVL19,
        YEAR = "2019",
        PAGES = "1887--1890",
        BIBSOURCE = "http://www.visionbib.com/bibliography/match607ian2.html#TT129133"}

% Braces around ViCo keep its mixed-case spelling when a style sentence-cases the title.
@inproceedings{bb133095,
        AUTHOR = "Gupta, T. and Schwing, A.G. and Hoiem, D.",
        TITLE = "{ViCo}: Word Embeddings From Visual Co-Occurrences",
        BOOKTITLE = ICCV19,
        YEAR = "2019",
        PAGES = "7424--7433",
        BIBSOURCE = "http://www.visionbib.com/bibliography/match607ian2.html#TT129134"}

% Braces around the pronoun I stop sentence-casing styles from rendering it as "i".
@inproceedings{bb133096,
        AUTHOR = "Bracha, L. and Chechik, G.",
        TITLE = "Informative Object Annotations: Tell Me Something {I} Don't Know",
        BOOKTITLE = CVPR19,
        YEAR = "2019",
        PAGES = "12499--12507",
        BIBSOURCE = "http://www.visionbib.com/bibliography/match607ian2.html#TT129135"}

@inproceedings{bb133097,
        AUTHOR = "Rapson, C.J. and Seet, B. and Naeem, M.A. and Lee, J.E. and Al Sarayreh, M. and Klette, R.",
        TITLE = "Reducing the Pain: A Novel Tool for Efficient Ground-Truth Labelling
in Images",
        BOOKTITLE = IVCNZ18,
        YEAR = "2018",
        PAGES = "1--9",
        BIBSOURCE = "http://www.visionbib.com/bibliography/match607ian2.html#TT129136"}

@inproceedings{bb133098,
        AUTHOR = "Wu, B.Y. and Chen, W.D. and Sun, P. and Liu, W. and Ghanem, B. and Lyu, S.W.",
        TITLE = "Tagging Like Humans: Diverse and Distinct Image Annotation",
        BOOKTITLE = CVPR18,
        YEAR = "2018",
        PAGES = "7967--7975",
        BIBSOURCE = "http://www.visionbib.com/bibliography/match607ian2.html#TT129137"}

@inproceedings{bb133099,
        AUTHOR = "Wu, X.J. and Zhang, L. and Li, F.Z. and Wang, B.J.",
        TITLE = "A Novel Model for Multi-label Image Annotation",
        BOOKTITLE = ICPR18,
        YEAR = "2018",
        PAGES = "1953--1958",
        BIBSOURCE = "http://www.visionbib.com/bibliography/match607ian2.html#TT129138"}

Last update: Oct 6, 2025 at 14:07:43