% NOTE(review): the sibling entries by these three authors list Nakayama first; confirm this author order against the paper.
@inproceedings{bb95300,
  author    = {Kuniyoshi, Y. and Harada, T. and Nakayama, H.},
  title     = {Dense Sampling Low-Level Statistics of Local Features},
  booktitle = CIVR09,
  pages     = {Article No 17},
  year      = {2009},
  bibsource = {http://www.visionbib.com/bibliography/match607ic1.html#TT91826},
}

@inproceedings{bb95301,
  author    = {Nakayama, H. and Harada, T. and Kuniyoshi, Y.},
  title     = {Global {Gaussian} approach for scene categorization using information geometry},
  booktitle = CVPR10,
  pages     = {2336--2343},
  year      = {2010},
  bibsource = {http://www.visionbib.com/bibliography/match607ic1.html#TT91827},
}

@inproceedings{bb95302,
  author    = {Nakayama, H. and Harada, T. and Kuniyoshi, Y.},
  title     = {{AI} Goggles: Real-time Description and Retrieval in the Real World with Online Learning},
  booktitle = CRV09,
  pages     = {184--191},
  year      = {2009},
  bibsource = {http://www.visionbib.com/bibliography/match607ic1.html#TT91828},
}

@inproceedings{bb95303,
  author    = {Ushiku, Y. and Yamaguchi, M. and Mukuta, Y. and Harada, T.},
  title     = {Common Subspace for Model and Similarity: Phrase Learning for Caption Generation from Images},
  booktitle = ICCV15,
  pages     = {2668--2676},
  year      = {2015},
  bibsource = {http://www.visionbib.com/bibliography/match607ic1.html#TT91829},
}

@inproceedings{bb95304,
  author    = {Jin, J. and Nakayama, H.},
  title     = {Annotation order matters: Recurrent Image Annotator for arbitrary length image tagging},
  booktitle = ICPR16,
  pages     = {2452--2457},
  year      = {2016},
  bibsource = {http://www.visionbib.com/bibliography/match607ic1.html#TT91830},
}

@inproceedings{bb95305,
  author    = {Harada, T. and Nakayama, H. and Kuniyoshi, Y.},
  title     = {Improving Local Descriptors by Embedding Global and Local Spatial Information},
  booktitle = ECCV10,
  pages     = {IV: 736--749},
  year      = {2010},
  bibsource = {http://www.visionbib.com/bibliography/match607ic1.html#TT91831},
}

% NOTE(review): the source carried the placeholder page range "xx-yy"; it is omitted here so it is not printed. Add the real pages once known.
@inproceedings{bb95306,
  author    = {Nakayama, H. and Harada, T. and Kuniyoshi, Y.},
  title     = {Evaluation of dimensionality reduction methods for image auto-annotation},
  booktitle = BMVC10,
  year      = {2010},
  bibsource = {http://www.visionbib.com/bibliography/match607ic1.html#TT91832},
}

@article{bb95307,
  author    = {Verma, Y. and Jawahar, C. V.},
  title     = {A support vector approach for cross-modal search of images and texts},
  journal   = CVIU,
  volume    = {154},
  number    = {1},
  pages     = {48--63},
  year      = {2017},
  bibsource = {http://www.visionbib.com/bibliography/match607ic1.html#TT91833},
}

@article{bb95308,
  author    = {Xue, J. F. and Eguchi, K.},
  title     = {Video Data Modeling Using Sequential Correspondence Hierarchical {Dirichlet} Processes},
  journal   = IEICE,
  volume    = {E100-D},
  number    = {1},
  pages     = {33--41},
  month     = {January},
  year      = {2017},
  bibsource = {http://www.visionbib.com/bibliography/match607ic1.html#TT91834},
}

@article{bb95309,
  author    = {Tariq, A. and Foroosh, H.},
  title     = {A Context-Driven Extractive Framework for Generating Realistic Image Descriptions},
  journal   = IP,
  volume    = {26},
  number    = {2},
  pages     = {619--632},
  month     = {February},
  year      = {2017},
  bibsource = {http://www.visionbib.com/bibliography/match607ic1.html#TT91835},
}

@article{bb95310,
  author    = {Vinyals, O. and Toshev, A. and Bengio, S. and Erhan, D.},
  title     = {Show and Tell: Lessons Learned from the 2015 {MSCOCO} Image Captioning Challenge},
  journal   = PAMI,
  volume    = {39},
  number    = {4},
  pages     = {652--663},
  month     = {April},
  year      = {2017},
  bibsource = {http://www.visionbib.com/bibliography/match607ic1.html#TT91836},
}

@inproceedings{bb95311,
  author    = {Vinyals, O. and Toshev, A. and Bengio, S. and Erhan, D.},
  title     = {Show and tell: A neural image caption generator},
  booktitle = CVPR15,
  pages     = {3156--3164},
  year      = {2015},
  bibsource = {http://www.visionbib.com/bibliography/match607ic1.html#TT91837},
}

@article{bb95312,
  author    = {Gao, L. and Guo, Z. and Zhang, H. and Xu, X. and Shen, H. T.},
  title     = {Video Captioning With Attention-Based {LSTM} and Semantic Consistency},
  journal   = MultMed,
  volume    = {19},
  number    = {9},
  pages     = {2045--2055},
  month     = {September},
  year      = {2017},
  bibsource = {http://www.visionbib.com/bibliography/match607ic1.html#TT91838},
}

@article{bb95313,
  author    = {Hu, M. and Yang, Y. and Shen, F. and Zhang, L. and Shen, H. T. and Li, X.},
  title     = {Robust Web Image Annotation via Exploring Multi-Facet and Structural Knowledge},
  journal   = IP,
  volume    = {26},
  number    = {10},
  pages     = {4871--4884},
  month     = {October},
  year      = {2017},
  bibsource = {http://www.visionbib.com/bibliography/match607ic1.html#TT91839},
}

@article{bb95314,
  author    = {Bin, Y. and Yang, Y. and Shen, F. and Xie, N. and Shen, H. T. and Li, X.},
  title     = {Describing Video With Attention-Based Bidirectional {LSTM}},
  journal   = Cyber,
  volume    = {49},
  number    = {7},
  pages     = {2631--2641},
  month     = {July},
  year      = {2019},
  bibsource = {http://www.visionbib.com/bibliography/match607ic1.html#TT91840},
}

@article{bb95315,
  author    = {Wang, J. Y. and Zhu, X. T. and Gong, S. G.},
  title     = {Discovering visual concept structure with sparse and incomplete tags},
  journal   = AI,
  volume    = {250},
  number    = {1},
  pages     = {16--36},
  year      = {2017},
  bibsource = {http://www.visionbib.com/bibliography/match607ic1.html#TT91841},
}

@article{bb95316,
  author    = {Kilickaya, M. and Akkus, B. K. and Cakici, R. and Erdem, A. and Erdem, E. and Ikizler Cinbis, N.},
  title     = {Data-driven image captioning via salient region discovery},
  journal   = IET-CV,
  volume    = {11},
  number    = {6},
  pages     = {398--406},
  month     = {September},
  year      = {2017},
  bibsource = {http://www.visionbib.com/bibliography/match607ic1.html#TT91842},
}

@article{bb95317,
  author    = {Fu, K. and Jin, J. Q. and Cui, R. P. and Sha, F. and Zhang, C. S.},
  title     = {Aligning Where to See and What to Tell: Image Captioning with Region-Based Attention and Scene-Specific Contexts},
  journal   = PAMI,
  volume    = {39},
  number    = {12},
  pages     = {2321--2334},
  month     = {December},
  year      = {2017},
  bibsource = {http://www.visionbib.com/bibliography/match607ic1.html#TT91843},
}

@article{bb95318,
  author    = {Liu, A. A. and Xu, N. and Wong, Y. and Li, J. and Su, Y. T. and Kankanhalli, M.},
  title     = {Hierarchical \& multimodal video captioning: Discovering and transferring multimodal knowledge for vision to language},
  journal   = CVIU,
  volume    = {163},
  number    = {1},
  pages     = {113--125},
  year      = {2017},
  bibsource = {http://www.visionbib.com/bibliography/match607ic1.html#TT91844},
}

@article{bb95319,
  author    = {Nian, F. D. and Li, T. and Wang, Y. and Wu, X. Y. and Ni, B. B. and Xu, C. S.},
  title     = {Learning explicit video attributes from mid-level representation for video captioning},
  journal   = CVIU,
  volume    = {163},
  number    = {1},
  pages     = {126--138},
  year      = {2017},
  bibsource = {http://www.visionbib.com/bibliography/match607ic1.html#TT91845},
}

@article{bb95320,
  author    = {He, X. D. and Deng, L.},
  title     = {Deep Learning for Image-to-Text Generation: A Technical Overview},
  journal   = SPMag,
  volume    = {34},
  number    = {6},
  pages     = {109--116},
  month     = {November},
  year      = {2017},
  bibsource = {http://www.visionbib.com/bibliography/match607ic1.html#TT91846},
}

% NOTE(review): same title and bibsource anchor as bb95320, with a single page in the following volume; presumably a follow-up notice for that article. Confirm this is not an unintended duplicate.
@article{bb95321,
  author    = {Deng, L. and He, X. D.},
  title     = {Deep Learning for Image-to-Text Generation: A Technical Overview},
  journal   = SPMag,
  volume    = {35},
  number    = {1},
  pages     = {178},
  month     = {January},
  year      = {2018},
  bibsource = {http://www.visionbib.com/bibliography/match607ic1.html#TT91846},
}

@article{bb95322,
  author    = {Li, L. H. and Tang, S. and Zhang, Y. D. and Deng, L. X. and Tian, Q.},
  title     = {{GLA}: Global-Local Attention for Image Description},
  journal   = MultMed,
  volume    = {20},
  number    = {3},
  pages     = {726--737},
  month     = {March},
  year      = {2018},
  bibsource = {http://www.visionbib.com/bibliography/match607ic1.html#TT91847},
}

@article{bb95323,
  author    = {Guan, J. N. and Wang, E.},
  title     = {Repeated review based image captioning for image evidence review},
  journal   = SP:IC,
  volume    = {63},
  pages     = {141--148},
  year      = {2018},
  bibsource = {http://www.visionbib.com/bibliography/match607ic1.html#TT91848},
}

@article{bb95324,
  author    = {Lu, X. and Wang, B. and Zheng, X. and Li, X.},
  title     = {Exploring Models and Data for Remote Sensing Image Caption Generation},
  journal   = GeoRS,
  volume    = {56},
  number    = {4},
  pages     = {2183--2195},
  month     = {April},
  year      = {2018},
  bibsource = {http://www.visionbib.com/bibliography/match607ic1.html#TT91849},
}

@article{bb95325,
  author    = {Cheng, Q. and Zhang, Q. and Fu, P. and Tu, C. H. and Li, S.},
  title     = {A survey and analysis on automatic image annotation},
  journal   = PR,
  volume    = {79},
  pages     = {242--259},
  year      = {2018},
  bibsource = {http://www.visionbib.com/bibliography/match607ic1.html#TT91850},
}

@article{bb95326,
  author    = {Ben Rejeb, I. and Ouni, S. and Barhoumi, W. and Zagrouba, E.},
  title     = {Fuzzy {VA-Files} for multi-label image annotation based on visual content of regions},
  journal   = SIViP,
  volume    = {12},
  number    = {5},
  pages     = {877--884},
  month     = {July},
  year      = {2018},
  bibsource = {http://www.visionbib.com/bibliography/match607ic1.html#TT91851},
}

@article{bb95327,
  author    = {Helmy, T.},
  title     = {A Generic Framework for Semantic Annotation of Images},
  journal   = IJIG,
  volume    = {18},
  number    = {3},
  pages     = {Article 1850013},
  month     = {July},
  year      = {2018},
  bibsource = {http://www.visionbib.com/bibliography/match607ic1.html#TT91852},
}

@article{bb95328,
  author    = {Wu, C. L. and Wei, Y. and Chu, X. L. and Su, F. and Wang, L.},
  title     = {Modeling visual and word-conditional semantic attention for image captioning},
  journal   = SP:IC,
  volume    = {67},
  pages     = {100--107},
  year      = {2018},
  bibsource = {http://www.visionbib.com/bibliography/match607ic1.html#TT91853},
}

@article{bb95329,
  author    = {Ye, S. and Han, J. and Liu, N.},
  title     = {Attentive Linear Transformation for Image Captioning},
  journal   = IP,
  volume    = {27},
  number    = {11},
  pages     = {5514--5524},
  month     = {November},
  year      = {2018},
  bibsource = {http://www.visionbib.com/bibliography/match607ic1.html#TT91854},
}

@article{bb95330,
  author    = {Zhang, M. and Yang, Y. and Zhang, H. and Ji, Y. and Shen, H. T. and Chua, T.},
  title     = {More is Better: Precise and Detailed Image Captioning Using Online Positive Recall and Missing Concepts Mining},
  journal   = IP,
  volume    = {28},
  number    = {1},
  pages     = {32--44},
  month     = {January},
  year      = {2019},
  bibsource = {http://www.visionbib.com/bibliography/match607ic1.html#TT91855},
}

@article{bb95331,
  author    = {Hu, J. and Lam, K. M. and Lou, P. and Liu, Q. and Deng, W. P.},
  title     = {Can a machine have two systems for recognition, like human beings?},
  journal   = JVCIR,
  volume    = {56},
  pages     = {275--286},
  year      = {2018},
  bibsource = {http://www.visionbib.com/bibliography/match607ic1.html#TT91856},
}

@article{bb95332,
  author    = {Bhagat, P. K. and Choudhary, P.},
  title     = {Image annotation: Then and now},
  journal   = IVC,
  volume    = {80},
  pages     = {1--23},
  year      = {2018},
  bibsource = {http://www.visionbib.com/bibliography/match607ic1.html#TT91857},
}

@article{bb95333,
  author    = {Gil Gonzalez, J. and Alvarez Meza, A. and Orozco Gutierrez, A.},
  title     = {Learning from multiple annotators using kernel alignment},
  journal   = PRL,
  volume    = {116},
  pages     = {150--156},
  year      = {2018},
  bibsource = {http://www.visionbib.com/bibliography/match607ic1.html#TT91858},
}

@article{bb95334,
  author    = {Bazrafkan, S. and Javidnia, H. and Corcoran, P.},
  title     = {Latent space mapping for generation of object elements with corresponding data annotation},
  journal   = PRL,
  volume    = {116},
  pages     = {179--186},
  year      = {2018},
  bibsource = {http://www.visionbib.com/bibliography/match607ic1.html#TT91859},
}

@article{bb95335,
  author    = {Gella, S. and Keller, F. and Lapata, M.},
  title     = {Disambiguating Visual Verbs},
  journal   = PAMI,
  volume    = {41},
  number    = {2},
  pages     = {311--322},
  month     = {February},
  year      = {2019},
  bibsource = {http://www.visionbib.com/bibliography/match607ic1.html#TT91860},
}

@article{bb95336,
  author    = {Xu, N. and Liu, A. A. and Liu, J. and Nie, W. Z. and Su, Y. T.},
  title     = {Scene graph captioner: Image captioning based on structural visual representation},
  journal   = JVCIR,
  volume    = {58},
  pages     = {477--485},
  year      = {2019},
  bibsource = {http://www.visionbib.com/bibliography/match607ic1.html#TT91861},
}

@article{bb95337,
  author    = {Niu, Y. and Lu, Z. and Wen, J. and Xiang, T. and Chang, S.},
  title     = {Multi-Modal Multi-Scale Deep Learning for Large-Scale Image Annotation},
  journal   = IP,
  volume    = {28},
  number    = {4},
  pages     = {1720--1731},
  month     = {April},
  year      = {2019},
  bibsource = {http://www.visionbib.com/bibliography/match607ic1.html#TT91862},
}

@article{bb95338,
  author    = {Jiu, M. Y. and Sahbi, H.},
  title     = {Deep representation design from deep kernel networks},
  journal   = PR,
  volume    = {88},
  pages     = {447--457},
  year      = {2019},
  bibsource = {http://www.visionbib.com/bibliography/match607ic1.html#TT91863},
}

@article{bb95339,
  author    = {He, X. W. and Shi, B. G. and Bai, X. and Xia, G. S. and Zhang, Z. X. and Dong, W. S.},
  title     = {Image Caption Generation with Part of Speech Guidance},
  journal   = PRL,
  volume    = {119},
  pages     = {229--237},
  year      = {2019},
  bibsource = {http://www.visionbib.com/bibliography/match607ic1.html#TT91864},
}

@article{bb95340,
  author    = {Park, C. C. and Kim, B. and Kim, G.},
  title     = {Towards Personalized Image Captioning via Multimodal Memory Networks},
  journal   = PAMI,
  volume    = {41},
  number    = {4},
  pages     = {999--1012},
  month     = {April},
  year      = {2019},
  bibsource = {http://www.visionbib.com/bibliography/match607ic1.html#TT91865},
}

@inproceedings{bb95341,
  author    = {Park, C. C. and Kim, B. and Kim, G.},
  title     = {Attend to You: Personalized Image Captioning with Context Sequence Memory Networks},
  booktitle = CVPR17,
  pages     = {6432--6440},
  year      = {2017},
  bibsource = {http://www.visionbib.com/bibliography/match607ic1.html#TT91866},
}

@article{bb95342,
  author    = {Xiao, X. Y. and Wang, L. F. and Ding, K. and Xiang, S. M. and Pan, C.},
  title     = {Dense semantic embedding network for image captioning},
  journal   = PR,
  volume    = {90},
  pages     = {285--296},
  year      = {2019},
  bibsource = {http://www.visionbib.com/bibliography/match607ic1.html#TT91867},
}

@article{bb95343,
  author    = {Yang, M. and Zhao, W. and Xu, W. and Feng, Y. and Zhao, Z. and Chen, X. and Lei, K.},
  title     = {Multitask Learning for Cross-Domain Image Captioning},
  journal   = MultMed,
  volume    = {21},
  number    = {4},
  pages     = {1047--1061},
  month     = {April},
  year      = {2019},
  bibsource = {http://www.visionbib.com/bibliography/match607ic1.html#TT91868},
}

@article{bb95344,
  author    = {Foumani, S. N. M. and Nickabadi, A.},
  title     = {A probabilistic topic model using deep visual word representation for simultaneous image classification and annotation},
  journal   = JVCIR,
  volume    = {59},
  pages     = {195--203},
  year      = {2019},
  bibsource = {http://www.visionbib.com/bibliography/match607ic1.html#TT91869},
}

% NOTE(review): the source carried the placeholder page range "xx-yy"; it is omitted here so it is not printed. Add the real pages or article number once known.
@article{bb95345,
  author    = {Zhang, X. R. and Wang, X. and Tang, X. and Zhou, H. Y. and Li, C.},
  title     = {Description Generation for Remote Sensing Images Using Attribute Attention Mechanism},
  journal   = RS,
  volume    = {11},
  number    = {6},
  year      = {2019},
  bibsource = {http://www.visionbib.com/bibliography/match607ic1.html#TT91870},
}

@article{bb95346,
  author    = {Zheng, H. and Wu, J. and Liang, R. and Li, Y. and Li, X.},
  title     = {Multi-task learning for captioning images with novel words},
  journal   = IET-CV,
  volume    = {13},
  number    = {3},
  pages     = {294--301},
  month     = {April},
  year      = {2019},
  bibsource = {http://www.visionbib.com/bibliography/match607ic1.html#TT91871},
}

@article{bb95347,
  author    = {Yu, N. and Hu, X. and Song, B. and Yang, J. and Zhang, J.},
  title     = {Topic-Oriented Image Captioning Based on Order-Embedding},
  journal   = IP,
  volume    = {28},
  number    = {6},
  pages     = {2743--2754},
  month     = {June},
  year      = {2019},
  bibsource = {http://www.visionbib.com/bibliography/match607ic1.html#TT91872},
}

@article{bb95348,
  author    = {Ding, S. T. and Qu, S. and Xi, Y. L. and Sangaiah, A. K. and Wan, S. H.},
  title     = {Image caption generation with high-level image features},
  journal   = PRL,
  volume    = {123},
  pages     = {89--95},
  year      = {2019},
  bibsource = {http://www.visionbib.com/bibliography/match607ic1.html#TT91873},
}

@article{bb95349,
  author    = {Liu, X. X. and Xu, Q. Y. and Wang, N.},
  title     = {A survey on deep neural network-based image captioning},
  journal   = VC,
  volume    = {35},
  number    = {3},
  pages     = {445--470},
  month     = {March},
  year      = {2019},
  bibsource = {http://www.visionbib.com/bibliography/match607ic1.html#TT91874},
}

@article{bb95350,
  author    = {Hossain, M. Z. and Sohel, F. and Shiratuddin, M. F. and Laga, H.},
  title     = {A Comprehensive Survey of Deep Learning for Image Captioning},
  journal   = Surveys,
  volume    = {51},
  number    = {6},
  pages     = {Article No 118},
  month     = {February},
  year      = {2019},
  bibsource = {http://www.visionbib.com/bibliography/match607ic1.html#TT91875},
}

@article{bb95351,
  author    = {Peng, Y. Q. and Liu, X. and Wang, W. H. and Zhao, X. S. and Wei, M.},
  title     = {Image caption model of double {LSTM} with scene factors},
  journal   = IVC,
  volume    = {86},
  pages     = {38--44},
  year      = {2019},
  bibsource = {http://www.visionbib.com/bibliography/match607ic1.html#TT91876},
}

@article{bb95352,
  author    = {Zhang, J. J. and Wu, Q. and Zhang, J. and Shen, C. H. and Lu, J. F. and Wu, Q. A.},
  title     = {Heritage image annotation via collective knowledge},
  journal   = PR,
  volume    = {93},
  pages     = {204--214},
  year      = {2019},
  bibsource = {http://www.visionbib.com/bibliography/match607ic1.html#TT91877},
}

@article{bb95353,
  author    = {Verma, Y.},
  title     = {Diverse image annotation with missing labels},
  journal   = PR,
  volume    = {93},
  pages     = {470--484},
  year      = {2019},
  bibsource = {http://www.visionbib.com/bibliography/match607ic1.html#TT91878},
}

@article{bb95354,
  author    = {Markatopoulou, F. and Mezaris, V. and Patras, I.},
  title     = {Implicit and Explicit Concept Relations in Deep Neural Networks for Multi-Label Video/Image Annotation},
  journal   = CirSysVideo,
  volume    = {29},
  number    = {6},
  pages     = {1631--1644},
  month     = {June},
  year      = {2019},
  bibsource = {http://www.visionbib.com/bibliography/match607ic1.html#TT91879},
}

@article{bb95355,
  author    = {Zhang, Z. J. and Wu, Q. and Wang, Y. and Chen, F.},
  title     = {High-Quality Image Captioning With Fine-Grained and Semantic-Guided Visual Attention},
  journal   = MultMed,
  volume    = {21},
  number    = {7},
  pages     = {1681--1693},
  month     = {July},
  year      = {2019},
  bibsource = {http://www.visionbib.com/bibliography/match607ic1.html#TT91880},
}

@inproceedings{bb95356,
  author    = {Zhang, Z. J. and Wu, Q. and Wang, Y. and Chen, F.},
  title     = {Fine-Grained and Semantic-Guided Visual Attention for Image Captioning},
  booktitle = WACV18,
  pages     = {1709--1717},
  year      = {2018},
  bibsource = {http://www.visionbib.com/bibliography/match607ic1.html#TT91881},
}

@article{bb95357,
  author    = {Laib, L. and Allili, M. S. and Ait Aoudia, S.},
  title     = {A probabilistic topic model for event-based image classification and multi-label annotation},
  journal   = SP:IC,
  volume    = {76},
  pages     = {283--294},
  year      = {2019},
  bibsource = {http://www.visionbib.com/bibliography/match607ic1.html#TT91882},
}

@article{bb95358,
  author    = {Olaode, A. and Naghdy, G.},
  title     = {Review of the application of machine learning to the automatic semantic annotation of images},
  journal   = IET-IPR,
  volume    = {13},
  number    = {8},
  pages     = {1232--1245},
  month     = {June},
  year      = {2019},
  bibsource = {http://www.visionbib.com/bibliography/match607ic1.html#TT91883},
}

@article{bb95359,
  author    = {Li, X. and Jiang, S.},
  title     = {Know More Say Less: Image Captioning Based on Scene Graphs},
  journal   = MultMed,
  volume    = {21},
  number    = {8},
  pages     = {2117--2130},
  month     = {August},
  year      = {2019},
  bibsource = {http://www.visionbib.com/bibliography/match607ic1.html#TT91884},
}

@article{bb95360,
  author    = {Zhang, C. J. and Cheng, J. and Tian, Q.},
  title     = {Multiview, Few-Labeled Object Categorization by Predicting Labels With View Consistency},
  journal   = Cyber,
  volume    = {49},
  number    = {11},
  pages     = {3834--3843},
  month     = {November},
  year      = {2019},
  bibsource = {http://www.visionbib.com/bibliography/match607ic1.html#TT91885},
}

@article{bb95361,
  author    = {Xian, Y. and Tian, Y.},
  title     = {Self-Guiding Multimodal {LSTM}: When We Do Not Have a Perfect Training Dataset for Image Captioning},
  journal   = IP,
  volume    = {28},
  number    = {11},
  pages     = {5241--5252},
  month     = {November},
  year      = {2019},
  bibsource = {http://www.visionbib.com/bibliography/match607ic1.html#TT91886},
}

@article{bb95362,
  author    = {Li, X. and Xu, C. and Wang, X. and Lan, W. and Jia, Z. and Yang, G. and Xu, J.},
  title     = {{COCO-CN} for Cross-Lingual Image Tagging, Captioning, and Retrieval},
  journal   = MultMed,
  volume    = {21},
  number    = {9},
  pages     = {2347--2360},
  month     = {September},
  year      = {2019},
  bibsource = {http://www.visionbib.com/bibliography/match607ic1.html#TT91887},
}

@article{bb95363,
  author    = {Zakharov, N. and Su, H. and Zhu, J. and Glascher, J.},
  title     = {Towards controllable image descriptions with semi-supervised {VAE}},
  journal   = JVCIR,
  volume    = {63},
  pages     = {102574},
  year      = {2019},
  bibsource = {http://www.visionbib.com/bibliography/match607ic1.html#TT91888},
}

@article{bb95364,
  author    = {Tian, C. and Tian, M. and Jiang, M. M. and Liu, H. and Deng, D. H.},
  title     = {How much do cross-modal related semantics benefit image captioning by weighting attributes and re-ranking sentences?},
  journal   = PRL,
  volume    = {125},
  pages     = {639--645},
  year      = {2019},
  bibsource = {http://www.visionbib.com/bibliography/match607ic1.html#TT91889},
}

@inproceedings{bb95365,
  author    = {Wang, Q. Z. and Chan, A. B.},
  title     = {Gated Hierarchical Attention for Image Captioning},
  booktitle = ACCV18,
  pages     = {IV:21--37},
  year      = {2018},
  bibsource = {http://www.visionbib.com/bibliography/match607ic1.html#TT91890},
}

@inproceedings{bb95366,
  author    = {Wang, W. and Chen, Z. H. and Hu, H. F.},
  title     = {Multivariate Attention Network for Image Captioning},
  booktitle = ACCV18,
  pages     = {VI:587--602},
  year      = {2018},
  bibsource = {http://www.visionbib.com/bibliography/match607ic1.html#TT91891},
}

@inproceedings{bb95367,
  author    = {Ghanimifard, M. and Dobnik, S.},
  title     = {Knowing When to Look for What and Where: Evaluating Generation of Spatial Descriptions with Adaptive Attention},
  booktitle = VL18,
  pages     = {IV:153--161},
  year      = {2018},
  bibsource = {http://www.visionbib.com/bibliography/match607ic1.html#TT91892},
}

@inproceedings{bb95368,
  author    = {Kim, B. and Lee, Y. H. and Jung, H. and Cho, C.},
  title     = {Distinctive-Attribute Extraction for Image Captioning},
  booktitle = VL18,
  pages     = {IV:133--144},
  year      = {2018},
  bibsource = {http://www.visionbib.com/bibliography/match607ic1.html#TT91893},
}

@inproceedings{bb95369,
  author    = {Tanti, M. and Gatt, A. and Muscat, A.},
  title     = {Pre-gen Metrics: Predicting Caption Quality Metrics Without Generating Captions},
  booktitle = VL18,
  pages     = {IV:114--123},
  year      = {2018},
  bibsource = {http://www.visionbib.com/bibliography/match607ic1.html#TT91894},
}

@inproceedings{bb95370,
  author    = {Tanti, M. and Gatt, A. and Camilleri, K. P.},
  title     = {Quantifying the Amount of Visual Information Used by Neural Caption Generators},
  booktitle = VL18,
  pages     = {IV:124--132},
  year      = {2018},
  bibsource = {http://www.visionbib.com/bibliography/match607ic1.html#TT91895},
}

@inproceedings{bb95371,
  author    = {Ren, L. and Qi, G. and Hua, K.},
  title     = {Improving Diversity of Image Captioning Through Variational Autoencoders and Adversarial Learning},
  booktitle = WACV19,
  pages     = {263--272},
  year      = {2019},
  bibsource = {http://www.visionbib.com/bibliography/match607ic1.html#TT91896},
}

@inproceedings{bb95372,
  author    = {Zhou, Y. and Sun, Y. and Honavar, V.},
  title     = {Improving Image Captioning by Leveraging Knowledge Graphs},
  booktitle = WACV19,
  pages     = {283--293},
  year      = {2019},
  bibsource = {http://www.visionbib.com/bibliography/match607ic1.html#TT91897},
}

@inproceedings{bb95373,
  author    = {Rapson, C. J. and Seet, B. and Naeem, M. A. and Lee, J. E. and Al Sarayreh, M. and Klette, R.},
  title     = {Reducing the Pain: A Novel Tool for Efficient Ground-Truth Labelling in Images},
  booktitle = IVCNZ18,
  pages     = {1--9},
  year      = {2018},
  bibsource = {http://www.visionbib.com/bibliography/match607ic1.html#TT91898},
}

@inproceedings{bb95374,
  author    = {Lu, J. S. and Yang, J. W. and Batra, D. and Parikh, D.},
  title     = {Neural Baby Talk},
  booktitle = CVPR18,
  pages     = {7219--7228},
  year      = {2018},
  bibsource = {http://www.visionbib.com/bibliography/match607ic1.html#TT91899},
}

@inproceedings{bb95375,
  author    = {Wu, B. Y. and Chen, W. D. and Sun, P. and Liu, W. and Ghanem, B. and Lyu, S. W.},
  title     = {Tagging Like Humans: Diverse and Distinct Image Annotation},
  booktitle = CVPR18,
  pages     = {7967--7975},
  year      = {2018},
  bibsource = {http://www.visionbib.com/bibliography/match607ic1.html#TT91900},
}

@inproceedings{bb95376,
  author    = {Wu, X. J. and Zhang, L. and Li, F. Z. and Wang, B. J.},
  title     = {A Novel Model for Multi-label Image Annotation},
  booktitle = ICPR18,
  pages     = {1953--1958},
  year      = {2018},
  bibsource = {http://www.visionbib.com/bibliography/match607ic1.html#TT91901},
}

@inproceedings{bb95377,
  author    = {Jiu, M. and Sahbi, H. and Qi, L.},
  title     = {Deep Context Networks for Image Annotation},
  booktitle = ICPR18,
  pages     = {2422--2427},
  year      = {2018},
  bibsource = {http://www.visionbib.com/bibliography/match607ic1.html#TT91902},
}

% NOTE(review): the end page 20248 looks like a typo (a 18,000-page span is implausible); value kept as found, verify against the proceedings.
@inproceedings{bb95378,
  author    = {Khademi, M. and Schulte, O.},
  title     = {Image Caption Generation with Hierarchical Contextual Visual Spatial Attention},
  booktitle = Cognitive18,
  pages     = {2024--20248},
  year      = {2018},
  bibsource = {http://www.visionbib.com/bibliography/match607ic1.html#TT91903},
}

@inproceedings{bb95379,
  author    = {Yan, S. and Wu, F. and Smith, J. S. and Lu, W. and Zhang, B.},
  title     = {Image Captioning using Adversarial Networks and Reinforcement Learning},
  booktitle = ICPR18,
  pages     = {248--253},
  year      = {2018},
  bibsource = {http://www.visionbib.com/bibliography/match607ic1.html#TT91904},
}

@inproceedings{bb95380,
  author    = {Wang, F. and Gong, X. and Huang, L.},
  title     = {Time-Dependent Pre-attention Model for Image Captioning},
  booktitle = ICPR18,
  pages     = {3297--3302},
  year      = {2018},
  bibsource = {http://www.visionbib.com/bibliography/match607ic1.html#TT91905},
}

@inproceedings{bb95381,
  author    = {Luo, R. and Shakhnarovich, G. and Cohen, S. and Price, B.},
  title     = {Discriminability Objective for Training Descriptive Captions},
  booktitle = CVPR18,
  pages     = {6964--6974},
  year      = {2018},
  bibsource = {http://www.visionbib.com/bibliography/match607ic1.html#TT91906},
}

@inproceedings{bb95382,
  author    = {Cui, Y. and Yang, G. and Veit, A. and Huang, X. and Belongie, S.},
  title     = {Learning to Evaluate Image Captioning},
  booktitle = CVPR18,
  pages     = {5804--5812},
  year      = {2018},
  bibsource = {http://www.visionbib.com/bibliography/match607ic1.html#TT91907},
}

@inproceedings{bb95383,
  author    = {Aneja, J. and Deshpande, A. and Schwing, A. G.},
  title     = {Convolutional Image Captioning},
  booktitle = CVPR18,
  pages     = {5561--5570},
  year      = {2018},
  bibsource = {http://www.visionbib.com/bibliography/match607ic1.html#TT91908},
}

@inproceedings{bb95384,
  author    = {Chen, F. and Ji, R. and Sun, X. and Wu, Y. and Su, J.},
  title     = {{GroupCap}: Group-Based Image Captioning with Structured Relevance and Diversity Constraints},
  booktitle = CVPR18,
  pages     = {1345--1353},
  year      = {2018},
  bibsource = {http://www.visionbib.com/bibliography/match607ic1.html#TT91909},
}

@inproceedings{bb95385,
        AUTHOR = "Chen, X. and Ma, L. and Jiang, W. and Yao, J. and Liu, W.",
        TITLE = "Regularizing {RNNs} for Caption Generation by Reconstructing the Past
with the Present",
        BOOKTITLE = CVPR18,
        YEAR = "2018",
        PAGES = "7995--8003",
        BIBSOURCE = "http://www.visionbib.com/bibliography/match607ic1.html#TT91910"}

@inproceedings{bb95386,
        AUTHOR = "Yao, T. and Pan, Y. W. and Li, Y. and Mei, T.",
        TITLE = "Exploring Visual Relationship for Image Captioning",
        BOOKTITLE = ECCV18,
        YEAR = "2018",
        PAGES = "XIV: 711--727",
        BIBSOURCE = "http://www.visionbib.com/bibliography/match607ic1.html#TT91911"}

@inproceedings{bb95387,
        AUTHOR = "Shah, S. A. A.",
        TITLE = "{NNEval}: Neural Network Based Evaluation Metric for Image Captioning",
        BOOKTITLE = ECCV18,
        YEAR = "2018",
        PAGES = "VIII: 39--55",
        BIBSOURCE = "http://www.visionbib.com/bibliography/match607ic1.html#TT91912"}

@inproceedings{bb95388,
        AUTHOR = "Jiang, W. H. and Ma, L. and Jiang, Y. G. and Liu, W. and Zhang, T.",
        TITLE = "Recurrent Fusion Network for Image Captioning",
        BOOKTITLE = ECCV18,
        YEAR = "2018",
        PAGES = "II: 510--526",
        BIBSOURCE = "http://www.visionbib.com/bibliography/match607ic1.html#TT91913"}

@inproceedings{bb95389,
        AUTHOR = "Chatterjee, M. and Schwing, A. G.",
        TITLE = "Diverse and Coherent Paragraph Generation from Images",
        BOOKTITLE = ECCV18,
        YEAR = "2018",
        PAGES = "II: 747--763",
        BIBSOURCE = "http://www.visionbib.com/bibliography/match607ic1.html#TT91914"}

@inproceedings{bb95390,
        AUTHOR = "Chen, S. and Zhao, Q.",
        TITLE = "Boosted Attention: Leveraging Human Attention for Image Captioning",
        BOOKTITLE = ECCV18,
        YEAR = "2018",
        PAGES = "XI: 72--88",
        BIBSOURCE = "http://www.visionbib.com/bibliography/match607ic1.html#TT91915"}

@inproceedings{bb95391,
        AUTHOR = "Dai, B. and Ye, D. and Lin, D.",
        TITLE = "Rethinking the Form of Latent States in Image Captioning",
        BOOKTITLE = ECCV18,
        YEAR = "2018",
        PAGES = "VI: 294--310",
        BIBSOURCE = "http://www.visionbib.com/bibliography/match607ic1.html#TT91916"}

@inproceedings{bb95392,
        AUTHOR = "Liu, X. and Li, H. S. and Shao, J. and Chen, D. P. and Wang, X. G.",
        TITLE = "Show, Tell and Discriminate:
Image Captioning by Self-retrieval with Partially Labeled Data",
        BOOKTITLE = ECCV18,
        YEAR = "2018",
        PAGES = "XV: 353--369",
        BIBSOURCE = "http://www.visionbib.com/bibliography/match607ic1.html#TT91917"}

@inproceedings{bb95393,
        AUTHOR = "Fang, F. and Wang, H. and Tang, P.",
        TITLE = "Image Captioning with Word Level Attention",
        BOOKTITLE = ICIP18,
        YEAR = "2018",
        PAGES = "1278--1282",
        BIBSOURCE = "http://www.visionbib.com/bibliography/match607ic1.html#TT91918"}

@inproceedings{bb95394,
        AUTHOR = "Zhu, Z. and Xue, Z. and Yuan, Z.",
        TITLE = "Topic-Guided Attention for Image Captioning",
        BOOKTITLE = ICIP18,
        YEAR = "2018",
        PAGES = "2615--2619",
        BIBSOURCE = "http://www.visionbib.com/bibliography/match607ic1.html#TT91919"}

@inproceedings{bb95395,
        AUTHOR = "Gomez Garay, A. and Raducanu, B. and Salas, J.",
        TITLE = "Dense Captioning of Natural Scenes in {Spanish}",
        BOOKTITLE = MCPR18,
        YEAR = "2018",
        PAGES = "145--154",
        BIBSOURCE = "http://www.visionbib.com/bibliography/match607ic1.html#TT91920"}

@inproceedings{bb95396,
        AUTHOR = "Yao, L. and Ballas, N. and Cho, K. and Smith, J. and Bengio, Y.",
        TITLE = "Oracle Performance for Visual Captioning",
        BOOKTITLE = BMVC16,
        YEAR = "2016",
        INTERNAL-NOTE = "Page range not available; source listed the placeholder xx-yy",
        BIBSOURCE = "http://www.visionbib.com/bibliography/match607ic1.html#TT91921"}

@inproceedings{bb95397,
        AUTHOR = "Khatchatoorian, A. G. and Jamzad, M.",
        TITLE = "Post Rectifying Methods to Improve the Accuracy of Image Annotation",
        BOOKTITLE = DICTA17,
        YEAR = "2017",
        PAGES = "1--7",
        BIBSOURCE = "http://www.visionbib.com/bibliography/match607ic1.html#TT91922"}

@inproceedings{bb95398,
        AUTHOR = "Dong, H. and Zhang, J. Q. and McIlwraith, D. and Guo, Y.",
        TITLE = "{I2T2I}: Learning text to image synthesis with textual data
augmentation",
        BOOKTITLE = ICIP17,
        YEAR = "2017",
        PAGES = "2015--2019",
        BIBSOURCE = "http://www.visionbib.com/bibliography/match607ic1.html#TT91923"}

@inproceedings{bb95399,
        AUTHOR = "Pellegrin, L. and Escalante, H. J. and {Montes y Gomez}, M. and Villegas, M. and Gonzalez, F. A.",
        TITLE = "A Flexible Framework for the Evaluation of Unsupervised Image
Annotation",
        BOOKTITLE = CIARP17,
        YEAR = "2017",
        PAGES = "508--516",
        BIBSOURCE = "http://www.visionbib.com/bibliography/match607ic1.html#TT91924"}

Last update: Sep 9, 2019 at 16:26:55