@comment{
  Entries bb121400 through bb121499, one field per line.
  Unbraced JOURNAL and BOOKTITLE values (ICIP21, PAMI, SP:IC, AAAI-94, ...)
  are string macros. Their definitions are not part of this span and must be
  provided elsewhere before these entries are read.
  MONTH uses the three-letter month macros predefined by the standard styles.
  Acronyms and proper nouns in TITLE are brace-protected so that styles which
  sentence-case titles keep their capitalisation.
  The PAGES values xx and xx-yy appear to be placeholders for unknown page
  numbers and are carried over unchanged. Prefixes such as I: or II: in PAGES
  are volume designators carried over from the source data.
}

@inproceedings{bb121400,
  AUTHOR    = {Liu, D. C. and Wang, Y. and Mase, K. J. and Kato, J.},
  TITLE     = {Attention-Based Multi-Task Learning for Fine-Grained Image Classification},
  BOOKTITLE = ICIP21,
  YEAR      = {2021},
  PAGES     = {1499--1503},
  BIBSOURCE = {http://www.visionbib.com/bibliography/match605cnnfg2.html#TT117517},
}

@article{bb121401,
  AUTHOR    = {Deng, W. J. and Marsh, J. and Gould, S. and Zheng, L.},
  TITLE     = {Fine-Grained Classification via Categorical Memory Networks},
  JOURNAL   = IP,
  VOLUME    = {31},
  YEAR      = {2022},
  PAGES     = {4186--4196},
  BIBSOURCE = {http://www.visionbib.com/bibliography/match605cnnfg2.html#TT117518},
}

@article{bb121402,
  AUTHOR    = {Zhu, J. W. and Li, Z. X. and Wei, J. and Zeng, Y. F. and Ma, H. F.},
  TITLE     = {Fine-grained bidirectional attentional generation and knowledge-assisted networks for cross-modal retrieval},
  JOURNAL   = IVC,
  VOLUME    = {124},
  YEAR      = {2022},
  PAGES     = {104507},
  BIBSOURCE = {http://www.visionbib.com/bibliography/match605cnnfg2.html#TT117519},
}

@article{bb121403,
  AUTHOR    = {Lang, W. X. and Sun, H. and Xu, C. and Liu, N. Z. and Zhou, H. Y.},
  TITLE     = {Discriminative feature mining hashing for fine-grained image retrieval},
  JOURNAL   = JVCIR,
  VOLUME    = {87},
  YEAR      = {2022},
  PAGES     = {103592},
  BIBSOURCE = {http://www.visionbib.com/bibliography/match605cnnfg2.html#TT117520},
}

@article{bb121404,
  AUTHOR    = {Sun, H. and Lang, W. X. and Xu, C. and Liu, N. Z. and Zhou, H. Y.},
  TITLE     = {Graph-based discriminative features learning for fine-grained image retrieval},
  JOURNAL   = SP:IC,
  VOLUME    = {110},
  YEAR      = {2023},
  PAGES     = {116885},
  BIBSOURCE = {http://www.visionbib.com/bibliography/match605cnnfg2.html#TT117521},
}

@article{bb121405,
  AUTHOR    = {Liu, K. J. and Chen, K. and Jia, K.},
  TITLE     = {Convolutional Fine-Grained Classification With Self-Supervised Target Relation Regularization},
  JOURNAL   = IP,
  VOLUME    = {31},
  YEAR      = {2022},
  PAGES     = {5570--5584},
  BIBSOURCE = {http://www.visionbib.com/bibliography/match605cnnfg2.html#TT117522},
}

@inproceedings{bb121406,
  AUTHOR    = {Yang, X. and Wang, Y. and Chen, K. and Xu, Y. and Tian, Y. H.},
  TITLE     = {Fine-Grained Object Classification via Self-Supervised Pose Alignment},
  BOOKTITLE = CVPR22,
  YEAR      = {2022},
  PAGES     = {7389--7398},
  BIBSOURCE = {http://www.visionbib.com/bibliography/match605cnnfg2.html#TT117523},
}

@article{bb121407,
  AUTHOR    = {Han, J. W. and Yao, X. and Cheng, G. and Feng, X. X. and Xu, D.},
  TITLE     = {{P-CNN}: Part-Based Convolutional Neural Networks for Fine-Grained Visual Categorization},
  JOURNAL   = PAMI,
  VOLUME    = {44},
  YEAR      = {2022},
  NUMBER    = {2},
  MONTH     = feb,
  PAGES     = {579--590},
  BIBSOURCE = {http://www.visionbib.com/bibliography/match605cnnfg2.html#TT117524},
}

@article{bb121408,
  AUTHOR    = {Koniusz, P. and Zhang, H. G.},
  TITLE     = {Power Normalizations in Fine-Grained Image, Few-Shot Image and Graph Classification},
  JOURNAL   = PAMI,
  VOLUME    = {44},
  YEAR      = {2022},
  NUMBER    = {2},
  MONTH     = feb,
  PAGES     = {591--609},
  BIBSOURCE = {http://www.visionbib.com/bibliography/match605cnnfg2.html#TT117525},
}

@article{bb121409,
  AUTHOR    = {Sun, X. and Wang, P. J. and Yan, Z. Y. and Xu, F. and Wang, R. P. and Diao, W. H. and Chen, J. and Li, J. and Feng, Y. C. and Xu, T. and Weinmann, M. and Hinz, S. and Wang, C. and Fu, K.},
  TITLE     = {{FAIR1M}: A benchmark dataset for fine-grained object recognition in high-resolution remote sensing imagery},
  JOURNAL   = PandRS,
  VOLUME    = {184},
  YEAR      = {2022},
  PAGES     = {116--130},
  BIBSOURCE = {http://www.visionbib.com/bibliography/match605cnnfg2.html#TT117526},
}

@article{bb121410,
  AUTHOR    = {Xu, Q. and Zhang, M. Q. and Li, Y. and Tao, Z.},
  TITLE     = {Learning more discriminative clues with gradual attention for fine-grained visual categorization},
  JOURNAL   = IVC,
  VOLUME    = {136},
  YEAR      = {2023},
  PAGES     = {104753},
  BIBSOURCE = {http://www.visionbib.com/bibliography/match605cnnfg2.html#TT117527},
}

@article{bb121411,
  AUTHOR    = {Yu, H. and Lu, H. and Zhao, M. and Li, Z. Y. and Gu, G. H.},
  TITLE     = {Gradient aggregation based fine-grained image retrieval: A unified viewpoint for {CNN} and Transformer},
  JOURNAL   = PR,
  VOLUME    = {149},
  YEAR      = {2024},
  PAGES     = {110248},
  BIBSOURCE = {http://www.visionbib.com/bibliography/match605cnnfg2.html#TT117528},
}

@inproceedings{bb121412,
  AUTHOR    = {Xu, Z. R. and Yu, F. X. and Liu, C. X. and Wu, Z. and Wang, H. C. and Chen, X.},
  TITLE     = {{FalCon}: Fine-grained Feature Map Sparsity Computing with Decomposed Convolutions for Inference Optimization},
  BOOKTITLE = WACV22,
  YEAR      = {2022},
  PAGES     = {3634--3644},
  BIBSOURCE = {http://www.visionbib.com/bibliography/match605cnnfg2.html#TT117529},
}

@inproceedings{bb121413,
  AUTHOR    = {Mahmoudi, M. A. and Chetouani, A. and Boufera, F. and Tabia, H.},
  TITLE     = {Taylor Series Kernelized Layer for Fine-Grained Recognition},
  BOOKTITLE = ICIP21,
  YEAR      = {2021},
  PAGES     = {1914--1918},
  BIBSOURCE = {http://www.visionbib.com/bibliography/match605cnnfg2.html#TT117530},
}

@inproceedings{bb121414,
  AUTHOR    = {Cheng, J. C. and Vasconcelos, N. M.},
  TITLE     = {Learning Deep Classifiers Consistent with Fine-Grained Novelty Detection},
  BOOKTITLE = CVPR21,
  YEAR      = {2021},
  PAGES     = {1664--1673},
  BIBSOURCE = {http://www.visionbib.com/bibliography/match605cnnfg2.html#TT117531},
}

@inproceedings{bb121415,
  AUTHOR    = {Ji, R. and Wen, L. and Zhang, L. and Du, D. and Wu, Y. and Zhao, C. and Liu, X. and Huang, F.},
  TITLE     = {Attention Convolutional Binary Neural Tree for Fine-Grained Visual Categorization},
  BOOKTITLE = CVPR20,
  YEAR      = {2020},
  PAGES     = {10465--10474},
  BIBSOURCE = {http://www.visionbib.com/bibliography/match605cnnfg2.html#TT117532},
}

@inproceedings{bb121416,
  AUTHOR    = {Taherkhani, F. and Kazemi, H. and Dabouei, A. and Dawson, J. and Nasrabadi, N.},
  TITLE     = {A Weakly Supervised Fine Label Classifier Enhanced by Coarse Supervision},
  BOOKTITLE = ICCV19,
  YEAR      = {2019},
  PAGES     = {6458--6467},
  BIBSOURCE = {http://www.visionbib.com/bibliography/match605cnnfg2.html#TT117533},
}

@inproceedings{bb121417,
  AUTHOR    = {Yang, H. and Wu, H. and Chen, H.},
  TITLE     = {Detecting {11K} Classes: Large Scale Object Detection Without Fine-Grained Bounding Boxes},
  BOOKTITLE = ICCV19,
  YEAR      = {2019},
  PAGES     = {9804--9812},
  BIBSOURCE = {http://www.visionbib.com/bibliography/match605cnnfg2.html#TT117534},
}

@inproceedings{bb121418,
  AUTHOR    = {Wagner, J. and Kohler, J. M. and Gindele, T. and Hetzel, L. and Wiedemer, J. T. and Behnke, S.},
  TITLE     = {Interpretable and Fine-Grained Visual Explanations for Convolutional Neural Networks},
  BOOKTITLE = CVPR19,
  YEAR      = {2019},
  PAGES     = {9089--9099},
  BIBSOURCE = {http://www.visionbib.com/bibliography/match605cnnfg2.html#TT117535},
}

@inproceedings{bb121419,
  AUTHOR    = {Feng, Z. and Fu, K. and Zhao, Q.},
  TITLE     = {Learning to Focus and Discriminate for Fine-Grained Classification},
  BOOKTITLE = ICIP19,
  YEAR      = {2019},
  PAGES     = {415--419},
  BIBSOURCE = {http://www.visionbib.com/bibliography/match605cnnfg2.html#TT117536},
}

@inproceedings{bb121420,
  AUTHOR    = {Xin, Q. and Lv, T. and Gao, H.},
  TITLE     = {Random Part Localization Model for Fine Grained Image Classification},
  BOOKTITLE = ICIP19,
  YEAR      = {2019},
  PAGES     = {420--424},
  BIBSOURCE = {http://www.visionbib.com/bibliography/match605cnnfg2.html#TT117537},
}

@inproceedings{bb121421,
  AUTHOR    = {Zhong, W. and Jiang, L. and Zhang, T. and Ji, J. and Xiong, H.},
  TITLE     = {A Multi-part Convolutional Attention Network for Fine-Grained Image Recognition},
  BOOKTITLE = ICPR18,
  YEAR      = {2018},
  PAGES     = {1857--1862},
  BIBSOURCE = {http://www.visionbib.com/bibliography/match605cnnfg2.html#TT117538},
}

@inproceedings{bb121422,
  AUTHOR    = {Simonelli, A. and de Natale, F. G. B. and Messelodi, S. and Bulo, S. R.},
  TITLE     = {Increasingly Specialized Ensemble of Convolutional Neural Networks for Fine-Grained Recognition},
  BOOKTITLE = ICIP18,
  YEAR      = {2018},
  PAGES     = {594--598},
  BIBSOURCE = {http://www.visionbib.com/bibliography/match605cnnfg2.html#TT117539},
}

@inproceedings{bb121423,
  AUTHOR    = {Wang, Y. and Morariu, V. I. and Davis, L. S.},
  TITLE     = {Learning a Discriminative Filter Bank Within a {CNN} for Fine-Grained Recognition},
  BOOKTITLE = CVPR18,
  YEAR      = {2018},
  PAGES     = {4148--4157},
  BIBSOURCE = {http://www.visionbib.com/bibliography/match605cnnfg2.html#TT117540},
}

@inproceedings{bb121424,
  AUTHOR    = {Cai, S. J. and Zuo, W. M. and Zhang, L.},
  TITLE     = {Higher-Order Integration of Hierarchical Convolutional Activations for Fine-Grained Visual Categorization},
  BOOKTITLE = ICCV17,
  YEAR      = {2017},
  PAGES     = {511--520},
  BIBSOURCE = {http://www.visionbib.com/bibliography/match605cnnfg2.html#TT117541},
}

@inproceedings{bb121425,
  AUTHOR    = {Kong, S. and Fowlkes, C. C.},
  TITLE     = {Pixel-Wise Attentional Gating for Scene Parsing},
  BOOKTITLE = WACV19,
  YEAR      = {2019},
  PAGES     = {1024--1033},
  BIBSOURCE = {http://www.visionbib.com/bibliography/match605cnnfg2.html#TT117542},
}

@inproceedings{bb121426,
  AUTHOR    = {Kong, S. and Fowlkes, C. C.},
  TITLE     = {Recurrent Scene Parsing with Perspective Understanding in the Loop},
  BOOKTITLE = CVPR18,
  YEAR      = {2018},
  PAGES     = {956--965},
  BIBSOURCE = {http://www.visionbib.com/bibliography/match605cnnfg2.html#TT117543},
}

@inproceedings{bb121427,
  AUTHOR    = {Zheng, H. and Fu, J. and Mei, T. and Luo, J.},
  TITLE     = {Learning Multi-attention Convolutional Neural Network for Fine-Grained Image Recognition},
  BOOKTITLE = ICCV17,
  YEAR      = {2017},
  PAGES     = {5219--5227},
  BIBSOURCE = {http://www.visionbib.com/bibliography/match605cnnfg2.html#TT117544},
}

@inproceedings{bb121428,
  AUTHOR    = {Fu, J. and Zheng, H. and Mei, T.},
  TITLE     = {Look Closer to See Better: Recurrent Attention Convolutional Neural Network for Fine-Grained Image Recognition},
  BOOKTITLE = CVPR17,
  YEAR      = {2017},
  PAGES     = {4476--4484},
  BIBSOURCE = {http://www.visionbib.com/bibliography/match605cnnfg2.html#TT117545},
}

@inproceedings{bb121429,
  AUTHOR    = {Ge, Z. Y. and McCool, C. and Sanderson, C. and Wang, P. and Liu, L. Q. and Reid, I. D. and Corke, P.},
  TITLE     = {Exploiting Temporal Information for {DCNN}-Based Fine-Grained Object Classification},
  BOOKTITLE = DICTA16,
  YEAR      = {2016},
  PAGES     = {1--6},
  BIBSOURCE = {http://www.visionbib.com/bibliography/match605cnnfg2.html#TT117546},
}

@inproceedings{bb121430,
  AUTHOR    = {Ai, S. S. and Jia, C. Y. and Chen, Z. N.},
  TITLE     = {Large-Scale Product Classification via Spatial Attention Based {CNN} Learning and Multi-class Regression},
  BOOKTITLE = MMMod17,
  YEAR      = {2017},
  PAGES     = {I: 176--188},
  BIBSOURCE = {http://www.visionbib.com/bibliography/match605cnnfg2.html#TT117547},
}

@inproceedings{bb121431,
  AUTHOR    = {Diba, A. and Pazandeh, A. M. and Pirsiavash, H. and Van Gool, L. J.},
  TITLE     = {{DeepCAMP}: Deep Convolutional Action Attribute Mid-Level Patterns},
  BOOKTITLE = CVPR16,
  YEAR      = {2016},
  PAGES     = {3557--3565},
  BIBSOURCE = {http://www.visionbib.com/bibliography/match605cnnfg2.html#TT117548},
}

@inproceedings{bb121432,
  AUTHOR    = {Zhang, H. and Xu, T. and Elhoseiny, M. and Huang, X. L. and Zhang, S. T. and Elgammal, A. E. and Metaxas, D. N.},
  TITLE     = {{SPDA-CNN}: Unifying Semantic Part Detection and Abstraction for Fine-Grained Recognition},
  BOOKTITLE = CVPR16,
  YEAR      = {2016},
  PAGES     = {1143--1152},
  BIBSOURCE = {http://www.visionbib.com/bibliography/match605cnnfg2.html#TT117549},
}

@inproceedings{bb121433,
  AUTHOR    = {Chevalier, M. and Thome, N. and Cord, M. and Fournier, J. and Henaff, G. and Dusch, E.},
  TITLE     = {{LR-CNN} for fine-grained classification with varying resolution},
  BOOKTITLE = ICIP15,
  YEAR      = {2015},
  PAGES     = {3101--3105},
  BIBSOURCE = {http://www.visionbib.com/bibliography/match605cnnfg2.html#TT117550},
}

@inproceedings{bb121434,
  AUTHOR    = {Ge, Z. and Bewley, A. and McCool, C. and Corke, P. and Upcroft, B. and Sanderson, C.},
  TITLE     = {Fine-grained classification via mixture of deep convolutional neural networks},
  BOOKTITLE = WACV16,
  YEAR      = {2016},
  PAGES     = {1--6},
  BIBSOURCE = {http://www.visionbib.com/bibliography/match605cnnfg2.html#TT117551},
}

@inproceedings{bb121435,
  AUTHOR    = {Ge, Z. and McCool, C. and Sanderson, C. and Corke, P.},
  TITLE     = {Modelling local deep convolutional neural network features to improve fine-grained image classification},
  BOOKTITLE = ICIP15,
  YEAR      = {2015},
  PAGES     = {4112--4116},
  BIBSOURCE = {http://www.visionbib.com/bibliography/match605cnnfg2.html#TT117552},
}

@inproceedings{bb121436,
  AUTHOR    = {Zhang, N. and Donahue, J. and Girshick, R. and Darrell, T. J.},
  TITLE     = {Part-Based {R-CNNs} for Fine-Grained Category Detection},
  BOOKTITLE = ECCV14,
  YEAR      = {2014},
  PAGES     = {I: 834--849},
  BIBSOURCE = {http://www.visionbib.com/bibliography/match605cnnfg2.html#TT117553},
}

@article{bb121437,
  AUTHOR    = {Taylor, S. L. and Dahl, D. A. and Lipshutz, M. and Weir, C. and Norton, L. M. and Nilson, R. W. and Linebarger, M. C.},
  TITLE     = {Integrating Natural-Language Understanding with Document Structure-Analysis},
  JOURNAL   = AIR,
  VOLUME    = {8},
  YEAR      = {1994},
  NUMBER    = {2-3},
  PAGES     = {255--276},
  BIBSOURCE = {http://www.visionbib.com/bibliography/match605.html#TT117554},
}

@article{bb121438,
  AUTHOR    = {McKevitt, P.},
  TITLE     = {Integration of Natural-Language and Vision Processing: Theory},
  JOURNAL   = AIR,
  VOLUME    = {9},
  YEAR      = {1995},
  NUMBER    = {4-5},
  MONTH     = oct,
  PAGES     = {247--250},
  BIBSOURCE = {http://www.visionbib.com/bibliography/match605.html#TT117555},
}

@book{bb121439,
  AUTHOR    = {McKevitt, P.},
  TITLE     = {Integration of Natural-Language and Vision Processing: Theory},
  PUBLISHER = {Springer},
  YEAR      = {1995},
  BIBSOURCE = {http://www.visionbib.com/bibliography/match605.html#TT117555},
}

@article{bb121440,
  AUTHOR    = {McKevitt, P.},
  TITLE     = {Integration of Natural-Language and Vision Processing: Intelligent Multimedia},
  JOURNAL   = AIR,
  VOLUME    = {9},
  YEAR      = {1995},
  NUMBER    = {2-3},
  MONTH     = jun,
  PAGES     = {77--80},
  BIBSOURCE = {http://www.visionbib.com/bibliography/match605.html#TT117556},
}

@article{bb121441,
  AUTHOR    = {McKevitt, P.},
  TITLE     = {Integration of Natural-Language and Vision Processing: More Computational Models and Systems},
  JOURNAL   = AIR,
  VOLUME    = {8},
  YEAR      = {1995},
  NUMBER    = {5-6},
  PAGES     = {345--348},
  BIBSOURCE = {http://www.visionbib.com/bibliography/match605.html#TT117557},
}

@article{bb121442,
  AUTHOR    = {McKevitt, P.},
  TITLE     = {Integration of Natural-Language and Vision Processing: Computational Models and Systems},
  JOURNAL   = AIR,
  VOLUME    = {8},
  YEAR      = {1994},
  NUMBER    = {2-3},
  PAGES     = {99--104},
  BIBSOURCE = {http://www.visionbib.com/bibliography/match605.html#TT117558},
}

@book{bb121443,
  AUTHOR    = {McKevitt, P.},
  TITLE     = {Integration of Natural-Language and Vision Processing: Computational Models and Systems},
  PUBLISHER = {Kluwer},
  YEAR      = {1995},
  BIBSOURCE = {http://www.visionbib.com/bibliography/match605.html#TT117558},
}

@article{bb121444,
  AUTHOR    = {McKevitt, P.},
  TITLE     = {Integration of Natural-Language and Vision Processing: Grounding Representations},
  JOURNAL   = AIR,
  VOLUME    = {10},
  YEAR      = {1996},
  NUMBER    = {1-2},
  MONTH     = apr,
  PAGES     = {7--13},
  BIBSOURCE = {http://www.visionbib.com/bibliography/match605.html#TT117559},
}

@book{bb121445,
  AUTHOR    = {McKevitt, P.},
  TITLE     = {Integration of Natural Language and Vision Processing},
  PUBLISHER = {Kluwer},
  YEAR      = {1996},
  MONTH     = sep,
  BIBSOURCE = {http://www.visionbib.com/bibliography/match605.html#TT117560},
}

@article{bb121446,
  AUTHOR    = {Siskind, J. M.},
  TITLE     = {Grounding Language in Perception},
  JOURNAL   = AIR,
  VOLUME    = {8},
  YEAR      = {1995},
  NUMBER    = {5-6},
  PAGES     = {371--391},
  BIBSOURCE = {http://www.visionbib.com/bibliography/match605.html#TT117561},
}

@article{bb121447,
  AUTHOR    = {Srihari, R. K.},
  TITLE     = {Automatic-Indexing and Content-Based Retrieval of Captioned Images},
  JOURNAL   = Computer,
  VOLUME    = {28},
  YEAR      = {1995},
  NUMBER    = {9},
  MONTH     = sep,
  PAGES     = {49--56},
  BIBSOURCE = {http://www.visionbib.com/bibliography/match605.html#TT117562},
}

@article{bb121448,
  AUTHOR    = {Srihari, R. K.},
  TITLE     = {Use of Captions and Other Collateral Text in Understanding Photographs},
  JOURNAL   = AIR,
  VOLUME    = {8},
  YEAR      = {1995},
  NUMBER    = {5-6},
  PAGES     = {409--430},
  BIBSOURCE = {http://www.visionbib.com/bibliography/match605.html#TT117563},
}

@article{bb121449,
  AUTHOR    = {Srihari, R. K.},
  TITLE     = {Use of Collateral Text in Understanding Photos in Documents},
  JOURNAL   = SPIE,
  VOLUME    = {2368},
  YEAR      = {1994},
  PAGES     = {186--199},
  BIBSOURCE = {http://www.visionbib.com/bibliography/match605.html#TT117564},
}

@article{bb121450,
  AUTHOR    = {Srihari, R. K.},
  TITLE     = {Computational Models for Integrating Linguistic and Visual Information: A Survey},
  JOURNAL   = AIR,
  VOLUME    = {8},
  YEAR      = {1995},
  NUMBER    = {5-6},
  PAGES     = {349--369},
  BIBSOURCE = {http://www.visionbib.com/bibliography/match605.html#TT117565},
}

@inproceedings{bb121451,
  AUTHOR    = {Srihari, R. K.},
  TITLE     = {Using Linguistic Context for Image Interpretation and Annotation},
  BOOKTITLE = {Radius97},
  YEAR      = {1997},
  PAGES     = {419--427},
  BIBSOURCE = {http://www.visionbib.com/bibliography/match605.html#TT117566},
}

@inproceedings{bb121452,
  AUTHOR    = {Srihari, R. K.},
  TITLE     = {Linguistic Context In Vision},
  BOOKTITLE = Context95,
  YEAR      = {1995},
  PAGES     = {xx},
  BIBSOURCE = {http://www.visionbib.com/bibliography/match605.html#TT117567},
}

@inproceedings{bb121453,
  AUTHOR    = {Srihari, R. K. and Zhang, Z. and Venkatraman, M. and Chopra, R.},
  TITLE     = {Using Speech Input for Image Interpretation and Annotation},
  BOOKTITLE = ARPA96,
  YEAR      = {1996},
  PAGES     = {501--510},
  BIBSOURCE = {http://www.visionbib.com/bibliography/match605.html#TT117568},
}

@inproceedings{bb121454,
  AUTHOR    = {Burhans, D. T. and Chopra, R. and Srihari, R. K. and Govindaraju, V. and Venkataraman, M.},
  TITLE     = {Use of Collateral Text in Image Interpretation},
  BOOKTITLE = ARPA94,
  YEAR      = {1994},
  PAGES     = {II:897--907},
  BIBSOURCE = {http://www.visionbib.com/bibliography/match605.html#TT117569},
}

@inproceedings{bb121455,
  AUTHOR    = {Srihari, R. K. and Burhans, D. T.},
  TITLE     = {Visual Semantics: Extracting Visual Information from Text Accompanying Pictures},
  BOOKTITLE = AAAI-94,
  YEAR      = {1994},
  PAGES     = {793--798},
  BIBSOURCE = {http://www.visionbib.com/bibliography/match605.html#TT117570},
}

@inproceedings{bb121456,
  AUTHOR    = {Govindaraju, V. and Srihari, S. N. and Sher, D. B.},
  TITLE     = {Caption-Aided Face Location In Newspaper Photographs},
  BOOKTITLE = ICPR92,
  YEAR      = {1992},
  PAGES     = {I:474--477},
  BIBSOURCE = {http://www.visionbib.com/bibliography/match605.html#TT117571},
}

@inproceedings{bb121457,
  AUTHOR    = {Govindaraju, V. and Srihari, S. N. and Sher, D. B.},
  TITLE     = {A Computational Model for Face Location Based on Cognitive Principles},
  BOOKTITLE = AAAI-92,
  YEAR      = {1992},
  PAGES     = {350--355},
  BIBSOURCE = {http://www.visionbib.com/bibliography/match605.html#TT117572},
}

@article{bb121458,
  AUTHOR    = {Schank, R. C. and Fano, A.},
  TITLE     = {Memory and Expectations in Learning, Language, and Visual Understanding},
  JOURNAL   = AIR,
  VOLUME    = {9},
  YEAR      = {1995},
  NUMBER    = {4-5},
  MONTH     = oct,
  PAGES     = {261--271},
  BIBSOURCE = {http://www.visionbib.com/bibliography/match605.html#TT117573},
}

@article{bb121459,
  AUTHOR    = {Wilks, Y.},
  TITLE     = {Language, Vision and Metaphor},
  JOURNAL   = AIR,
  VOLUME    = {9},
  YEAR      = {1995},
  NUMBER    = {4-5},
  MONTH     = oct,
  PAGES     = {273--289},
  BIBSOURCE = {http://www.visionbib.com/bibliography/match605.html#TT117574},
}

@article{bb121460,
  AUTHOR    = {Partridge, D.},
  TITLE     = {Language and Vision: A Single Perceptual Mechanism},
  JOURNAL   = AIR,
  VOLUME    = {9},
  YEAR      = {1995},
  NUMBER    = {4-5},
  MONTH     = oct,
  PAGES     = {291--303},
  BIBSOURCE = {http://www.visionbib.com/bibliography/match605.html#TT117575},
}

@article{bb121461,
  AUTHOR    = {Marconi, D.},
  TITLE     = {Work on the Integration of Language and Vision at the {University of Torino}},
  JOURNAL   = AIR,
  VOLUME    = {10},
  YEAR      = {1996},
  NUMBER    = {1-2},
  MONTH     = apr,
  PAGES     = {15--20},
  BIBSOURCE = {http://www.visionbib.com/bibliography/match605.html#TT117576},
}

@article{bb121462,
  AUTHOR    = {Meini, C. and Paternoster, A.},
  TITLE     = {Understanding Language Through Vision},
  JOURNAL   = AIR,
  VOLUME    = {10},
  YEAR      = {1996},
  NUMBER    = {1-2},
  MONTH     = apr,
  PAGES     = {37--48},
  BIBSOURCE = {http://www.visionbib.com/bibliography/match605.html#TT117577},
}

@article{bb121463,
  AUTHOR    = {McKevitt, P. and Guo, C. M.},
  TITLE     = {From {Chinese} Rooms to {Irish} Rooms: New Words on Visions for Language},
  JOURNAL   = AIR,
  VOLUME    = {10},
  YEAR      = {1996},
  NUMBER    = {1-2},
  MONTH     = apr,
  PAGES     = {49--63},
  BIBSOURCE = {http://www.visionbib.com/bibliography/match605.html#TT117578},
}

@article{bb121464,
  AUTHOR    = {Grumbach, A.},
  TITLE     = {Grounding Symbols into Perceptions},
  JOURNAL   = AIR,
  VOLUME    = {10},
  YEAR      = {1996},
  NUMBER    = {1-2},
  MONTH     = apr,
  PAGES     = {131--146},
  BIBSOURCE = {http://www.visionbib.com/bibliography/match605.html#TT117579},
}

@article{bb121465,
  AUTHOR    = {Socher, G. and Sagerer, G. F. and Perona, P.},
  TITLE     = {Bayesian reasoning on qualitative descriptions from images and speech},
  JOURNAL   = IVC,
  VOLUME    = {18},
  YEAR      = {2000},
  NUMBER    = {2},
  MONTH     = jan,
  PAGES     = {155--172},
  BIBSOURCE = {http://www.visionbib.com/bibliography/match605.html#TT117580},
}

@article{bb121466,
  AUTHOR    = {Mukerjee, A. and Gupta, K. and Nautiyal, S. and Singh, M. P. and Mishra, N.},
  TITLE     = {Conceptual description of visual scenes from linguistic models},
  JOURNAL   = IVC,
  VOLUME    = {18},
  YEAR      = {2000},
  NUMBER    = {2},
  MONTH     = jan,
  PAGES     = {173--187},
  BIBSOURCE = {http://www.visionbib.com/bibliography/match605.html#TT117581},
}

@article{bb121467,
  AUTHOR    = {Arens, M. and Gerber, R. and Nagel, H. H.},
  TITLE     = {Conceptual representations between video signals and natural language descriptions},
  JOURNAL   = IVC,
  VOLUME    = {26},
  YEAR      = {2008},
  NUMBER    = {1},
  MONTH     = jan,
  PAGES     = {53--66},
  BIBSOURCE = {http://www.visionbib.com/bibliography/match605.html#TT117582},
}

@inproceedings{bb121468,
  AUTHOR    = {Gerber, R. and Nagel, H. H.},
  TITLE     = {(Mis?-) Using {DRT} for Generation of Natural Language Text from Image Sequences},
  BOOKTITLE = ECCV98,
  YEAR      = {1998},
  PAGES     = {II: 255},
  BIBSOURCE = {http://www.visionbib.com/bibliography/match605.html#TT117583},
}

@article{bb121469,
  AUTHOR    = {Lee, Y. J. and Grauman, K.},
  TITLE     = {Object-Graphs for Context-Aware Visual Category Discovery},
  JOURNAL   = PAMI,
  VOLUME    = {34},
  YEAR      = {2012},
  NUMBER    = {2},
  MONTH     = feb,
  PAGES     = {346--358},
  BIBSOURCE = {http://www.visionbib.com/bibliography/match605.html#TT117584},
}

@inproceedings{bb121470,
  AUTHOR    = {Lee, Y. J. and Grauman, K.},
  TITLE     = {Object-graphs for context-aware category discovery},
  BOOKTITLE = CVPR10,
  YEAR      = {2010},
  PAGES     = {1--8},
  BIBSOURCE = {http://www.visionbib.com/bibliography/match605.html#TT117585},
}

@inproceedings{bb121471,
  AUTHOR    = {Lee, Y. J. and Grauman, K.},
  TITLE     = {Learning the easy things first: Self-paced visual category discovery},
  BOOKTITLE = CVPR11,
  YEAR      = {2011},
  PAGES     = {1721--1728},
  BIBSOURCE = {http://www.visionbib.com/bibliography/match605.html#TT117586},
}

@article{bb121472,
  AUTHOR    = {Yu, A. and Grauman, K.},
  TITLE     = {Densifying Supervision for Fine-Grained Visual Comparisons},
  JOURNAL   = IJCV,
  VOLUME    = {128},
  YEAR      = {2020},
  NUMBER    = {10-11},
  MONTH     = nov,
  PAGES     = {2704--2730},
  BIBSOURCE = {http://www.visionbib.com/bibliography/match605.html#TT117587},
}

@inproceedings{bb121473,
  AUTHOR    = {Hessel, J. and Hwang, J. D. and Park, J. S. and Zellers, R. and Bhagavatula, C. and Rohrbach, A. and Saenko, K. and Choi, Y.},
  TITLE     = {The Abduction of {Sherlock} {Holmes}: A Dataset for Visual Abductive Reasoning},
  BOOKTITLE = ECCV22,
  YEAR      = {2022},
  PAGES     = {XXXVI:558--575},
  BIBSOURCE = {http://www.visionbib.com/bibliography/match605.html#TT117588},
}

@inproceedings{bb121474,
  AUTHOR    = {Perona, P.},
  TITLE     = {A taxonomy of visual recognition},
  BOOKTITLE = VMV04,
  YEAR      = {2004},
  PAGES     = {187},
  BIBSOURCE = {http://www.visionbib.com/bibliography/match605.html#TT117589},
}

@inproceedings{bb121475,
  AUTHOR    = {Takahashi, T. and Nakanishi, S. and Kuno, Y. and Shirai, Y.},
  TITLE     = {Helping Computer Vision by Verbal and Nonverbal Communication},
  BOOKTITLE = ICPR98,
  YEAR      = {1998},
  PAGES     = {Vol II: 1216--1218},
  BIBSOURCE = {http://www.visionbib.com/bibliography/match605.html#TT117590},
}

@inproceedings{bb121476,
  AUTHOR    = {Satoh, S. and Nakamura, Y. and Kanade, T.},
  TITLE     = {{Name-It}: Naming and Detecting Faces in Video by the Integration of Image and Natural Language Processing},
  BOOKTITLE = IJCAI97,
  YEAR      = {1997},
  PAGES     = {1488--1495},
  BIBSOURCE = {http://www.visionbib.com/bibliography/match605.html#TT117591},
}

@inproceedings{bb121477,
  AUTHOR    = {Satoh, S. and Kanade, T.},
  TITLE     = {{Name-It}: Association Of Face And Name In Video},
  BOOKTITLE = CVPR97,
  YEAR      = {1997},
  PAGES     = {368--373},
  BIBSOURCE = {http://www.visionbib.com/bibliography/match605.html#TT117592},
}

@inproceedings{bb121478,
  AUTHOR    = {Socher, G. and Sagerer, G. F. and Kummert, F. and Fuhr, T.},
  TITLE     = {Talking About {3D} Scenes: Integration of Image and Speech Understanding in a Hybrid Distributed System},
  BOOKTITLE = ICIP96,
  YEAR      = {1996},
  PAGES     = {II: 809--812},
  BIBSOURCE = {http://www.visionbib.com/bibliography/match605.html#TT117593},
}

@article{bb121479,
  AUTHOR    = {Kuniyoshi, Y. and Inaba, M. and Inoue, H.},
  TITLE     = {Learning by Watching: Extracting Reusable Task Knowledge from Visual Observation of Human Performance},
  JOURNAL   = RA,
  VOLUME    = {10},
  YEAR      = {1994},
  PAGES     = {799--822},
  BIBSOURCE = {http://www.visionbib.com/bibliography/match606.html#TT117594},
}

@inproceedings{bb121480,
  AUTHOR    = {Kuniyoshi, Y. and Inoue, H.},
  TITLE     = {Indexicality and dynamic attention control in qualitative recognition of assembly actions},
  BOOKTITLE = ECCV92,
  YEAR      = {1992},
  PAGES     = {874--878},
  BIBSOURCE = {http://www.visionbib.com/bibliography/match606.html#TT117595},
}

@article{bb121481,
  AUTHOR    = {Porway, J. and Wang, Q. C. and Zhu, S. C.},
  TITLE     = {A Hierarchical and Contextual Model for Aerial Image Parsing},
  JOURNAL   = IJCV,
  VOLUME    = {88},
  YEAR      = {2010},
  NUMBER    = {2},
  MONTH     = jun,
  PAGES     = {xx-yy},
  BIBSOURCE = {http://www.visionbib.com/bibliography/match606.html#TT117596},
}

@inproceedings{bb121482,
  AUTHOR    = {Porway, J. and Wang, K. and Yao, B. and Zhu, S. C.},
  TITLE     = {A hierarchical and contextual model for aerial image understanding},
  BOOKTITLE = CVPR08,
  YEAR      = {2008},
  PAGES     = {1--8},
  BIBSOURCE = {http://www.visionbib.com/bibliography/match606.html#TT117597},
}

@inproceedings{bb121483,
  AUTHOR    = {Si, Z. Z. and Gong, H. F. and Wu, Y. N. and Zhu, S. C.},
  TITLE     = {Learning mixed templates for object recognition},
  BOOKTITLE = CVPR09,
  YEAR      = {2009},
  PAGES     = {272--279},
  BIBSOURCE = {http://www.visionbib.com/bibliography/match606.html#TT117598},
}

@article{bb121484,
  AUTHOR    = {Tu, Z. W. and Bai, X.},
  TITLE     = {Auto-Context and Its Application to High-Level Vision Tasks and {3D} Brain Image Segmentation},
  JOURNAL   = PAMI,
  VOLUME    = {32},
  YEAR      = {2010},
  NUMBER    = {10},
  MONTH     = oct,
  PAGES     = {1744--1757},
  BIBSOURCE = {http://www.visionbib.com/bibliography/match606.html#TT117599},
}

@inproceedings{bb121485,
  AUTHOR    = {Tu, Z. W.},
  TITLE     = {Auto-context and its application to high-level vision tasks},
  BOOKTITLE = CVPR08,
  YEAR      = {2008},
  PAGES     = {1--8},
  BIBSOURCE = {http://www.visionbib.com/bibliography/match606.html#TT117600},
}

@inproceedings{bb121486,
  AUTHOR    = {Jones, J. and Hager, G. D. and Khudanpur, S.},
  TITLE     = {Toward Computer Vision Systems That Understand Real-World Assembly Processes},
  BOOKTITLE = WACV19,
  YEAR      = {2019},
  PAGES     = {426--434},
  BIBSOURCE = {http://www.visionbib.com/bibliography/match606.html#TT117601},
}

@inproceedings{bb121487,
  AUTHOR    = {Lampert, C. H.},
  TITLE     = {Partitioning of image datasets using discriminative context information},
  BOOKTITLE = CVPR08,
  YEAR      = {2008},
  PAGES     = {1--8},
  BIBSOURCE = {http://www.visionbib.com/bibliography/match606.html#TT117602},
}

@inproceedings{bb121488,
  AUTHOR    = {Hansen, C. and Henderson, T. C.},
  TITLE     = {Towards the Automatic Generation of Recognition Strategies},
  BOOKTITLE = ICCV88,
  YEAR      = {1988},
  PAGES     = {275--279},
  BIBSOURCE = {http://www.visionbib.com/bibliography/match606.html#TT117603},
}

@inproceedings{bb121489,
  AUTHOR    = {Cantoni, V. and Cei, U. and Ferretti, M. and Lombardi, L.},
  TITLE     = {Towards an Automatic Construction of Object Recognition Strategies},
  BOOKTITLE = ICPR88,
  YEAR      = {1988},
  PAGES     = {I: 371--374},
  BIBSOURCE = {http://www.visionbib.com/bibliography/match606.html#TT117604},
}

@inproceedings{bb121490,
  AUTHOR    = {Cova, G. and Griffini, A. and Lombardi, L.},
  TITLE     = {Object Recognition Strategy in a Multi-Resolution System},
  BOOKTITLE = CIAP89,
  YEAR      = {1989},
  PAGES     = {729--733},
  BIBSOURCE = {http://www.visionbib.com/bibliography/match606.html#TT117605},
}

@article{bb121491,
  AUTHOR    = {Feng, Y. S. and Lapata, M.},
  TITLE     = {Automatic Caption Generation for News Images},
  JOURNAL   = PAMI,
  VOLUME    = {35},
  YEAR      = {2013},
  NUMBER    = {4},
  MONTH     = apr,
  PAGES     = {797--812},
  BIBSOURCE = {http://www.visionbib.com/bibliography/match607ic1.html#TT117606},
}

@article{bb121492,
  AUTHOR    = {Vinyals, O. and Toshev, A. and Bengio, S. and Erhan, D.},
  TITLE     = {Show and Tell: Lessons Learned from the 2015 {MSCOCO} Image Captioning Challenge},
  JOURNAL   = PAMI,
  VOLUME    = {39},
  YEAR      = {2017},
  NUMBER    = {4},
  MONTH     = apr,
  PAGES     = {652--663},
  BIBSOURCE = {http://www.visionbib.com/bibliography/match607ic1.html#TT117607},
}

@inproceedings{bb121493,
  AUTHOR    = {Vinyals, O. and Toshev, A. and Bengio, S. and Erhan, D.},
  TITLE     = {Show and tell: A neural image caption generator},
  BOOKTITLE = CVPR15,
  YEAR      = {2015},
  PAGES     = {3156--3164},
  BIBSOURCE = {http://www.visionbib.com/bibliography/match607ic1.html#TT117608},
}

@article{bb121494,
  AUTHOR    = {Wang, J. Y. and Zhu, X. T. and Gong, S. G.},
  TITLE     = {Discovering visual concept structure with sparse and incomplete tags},
  JOURNAL   = AI,
  VOLUME    = {250},
  YEAR      = {2017},
  NUMBER    = {1},
  PAGES     = {16--36},
  BIBSOURCE = {http://www.visionbib.com/bibliography/match607ic1.html#TT117609},
}

@article{bb121495,
  AUTHOR    = {Kilickaya, M. and Akkus, B. K. and Cakici, R. and Erdem, A. and Erdem, E. and Ikizler Cinbis, N.},
  TITLE     = {Data-driven image captioning via salient region discovery},
  JOURNAL   = IET-CV,
  VOLUME    = {11},
  YEAR      = {2017},
  NUMBER    = {6},
  MONTH     = sep,
  PAGES     = {398--406},
  BIBSOURCE = {http://www.visionbib.com/bibliography/match607ic1.html#TT117610},
}

@article{bb121496,
  AUTHOR    = {He, X. D. and Deng, L.},
  TITLE     = {Deep Learning for Image-to-Text Generation: A Technical Overview},
  JOURNAL   = SPMag,
  VOLUME    = {34},
  YEAR      = {2017},
  NUMBER    = {6},
  MONTH     = nov,
  PAGES     = {109--116},
  BIBSOURCE = {http://www.visionbib.com/bibliography/match607ic1.html#TT117611},
}

@article{bb121497,
  AUTHOR    = {Deng, L. and He, X. D.},
  TITLE     = {Deep Learning for Image-to-Text Generation: A Technical Overview},
  JOURNAL   = SPMag,
  VOLUME    = {35},
  YEAR      = {2018},
  NUMBER    = {1},
  MONTH     = jan,
  PAGES     = {178},
  BIBSOURCE = {http://www.visionbib.com/bibliography/match607ic1.html#TT117611},
}

@article{bb121498,
  AUTHOR    = {Li, L. H. and Tang, S. and Zhang, Y. D. and Deng, L. X. and Tian, Q.},
  TITLE     = {{GLA}: Global-Local Attention for Image Description},
  JOURNAL   = MultMed,
  VOLUME    = {20},
  YEAR      = {2018},
  NUMBER    = {3},
  MONTH     = mar,
  PAGES     = {726--737},
  BIBSOURCE = {http://www.visionbib.com/bibliography/match607ic1.html#TT117612},
}

@article{bb121499,
  AUTHOR    = {Lu, X. and Wang, B. and Zheng, X. and Li, X.},
  TITLE     = {Exploring Models and Data for Remote Sensing Image Caption Generation},
  JOURNAL   = GeoRS,
  VOLUME    = {56},
  YEAR      = {2018},
  NUMBER    = {4},
  MONTH     = apr,
  PAGES     = {2183--2195},
  BIBSOURCE = {http://www.visionbib.com/bibliography/match607ic1.html#TT117613},
}