@inproceedings{bb157100,
        AUTHOR = "McLoughlin, E. and O'Sullivan, D. and Bertolotto, M. and Wilson, D.",
        TITLE = "A Knowledge Management System for Intelligent Retrieval of Geo-Spatial
Imagery",
        BOOKTITLE = CIVR04,
        YEAR = "2004",
        PAGES = "535--544",
        BIBSOURCE = "http://www.visionbib.com/bibliography/applicat802.html#TT152628"}

@inproceedings{bb157101,
        AUTHOR = "Fan, X.D. and Geman, D.",
        TITLE = "Hierarchical object indexing and sequential learning",
        BOOKTITLE = ICPR04,
        YEAR = "2004",
        PAGES = "III: 65--68",
        BIBSOURCE = "http://www.visionbib.com/bibliography/applicat802.html#TT152629"}

% Conference paper; only a single page number is recorded.
@inproceedings{bb157102,
  author    = {Schneidewind, A. and Neumann, P. and Schmitt, I.},
  title     = {An Approach to Visualize Image Retrieval Results},
  booktitle = MMDE04,
  year      = {2004},
  pages     = {148},
  bibsource = {http://www.visionbib.com/bibliography/applicat802.html#TT152630}
}

@inproceedings{bb157103,
        AUTHOR = "Bouchaffra, D. and Tan, J.",
        TITLE = "Introduction to the concept of structural {HMM}:
Application to Mining Customers' Preferences in Automotive Design",
        BOOKTITLE = ICPR04,
        YEAR = "2004",
        PAGES = "II: 493--496",
        BIBSOURCE = "http://www.visionbib.com/bibliography/applicat802.html#TT152631"}

% NOTE(review): first author's surname corrected from "Chelkh" to "Cheikh";
% confirm against the ICIP 2003 proceedings.
@inproceedings{bb157104,
        AUTHOR = "Cheikh, F.A. and Cramariuc, B. and Gabbouj, M.",
        TITLE = "Relevance feedback for shape query refinement",
        BOOKTITLE = ICIP03,
        YEAR = "2003",
        PAGES = "I: 745--748",
        BIBSOURCE = "http://www.visionbib.com/bibliography/applicat802.html#TT152632"}

@inproceedings{bb157105,
        AUTHOR = "Tesic, J. and Manjunath, B.S.",
        TITLE = "Nearest neighbor search for relevance feedback",
        BOOKTITLE = CVPR03,
        YEAR = "2003",
        PAGES = "II: 643--648",
        BIBSOURCE = "http://www.visionbib.com/bibliography/applicat802.html#TT152633"}

@inproceedings{bb157106,
        AUTHOR = "Vicario, E. and He, W.X.",
        TITLE = "Weighted walkthroughs in retrieval by contents of pictorial data",
        BOOKTITLE = CIAP97,
        YEAR = "1997",
        PAGES = "II: 132--139",
        BIBSOURCE = "http://www.visionbib.com/bibliography/applicat802.html#TT152634"}

@article{bb157107,
        AUTHOR = "Wu, Y.C. and Yang, J.C.",
        TITLE = "A Robust Passage Retrieval Algorithm for Video Question Answering",
        JOURNAL = CirSysVideo,
        VOLUME = "18",
        YEAR = "2008",
        NUMBER = "10",
        MONTH = oct,
        PAGES = "1411--1421",
        BIBSOURCE = "http://www.visionbib.com/bibliography/applicat803vqa1.html#TT152638"}

@inproceedings{bb157108,
        AUTHOR = "Wu, Y.C. and Lee, Y.S. and Yang, J.C. and Yen, S.J.",
        TITLE = "A New Passage Ranking Algorithm for Video Question Answering",
        BOOKTITLE = PSIVT06,
        YEAR = "2006",
        PAGES = "563--572",
        BIBSOURCE = "http://www.visionbib.com/bibliography/applicat803vqa1.html#TT152639"}

@article{bb157109,
        AUTHOR = "Li, G.D. and Li, H. and Ming, Z.Y. and Hong, R. and Tang, S. and Chua, T.S.",
        TITLE = "Question Answering over Community-Contributed Web Videos",
        JOURNAL = MultMedMag,
        VOLUME = "17",
        YEAR = "2010",
        NUMBER = "4",
        MONTH = oct,
        PAGES = "46--57",
        BIBSOURCE = "http://www.visionbib.com/bibliography/applicat803vqa1.html#TT152640"}

@inproceedings{bb157110,
        AUTHOR = "Song, Y.C. and Li, H.",
        TITLE = "Mash-Up Approach for Web Video Category Recommendation",
        BOOKTITLE = PSIVT10,
        YEAR = "2010",
        PAGES = "197--202",
        BIBSOURCE = "http://www.visionbib.com/bibliography/applicat803vqa1.html#TT152641"}

@article{bb157111,
        AUTHOR = "Agrawal, A. and Lu, J. and Antol, S. and Mitchell, M. and Zitnick, C.L. and Parikh, D. and Batra, D.",
        TITLE = "{VQA}: Visual Question Answering",
        JOURNAL = IJCV,
        VOLUME = "123",
        YEAR = "2017",
        NUMBER = "1",
        MONTH = may,
        PAGES = "4--31",
        BIBSOURCE = "http://www.visionbib.com/bibliography/applicat803vqa1.html#TT152642"}

@article{bb157112,
        AUTHOR = "Xue, H. and Zhao, Z. and Cai, D.",
        TITLE = "Unifying the Video and Question Attentions for Open-Ended Video
Question Answering",
        JOURNAL = IP,
        VOLUME = "26",
        YEAR = "2017",
        NUMBER = "12",
        MONTH = dec,
        PAGES = "5656--5666",
        BIBSOURCE = "http://www.visionbib.com/bibliography/applicat803vqa1.html#TT152643"}

@article{bb157113,
        AUTHOR = "Xue, H. and Chu, W. and Zhao, Z. and Cai, D.",
        TITLE = "A Better Way to Attend: Attention With Trees for Video Question
Answering",
        JOURNAL = IP,
        VOLUME = "27",
        YEAR = "2018",
        NUMBER = "11",
        MONTH = nov,
        PAGES = "5563--5574",
        BIBSOURCE = "http://www.visionbib.com/bibliography/applicat803vqa1.html#TT152644"}

% NOTE(review): YEAR changed from 2018 to 2017. Other entries in this file
% date IJCV volume 123 to 2017 and volume 127 to 2019, so volume 125
% (December issue) belongs to 2017 -- confirm against the publisher record.
@article{bb157114,
        AUTHOR = "Malinowski, M. and Rohrbach, M. and Fritz, M.",
        TITLE = "Ask Your Neurons: A Deep Learning Approach to Visual Question Answering",
        JOURNAL = IJCV,
        VOLUME = "125",
        YEAR = "2017",
        NUMBER = "1-3",
        MONTH = dec,
        PAGES = "110--135",
        BIBSOURCE = "http://www.visionbib.com/bibliography/applicat803vqa1.html#TT152645"}

@inproceedings{bb157115,
        AUTHOR = "Malinowski, M. and Rohrbach, M. and Fritz, M.",
        TITLE = "Ask Your Neurons:
A Neural-Based Approach to Answering Questions about Images",
        BOOKTITLE = ICCV15,
        YEAR = "2015",
        PAGES = "1--9",
        BIBSOURCE = "http://www.visionbib.com/bibliography/applicat803vqa1.html#TT152646"}

@article{bb157116,
        AUTHOR = "Kafle, K. and Kanan, C.",
        TITLE = "Visual question answering:
Datasets, algorithms, and future challenges",
        JOURNAL = CVIU,
        VOLUME = "163",
        YEAR = "2017",
        NUMBER = "1",
        PAGES = "3--20",
        BIBSOURCE = "http://www.visionbib.com/bibliography/applicat803vqa1.html#TT152647"}

@article{bb157117,
        AUTHOR = "Wu, Q. and Teney, D. and Wang, P. and Shen, C.H. and Dick, A. and van den Hengel, A.J.",
        TITLE = "Visual question answering: A survey of methods and datasets",
        JOURNAL = CVIU,
        VOLUME = "163",
        YEAR = "2017",
        NUMBER = "1",
        PAGES = "21--40",
        BIBSOURCE = "http://www.visionbib.com/bibliography/applicat803vqa1.html#TT152648"}

% NOTE(review): second author changed from "Borgne, H.L." to "Le Borgne, H."
% so that "Le" is parsed as part of the surname rather than as an initial;
% confirm against the published author list.
@article{bb157118,
        AUTHOR = "Tamaazousti, Y. and Le Borgne, H. and Popescu, A. and Gadeski, E. and Ginsca, A. and Hudelot, C.",
        TITLE = "Vision-language integration using constrained local semantic features",
        JOURNAL = CVIU,
        VOLUME = "163",
        YEAR = "2017",
        NUMBER = "1",
        PAGES = "41--57",
        BIBSOURCE = "http://www.visionbib.com/bibliography/applicat803vqa1.html#TT152649"}

@article{bb157119,
        AUTHOR = "Das, A. and Agrawal, H. and Zitnick, L. and Parikh, D. and Batra, D.",
        TITLE = "Human Attention in Visual Question Answering:
Do Humans and Deep Networks Look at the Same Regions?",
        JOURNAL = CVIU,
        VOLUME = "163",
        YEAR = "2017",
        NUMBER = "1",
        PAGES = "90--100",
        BIBSOURCE = "http://www.visionbib.com/bibliography/applicat803vqa1.html#TT152650"}

@article{bb157120,
        AUTHOR = "Teney, D. and Wu, Q. and van den Hengel, A.J.",
        TITLE = "Visual Question Answering: A Tutorial",
        JOURNAL = SPMag,
        VOLUME = "34",
        YEAR = "2017",
        NUMBER = "6",
        MONTH = nov,
        PAGES = "63--75",
        BIBSOURCE = "http://www.visionbib.com/bibliography/applicat803vqa1.html#TT152651"}

@inproceedings{bb157121,
        AUTHOR = "Teney, D. and Liu, L. and van den Hengel, A.J.",
        TITLE = "Graph-Structured Representations for Visual Question Answering",
        BOOKTITLE = CVPR17,
        YEAR = "2017",
        PAGES = "3233--3241",
        BIBSOURCE = "http://www.visionbib.com/bibliography/applicat803vqa1.html#TT152652"}

@inproceedings{bb157122,
        AUTHOR = "Teney, D. and van den Hengel, A.J.",
        TITLE = "Visual Question Answering as a Meta Learning Task",
        BOOKTITLE = ECCV18,
        YEAR = "2018",
        PAGES = "XV: 229--245",
        BIBSOURCE = "http://www.visionbib.com/bibliography/applicat803vqa1.html#TT152653"}

@article{bb157123,
        AUTHOR = "Wu, Q. and Shen, C.H. and Wang, P. and Dick, A. and van den Hengel, A.J.",
        TITLE = "Image Captioning and Visual Question Answering Based on Attributes
and External Knowledge",
        JOURNAL = PAMI,
        VOLUME = "40",
        YEAR = "2018",
        NUMBER = "6",
        MONTH = jun,
        PAGES = "1367--1381",
        BIBSOURCE = "http://www.visionbib.com/bibliography/applicat803vqa1.html#TT152654"}

@inproceedings{bb157124,
        AUTHOR = "Wu, Q. and Wang, P. and Shen, C.H. and Dick, A. and van den Hengel, A.J.",
        TITLE = "Ask Me Anything: Free-Form Visual Question Answering Based on
Knowledge from External Sources",
        BOOKTITLE = CVPR16,
        YEAR = "2016",
        PAGES = "4622--4630",
        BIBSOURCE = "http://www.visionbib.com/bibliography/applicat803vqa1.html#TT152655"}

@article{bb157125,
        AUTHOR = "Lioutas, V. and Passalis, N. and Tefas, A.",
        TITLE = "Explicit ensemble attention learning for improving visual question
answering",
        JOURNAL = PRL,
        VOLUME = "111",
        YEAR = "2018",
        PAGES = "51--57",
        BIBSOURCE = "http://www.visionbib.com/bibliography/applicat803vqa1.html#TT152656"}

@article{bb157126,
        AUTHOR = "Huang, Y.Z. and Zhong, T.",
        TITLE = "Multitask learning for neural generative question answering",
        JOURNAL = RealTimeIP,
        VOLUME = "14",
        YEAR = "2018",
        NUMBER = "1",
        MONTH = jan,
        PAGES = "1009--1017",
        BIBSOURCE = "http://www.visionbib.com/bibliography/applicat803vqa1.html#TT152657"}

@article{bb157127,
        AUTHOR = "Zhang, Q.S. and Wu, Y.N. and Zhang, H. and Zhu, S.C.",
        TITLE = "Mining deep {And-Or} object structures via cost-sensitive
question-answer-based active annotations",
        JOURNAL = CVIU,
        VOLUME = "176-177",
        YEAR = "2018",
        PAGES = "33--44",
        BIBSOURCE = "http://www.visionbib.com/bibliography/applicat803vqa1.html#TT152658"}

@inproceedings{bb157128,
        AUTHOR = "Zhang, Q.S. and Cao, R. and Wu, Y.N. and Zhu, S.C.",
        TITLE = "Mining Object Parts from {CNNs} via Active Question-Answering",
        BOOKTITLE = CVPR17,
        YEAR = "2017",
        PAGES = "3890--3899",
        BIBSOURCE = "http://www.visionbib.com/bibliography/applicat803vqa1.html#TT152659"}

@inproceedings{bb157129,
        AUTHOR = "Zhang, Q.S. and Wu, Y.N. and Zhu, S.C.",
        TITLE = "Mining {And-Or} Graphs for Graph Matching and Object Discovery",
        BOOKTITLE = ICCV15,
        YEAR = "2015",
        PAGES = "55--63",
        BIBSOURCE = "http://www.visionbib.com/bibliography/applicat803vqa1.html#TT152660"}

@article{bb157130,
        AUTHOR = "Garg, S. and Srivastava, R.",
        TITLE = "Object sequences: encoding categorical and spatial information for a
yes/no visual question answering task",
        JOURNAL = IET-CV,
        VOLUME = "12",
        YEAR = "2018",
        NUMBER = "8",
        MONTH = dec,
        PAGES = "1141--1150",
        BIBSOURCE = "http://www.visionbib.com/bibliography/applicat803vqa1.html#TT152661"}

@article{bb157131,
        AUTHOR = "Goyal, Y. and Khot, T. and Agrawal, A. and Summers Stay, D. and Batra, D. and Parikh, D.",
        TITLE = "Making the {V} in {VQA} Matter: Elevating the Role of Image Understanding
in Visual Question Answering",
        JOURNAL = IJCV,
        VOLUME = "127",
        YEAR = "2019",
        NUMBER = "4",
        MONTH = apr,
        PAGES = "398--414",
        BIBSOURCE = "http://www.visionbib.com/bibliography/applicat803vqa1.html#TT152662"}

@inproceedings{bb157132,
        AUTHOR = "Goyal, Y. and Khot, T. and Summers Stay, D. and Batra, D. and Parikh, D.",
        TITLE = "Making the {V} in {VQA} Matter: Elevating the Role of Image Understanding
in Visual Question Answering",
        BOOKTITLE = CVPR17,
        YEAR = "2017",
        PAGES = "6325--6334",
        BIBSOURCE = "http://www.visionbib.com/bibliography/applicat803vqa1.html#TT152662"}

@article{bb157133,
        AUTHOR = "Fang, Z.W. and Liu, J. and Li, Y. and Qiao, Y.Y. and Lu, H.Q.",
        TITLE = "Improving visual question answering using dropout and enhanced
question encoder",
        JOURNAL = PR,
        VOLUME = "90",
        YEAR = "2019",
        PAGES = "404--414",
        BIBSOURCE = "http://www.visionbib.com/bibliography/applicat803vqa1.html#TT152663"}

@article{bb157134,
        AUTHOR = "Das, A. and Kottur, S. and Gupta, K. and Singh, A. and Yadav, D. and Lee, S. and Moura, J.M.F. and Parikh, D. and Batra, D.",
        TITLE = "Visual Dialog",
        JOURNAL = PAMI,
        VOLUME = "41",
        YEAR = "2019",
        NUMBER = "5",
        MONTH = may,
        PAGES = "1242--1256",
        BIBSOURCE = "http://www.visionbib.com/bibliography/applicat803vqa1.html#TT152664"}

@article{bb157135,
        AUTHOR = "Osman, A. and Samek, W.",
        TITLE = "{DRAU}: Dual Recurrent Attention Units for Visual Question Answering",
        JOURNAL = CVIU,
        VOLUME = "185",
        YEAR = "2019",
        PAGES = "24--30",
        BIBSOURCE = "http://www.visionbib.com/bibliography/applicat803vqa1.html#TT152665"}

@article{bb157136,
        AUTHOR = "Liang, J.W. and Jiang, L. and Cao, L.L. and Kalantidis, Y. and Li, L.J. and Hauptmann, A.G.",
        TITLE = "Focal Visual-Text Attention for {Memex} Question Answering",
        JOURNAL = PAMI,
        VOLUME = "41",
        YEAR = "2019",
        NUMBER = "8",
        MONTH = aug,
        PAGES = "1893--1908",
        BIBSOURCE = "http://www.visionbib.com/bibliography/applicat803vqa1.html#TT152666"}

@inproceedings{bb157137,
        AUTHOR = "Liang, J.W. and Jiang, L. and Cao, L.L. and Li, L.J. and Hauptmann, A.G.",
        TITLE = "Focal Visual-Text Attention for Visual Question Answering",
        BOOKTITLE = CVPR18,
        YEAR = "2018",
        PAGES = "6135--6143",
        BIBSOURCE = "http://www.visionbib.com/bibliography/applicat803vqa1.html#TT152667"}

@article{bb157138,
        AUTHOR = "Zhao, Z. and Zhang, Z. and Jiang, X.H. and Cai, D.",
        TITLE = "Multi-Turn Video Question Answering via Hierarchical Attention
Context Reinforced Networks",
        JOURNAL = IP,
        VOLUME = "28",
        YEAR = "2019",
        NUMBER = "8",
        MONTH = aug,
        PAGES = "3860--3872",
        BIBSOURCE = "http://www.visionbib.com/bibliography/applicat803vqa1.html#TT152668"}

@article{bb157139,
        AUTHOR = "Zhao, Z. and Zhang, Z. and Xiao, S.W. and Xiao, Z.X. and Yan, X.H. and Yu, J. and Cai, D. and Wu, F.",
        TITLE = "Long-Form Video Question Answering via Dynamic Hierarchical
Reinforced Networks",
        JOURNAL = IP,
        VOLUME = "28",
        YEAR = "2019",
        NUMBER = "12",
        MONTH = dec,
        PAGES = "5939--5952",
        BIBSOURCE = "http://www.visionbib.com/bibliography/applicat803vqa1.html#TT152669"}

@article{bb157140,
        AUTHOR = "Jang, Y. and Song, Y. and Kim, C.D. and Yu, Y. and Kim, Y. and Kim, G.",
        TITLE = "Video Question Answering with Spatio-Temporal Reasoning",
        JOURNAL = IJCV,
        VOLUME = "127",
        YEAR = "2019",
        NUMBER = "10",
        MONTH = oct,
        PAGES = "1385--1412",
        BIBSOURCE = "http://www.visionbib.com/bibliography/applicat803vqa1.html#TT152670"}

@inproceedings{bb157141,
        AUTHOR = "Jang, Y. and Song, Y. and Yu, Y. and Kim, Y. and Kim, G.",
        TITLE = "{TGIF-QA}:
Toward Spatio-Temporal Reasoning in Visual Question Answering",
        BOOKTITLE = CVPR17,
        YEAR = "2017",
        PAGES = "1359--1367",
        BIBSOURCE = "http://www.visionbib.com/bibliography/applicat803vqa1.html#TT152671"}

@article{bb157142,
        AUTHOR = "Toor, A.S. and Wechsler, H. and Nappi, M.",
        TITLE = "Biometric surveillance using visual question answering",
        JOURNAL = PRL,
        VOLUME = "126",
        YEAR = "2019",
        PAGES = "111--118",
        BIBSOURCE = "http://www.visionbib.com/bibliography/applicat803vqa1.html#TT152672"}

@article{bb157143,
        AUTHOR = "Wang, A. and Luu, A.T. and Foo, C. and Zhu, H. and Tay, Y. and Chandrasekhar, V.",
        TITLE = "Holistic Multi-Modal Memory Network for Movie Question Answering",
        JOURNAL = IP,
        VOLUME = "29",
        YEAR = "2020",
        NUMBER = "1",
        PAGES = "489--499",
        BIBSOURCE = "http://www.visionbib.com/bibliography/applicat803vqa1.html#TT152673"}

% The empty NUMBER field was removed: an empty value only produces an
% "empty field" warning and carries no information.
@article{bb157144,
        AUTHOR = "Yu, T. and Yu, J. and Yu, Z. and Tao, D.",
        TITLE = "Compositional Attention Networks With Two-Stream Fusion for Video
Question Answering",
        JOURNAL = IP,
        VOLUME = "29",
        YEAR = "2020",
        PAGES = "1204--1218",
        BIBSOURCE = "http://www.visionbib.com/bibliography/applicat803vqa1.html#TT152674"}

% Journal article; PAGES holds a single number rather than a range.
@article{bb157145,
  author    = {Ruwa, N. and Mao, Q. and Song, H.P. and Jia, H.J. and Dong, M.},
  title     = {Triple attention network for sentimental visual question answering},
  journal   = CVIU,
  volume    = {189},
  year      = {2019},
  pages     = {102829},
  bibsource = {http://www.visionbib.com/bibliography/applicat803vqa1.html#TT152675}
}

% NOTE(review): the placeholder page range "xx-yy" was dropped so it no longer
% prints literally in bibliographies. PAGES is optional for article entries;
% add the real article number once it has been verified.
@article{bb157146,
        AUTHOR = "Li, W.W. and Song, M.M. and Tian, Y.Y.",
        TITLE = "An Ontology-Driven Cyberinfrastructure for Intelligent Spatiotemporal
Question Answering and Open Knowledge Discovery",
        JOURNAL = IJGI,
        VOLUME = "8",
        YEAR = "2019",
        NUMBER = "11",
        BIBSOURCE = "http://www.visionbib.com/bibliography/applicat803vqa1.html#TT152676"}

% Journal article; PAGES holds a single number rather than a range.
@article{bb157147,
  author    = {Xi, Y.L. and Zhang, Y.N. and Ding, S.T. and Wan, S.H.},
  title     = {Visual question answering model based on visual relationship
detection},
  journal   = SP:IC,
  volume    = {80},
  year      = {2020},
  pages     = {115648},
  bibsource = {http://www.visionbib.com/bibliography/applicat803vqa1.html#TT152677}
}

@inproceedings{bb157148,
        AUTHOR = "Qiu, Y. and Satoh, Y. and Suzuki, R. and Kataoka, H.",
        TITLE = "Incorporating {3D} Information Into Visual Question Answering",
        BOOKTITLE = "3DV19",
        YEAR = "2019",
        PAGES = "756--765",
        BIBSOURCE = "http://www.visionbib.com/bibliography/applicat803vqa1.html#TT152678"}

@inproceedings{bb157149,
        AUTHOR = "Haurilet, M. and Al Halah, Z. and Stiefelhagen, R.",
        TITLE = "{DynGraph}: Visual Question Answering via Dynamic Scene Graphs",
        BOOKTITLE = GCPR19,
        YEAR = "2019",
        PAGES = "428--441",
        BIBSOURCE = "http://www.visionbib.com/bibliography/applicat803vqa1.html#TT152679"}

@inproceedings{bb157150,
        AUTHOR = "Haurilet, M. and Al Halah, Z. and Stiefelhagen, R.",
        TITLE = "{MoQA}: A Multi-modal Question Answering Architecture",
        BOOKTITLE = VL18,
        YEAR = "2018",
        PAGES = "IV: 106--113",
        BIBSOURCE = "http://www.visionbib.com/bibliography/applicat803vqa1.html#TT152680"}

@inproceedings{bb157151,
        AUTHOR = "Liu, F. and Liu, J. and Fang, Z. and Lu, H.",
        TITLE = "Language and Visual Relations Encoding for Visual Question Answering",
        BOOKTITLE = ICIP19,
        YEAR = "2019",
        PAGES = "3307--3311",
        BIBSOURCE = "http://www.visionbib.com/bibliography/applicat803vqa1.html#TT152681"}

@inproceedings{bb157152,
        AUTHOR = "Liu, C.N. and Chen, D.J. and Chen, H.T. and Liu, T.L.",
        TITLE = "{A2A}: Attention to Attention Reasoning for Movie Question Answering",
        BOOKTITLE = ACCV18,
        YEAR = "2018",
        PAGES = "VI: 404--419",
        BIBSOURCE = "http://www.visionbib.com/bibliography/applicat803vqa1.html#TT152682"}

@inproceedings{bb157153,
        AUTHOR = "Fang, Z.W. and Liu, J. and Tang, Q. and Li, Y. and Lu, H.Q.",
        TITLE = "Answer Distillation for Visual Question Answering",
        BOOKTITLE = ACCV18,
        YEAR = "2018",
        PAGES = "I: 72--87",
        BIBSOURCE = "http://www.visionbib.com/bibliography/applicat803vqa1.html#TT152683"}

@inproceedings{bb157154,
        AUTHOR = "Messina, N. and Amato, G. and Carrara, F. and Falchi, F. and Gennaro, C.",
        TITLE = "Learning Relationship-Aware Visual Features",
        BOOKTITLE = CEFR-LCV18,
        YEAR = "2018",
        PAGES = "IV: 486--501",
        BIBSOURCE = "http://www.visionbib.com/bibliography/applicat803vqa1.html#TT152684"}

@inproceedings{bb157155,
        AUTHOR = "Kuhnle, A. and Xie, H.Y. and Copestake, A.",
        TITLE = "How Clever Is the {FiLM} Model, and How Clever Can it Be?",
        BOOKTITLE = VL18,
        YEAR = "2018",
        PAGES = "IV: 162--172",
        BIBSOURCE = "http://www.visionbib.com/bibliography/applicat803vqa1.html#TT152685"}

@inproceedings{bb157156,
        AUTHOR = "Li, W. and Yuan, Z.H. and Fang, X.Z. and Wang, C.",
        TITLE = "Knowing Where to Look? Analysis on Attention of Visual Question
Answering System",
        BOOKTITLE = VL18,
        YEAR = "2018",
        PAGES = "IV: 145--152",
        BIBSOURCE = "http://www.visionbib.com/bibliography/applicat803vqa1.html#TT152686"}

@inproceedings{bb157157,
        AUTHOR = "Bani, G. and Belli, D. and Dagan, G. and Geenen, A. and Skliar, A. and Venkatesh, A. and Baumgartner, T. and Bruni, E. and Fernandez, R.",
        TITLE = "Adding Object Detection Skills to Visual Dialogue Agents",
        BOOKTITLE = VL18,
        YEAR = "2018",
        PAGES = "IV: 180--187",
        BIBSOURCE = "http://www.visionbib.com/bibliography/applicat803vqa1.html#TT152687"}

@inproceedings{bb157158,
        AUTHOR = "Wagner, M. and Basevi, H. and Shetty, R. and Li, W.B. and Malinowski, M. and Fritz, M. and Leonardis, A.",
        TITLE = "Answering Visual What-If Questions: From Actions to Predicted Scene
Descriptions",
        BOOKTITLE = VLEASE18,
        YEAR = "2018",
        PAGES = "I: 521--537",
        BIBSOURCE = "http://www.visionbib.com/bibliography/applicat803vqa1.html#TT152688"}

@inproceedings{bb157159,
        AUTHOR = "Zhang, Y. and Niebles, J.C. and Soto, A.",
        TITLE = "Interpretable Visual Question Answering by Visual Grounding From
Attention Supervision Mining",
        BOOKTITLE = WACV19,
        YEAR = "2019",
        PAGES = "349--357",
        BIBSOURCE = "http://www.visionbib.com/bibliography/applicat803vqa1.html#TT152689"}

@inproceedings{bb157160,
        AUTHOR = "Zhuang, B. and Wu, Q. and Shen, C. and Reid, I.D. and van den Hengel, A.J.",
        TITLE = "Parallel Attention: A Unified Framework for Visual Object Discovery
Through Dialogs and Queries",
        BOOKTITLE = CVPR18,
        YEAR = "2018",
        PAGES = "4252--4261",
        BIBSOURCE = "http://www.visionbib.com/bibliography/applicat803vqa1.html#TT152690"}

@inproceedings{bb157161,
        AUTHOR = "Yang, M. and Yang, N.S.R. and Zhang, K. and Tao, J.",
        TITLE = "Self-Talk: Responses to Users' Opinions and Challenges in Human
Computer Dialog",
        BOOKTITLE = ICPR18,
        YEAR = "2018",
        PAGES = "2839--2844",
        BIBSOURCE = "http://www.visionbib.com/bibliography/applicat803vqa1.html#TT152691"}

@inproceedings{bb157162,
        AUTHOR = "Duke, B. and Taylor, G.W.",
        TITLE = "Generalized {Hadamard}-Product Fusion Operators for Visual Question
Answering",
        BOOKTITLE = CRV18,
        YEAR = "2018",
        PAGES = "39--46",
        BIBSOURCE = "http://www.visionbib.com/bibliography/applicat803vqa1.html#TT152692"}

@inproceedings{bb157163,
        AUTHOR = "Das, A. and Datta, S. and Gkioxari, G. and Lee, S. and Parikh, D. and Batra, D.",
        TITLE = "Embodied Question Answering",
        BOOKTITLE = CVPR18,
        YEAR = "2018",
        PAGES = "1--10",
        BIBSOURCE = "http://www.visionbib.com/bibliography/applicat803vqa1.html#TT152693"}

@inproceedings{bb157164,
        AUTHOR = "Misra, I. and Girshick, R. and Fergus, R. and Hebert, M. and Gupta, A. and van der Maaten, L.",
        TITLE = "Learning by Asking Questions",
        BOOKTITLE = CVPR18,
        YEAR = "2018",
        PAGES = "11--20",
        BIBSOURCE = "http://www.visionbib.com/bibliography/applicat803vqa1.html#TT152694"}

@inproceedings{bb157165,
        AUTHOR = "Gurari, D. and Li, Q. and Stangl, A.J. and Guo, A. and Lin, C. and Grauman, K. and Luo, J. and Bigham, J.P.",
        TITLE = "{VizWiz} Grand Challenge: Answering Visual Questions from Blind People",
        BOOKTITLE = CVPR18,
        YEAR = "2018",
        PAGES = "3608--3617",
        BIBSOURCE = "http://www.visionbib.com/bibliography/applicat803vqa1.html#TT152695"}

@inproceedings{bb157166,
        AUTHOR = "Li, J. and Su, H. and Zhu, J. and Wang, S. and Zhang, B.",
        TITLE = "Textbook Question Answering Under Instructor Guidance with Memory
Networks",
        BOOKTITLE = CVPR18,
        YEAR = "2018",
        PAGES = "3655--3663",
        BIBSOURCE = "http://www.visionbib.com/bibliography/applicat803vqa1.html#TT152696"}

@inproceedings{bb157167,
        AUTHOR = "Gordon, D. and Kembhavi, A. and Rastegari, M. and Redmon, J. and Fox, D. and Farhadi, A.",
        TITLE = "{IQA}: Visual Question Answering in Interactive Environments",
        BOOKTITLE = CVPR18,
        YEAR = "2018",
        PAGES = "4089--4098",
        BIBSOURCE = "http://www.visionbib.com/bibliography/applicat803vqa1.html#TT152697"}

@inproceedings{bb157168,
        AUTHOR = "Agrawal, A. and Batra, D. and Parikh, D. and Kembhavi, A.",
        TITLE = "Don't Just Assume; Look and Answer: Overcoming Priors for Visual
Question Answering",
        BOOKTITLE = CVPR18,
        YEAR = "2018",
        PAGES = "4971--4980",
        BIBSOURCE = "http://www.visionbib.com/bibliography/applicat803vqa1.html#TT152698"}

% NOTE(review): author order changed from "Sha, Chao, Hu" to "Hu, Chao, Sha"
% to match the published paper; confirm against the CVPR 2018 proceedings.
@inproceedings{bb157169,
        AUTHOR = "Hu, H. and Chao, W. and Sha, F.",
        TITLE = "Learning Answer Embeddings for Visual Question Answering",
        BOOKTITLE = CVPR18,
        YEAR = "2018",
        PAGES = "5428--5436",
        BIBSOURCE = "http://www.visionbib.com/bibliography/applicat803vqa1.html#TT152699"}

@inproceedings{bb157170,
        AUTHOR = "Kafle, K. and Price, B. and Cohen, S. and Kanan, C.",
        TITLE = "{DVQA}: Understanding Data Visualizations via Question Answering",
        BOOKTITLE = CVPR18,
        YEAR = "2018",
        PAGES = "5648--5656",
        BIBSOURCE = "http://www.visionbib.com/bibliography/applicat803vqa1.html#TT152700"}

% NOTE(review): author order changed from "Sha, Hu, Chao" to "Chao, Hu, Sha"
% to match the published paper; confirm against the CVPR 2018 proceedings.
@inproceedings{bb157171,
        AUTHOR = "Chao, W. and Hu, H. and Sha, F.",
        TITLE = "Cross-Dataset Adaptation for Visual Question Answering",
        BOOKTITLE = CVPR18,
        YEAR = "2018",
        PAGES = "5716--5725",
        BIBSOURCE = "http://www.visionbib.com/bibliography/applicat803vqa1.html#TT152701"}

@inproceedings{bb157172,
        AUTHOR = "Jain, U. and Schwing, A. and Lazebnik, S.",
        TITLE = "Two Can Play This Game: Visual Dialog with Discriminative Question
Generation and Answering",
        BOOKTITLE = CVPR18,
        YEAR = "2018",
        PAGES = "5754--5763",
        BIBSOURCE = "http://www.visionbib.com/bibliography/applicat803vqa1.html#TT152702"}

@inproceedings{bb157173,
        AUTHOR = "Anderson, P. and He, X. and Buehler, C. and Teney, D. and Johnson, M. and Gould, S. and Zhang, L.",
        TITLE = "Bottom-Up and Top-Down Attention for Image Captioning and Visual
Question Answering",
        BOOKTITLE = CVPR18,
        YEAR = "2018",
        PAGES = "6077--6086",
        BIBSOURCE = "http://www.visionbib.com/bibliography/applicat803vqa1.html#TT152703"}

@inproceedings{bb157174,
        AUTHOR = "Nguyen, D. and Okatani, T.",
        TITLE = "Improved Fusion of Visual and Language Representations by Dense
Symmetric Co-attention for Visual Question Answering",
        BOOKTITLE = CVPR18,
        YEAR = "2018",
        PAGES = "6087--6096",
        BIBSOURCE = "http://www.visionbib.com/bibliography/applicat803vqa1.html#TT152704"}

% NOTE(review): author order changed from "Dokania, Torr, Siddharth, Massiceti"
% to "Massiceti, Siddharth, Dokania, Torr" to match the published paper;
% confirm against the CVPR 2018 proceedings.
@inproceedings{bb157175,
        AUTHOR = "Massiceti, D. and Siddharth, N. and Dokania, P.K. and Torr, P.H.S.",
        TITLE = "{FLIPDIAL}: A Generative Model for Two-Way Visual Dialogue",
        BOOKTITLE = CVPR18,
        YEAR = "2018",
        PAGES = "6097--6105",
        BIBSOURCE = "http://www.visionbib.com/bibliography/applicat803vqa1.html#TT152705"}

@inproceedings{bb157176,
        AUTHOR = "Wu, Q. and Wang, P. and Shen, C. and Reid, I.D. and van den Hengel, A.J.",
        TITLE = "Are You Talking to Me? Reasoned Visual Dialog Generation Through
Adversarial Learning",
        BOOKTITLE = CVPR18,
        YEAR = "2018",
        PAGES = "6106--6115",
        BIBSOURCE = "http://www.visionbib.com/bibliography/applicat803vqa1.html#TT152706"}

@inproceedings{bb157177,
        AUTHOR = "Gao, J. and Ge, R. and Chen, K. and Nevatia, R.",
        TITLE = "Motion-Appearance Co-memory Networks for Video Question Answering",
        BOOKTITLE = CVPR18,
        YEAR = "2018",
        PAGES = "6576--6585",
        BIBSOURCE = "http://www.visionbib.com/bibliography/applicat803vqa1.html#TT152707"}

@inproceedings{bb157178,
        AUTHOR = "Ma, C. and Shen, C. and Dick, A. and Wu, Q. and Wang, P. and van den Hengel, A.J. and Reid, I.D.",
        TITLE = "Visual Question Answering with Memory-Augmented Networks",
        BOOKTITLE = CVPR18,
        YEAR = "2018",
        PAGES = "6975--6984",
        BIBSOURCE = "http://www.visionbib.com/bibliography/applicat803vqa1.html#TT152708"}

@inproceedings{bb157179,
        AUTHOR = "Cao, Q. and Liang, X. and Li, B. and Li, G. and Lin, L.",
        TITLE = "Visual Question Reasoning on General Dependency Tree",
        BOOKTITLE = CVPR18,
        YEAR = "2018",
        PAGES = "7249--7257",
        BIBSOURCE = "http://www.visionbib.com/bibliography/applicat803vqa1.html#TT152709"}

@inproceedings{bb157180,
        AUTHOR = "Patro, B. and Namboodiri, V.P.",
        TITLE = "Differential Attention for Visual Question Answering",
        BOOKTITLE = CVPR18,
        YEAR = "2018",
        PAGES = "7680--7688",
        BIBSOURCE = "http://www.visionbib.com/bibliography/applicat803vqa1.html#TT152710"}

@inproceedings{bb157181,
        AUTHOR = "Su, Z. and Zhu, C. and Dong, Y. and Cai, D. and Chen, Y. and Li, J.",
        TITLE = "Learning Visual Knowledge Memory Networks for Visual Question
Answering",
        BOOKTITLE = CVPR18,
        YEAR = "2018",
        PAGES = "7736--7745",
        BIBSOURCE = "http://www.visionbib.com/bibliography/applicat803vqa1.html#TT152711"}

@inproceedings{bb157182,
        AUTHOR = "Liu, F. and Xiang, T. and Hospedales, T.M. and Yang, W. and Sun, C.",
        TITLE = "{iVQA}: Inverse Visual Question Answering",
        BOOKTITLE = CVPR18,
        YEAR = "2018",
        PAGES = "8611--8619",
        BIBSOURCE = "http://www.visionbib.com/bibliography/applicat803vqa1.html#TT152712"}

@inproceedings{bb157183,
        AUTHOR = "Shin, A. and Ushiku, Y. and Harada, T.",
        TITLE = "Customized Image Narrative Generation via Interactive Visual Question
Generation and Answering",
        BOOKTITLE = CVPR18,
        YEAR = "2018",
        PAGES = "8925--8933",
        BIBSOURCE = "http://www.visionbib.com/bibliography/applicat803vqa1.html#TT152713"}

% NOTE(review): the end page 213509 looks implausible next to start page 2135
% and is probably an indexing artifact; the value is kept as recorded --
% verify against the workshop proceedings.
@inproceedings{bb157184,
        AUTHOR = "Das, A. and Datta, S. and Gkioxari, G. and Lee, S. and Parikh, D. and Batra, D.",
        TITLE = "Embodied Question Answering",
        BOOKTITLE = DeepLearnRV18,
        YEAR = "2018",
        PAGES = "2135--213509",
        BIBSOURCE = "http://www.visionbib.com/bibliography/applicat803vqa1.html#TT152714"}

@inproceedings{bb157185,
        AUTHOR = "Cheng, W. and Huang, Y. and Wang, L.",
        TITLE = "Towards Unconstrained Pointing Problem of Visual Question Answering:
A Retrieval-based Method",
        BOOKTITLE = ICPR18,
        YEAR = "2018",
        PAGES = "3303--3308",
        BIBSOURCE = "http://www.visionbib.com/bibliography/applicat803vqa1.html#TT152715"}

@inproceedings{bb157186,
        AUTHOR = "Teney, D. and Anderson, P. and He, X. and van den Hengel, A. J.",
        TITLE = "Tips and Tricks for Visual Question Answering:
Learnings from the 2017 Challenge",
        BOOKTITLE = CVPR18,
        YEAR = "2018",
        PAGES = "4223--4232",
        BIBSOURCE = "http://www.visionbib.com/bibliography/applicat803vqa1.html#TT152716"}

@inproceedings{bb157187,
        AUTHOR = "Zhou, B. and Sun, Y. and Bau, D. and Torralba, A.",
        TITLE = "Interpretable Basis Decomposition for Visual Explanation",
        BOOKTITLE = ECCV18,
        YEAR = "2018",
        PAGES = "VIII: 122--138",
        BIBSOURCE = "http://www.visionbib.com/bibliography/applicat803vqa1.html#TT152717"}

@inproceedings{bb157188,
        AUTHOR = "Kottur, S. and Moura, J. M. F. and Parikh, D. and Batra, D. and Rohrbach, M.",
        TITLE = "Visual Coreference Resolution in Visual Dialog Using Neural Module
Networks",
        BOOKTITLE = ECCV18,
        YEAR = "2018",
        PAGES = "XV: 160--178",
        BIBSOURCE = "http://www.visionbib.com/bibliography/applicat803vqa1.html#TT152718"}

@inproceedings{bb157189,
        AUTHOR = "Strub, F. and Seurin, M. and Perez, E. and de Vries, H. and Mary, J. and Preux, P. and Courville, A. and Pietquin, O.",
        TITLE = "Visual Reasoning with Multi-hop Feature Modulation",
        BOOKTITLE = ECCV18,
        YEAR = "2018",
        PAGES = "VI: 808--831",
        BIBSOURCE = "http://www.visionbib.com/bibliography/applicat803vqa1.html#TT152719"}

@inproceedings{bb157190,
        AUTHOR = "Shi, Y. and Furlanello, T. and Zha, S. and Anandkumar, A.",
        TITLE = "Question Type Guided Attention in Visual Question Answering",
        BOOKTITLE = ECCV18,
        YEAR = "2018",
        PAGES = "II: 158--175",
        BIBSOURCE = "http://www.visionbib.com/bibliography/applicat803vqa1.html#TT152720"}

@inproceedings{bb157191,
        AUTHOR = "Narasimhan, M. and Schwing, A. G.",
        TITLE = "Straight to the Facts: Learning Knowledge Base Retrieval for Factual
Visual Question Answering",
        BOOKTITLE = ECCV18,
        YEAR = "2018",
        PAGES = "VIII: 460--477",
        BIBSOURCE = "http://www.visionbib.com/bibliography/applicat803vqa1.html#TT152721"}

@inproceedings{bb157192,
        AUTHOR = "Yang, G. R. and Ganichev, I. and Wang, X. J. and Shlens, J. and Sussillo, D.",
        TITLE = "A Dataset and Architecture for Visual Reasoning with a Working Memory",
        BOOKTITLE = ECCV18,
        YEAR = "2018",
        PAGES = "X: 729--745",
        BIBSOURCE = "http://www.visionbib.com/bibliography/applicat803vqa1.html#TT152722"}

@inproceedings{bb157193,
        AUTHOR = "Malinowski, M. and Doersch, C. and Santoro, A. and Battaglia, P.",
        TITLE = "Learning Visual Question Answering by Bootstrapping Hard Attention",
        BOOKTITLE = ECCV18,
        YEAR = "2018",
        PAGES = "VI: 3--20",
        BIBSOURCE = "http://www.visionbib.com/bibliography/applicat803vqa1.html#TT152723"}

@inproceedings{bb157194,
        AUTHOR = "Kim, K. M. and Choi, S. H. and Kim, J. H. and Zhang, B. T.",
        TITLE = "Multimodal Dual Attention Memory for Video Story Question Answering",
        BOOKTITLE = ECCV18,
        YEAR = "2018",
        PAGES = "XV: 698--713",
        BIBSOURCE = "http://www.visionbib.com/bibliography/applicat803vqa1.html#TT152724"}

@inproceedings{bb157195,
        AUTHOR = "Yu, Y. J. and Kim, J. S. and Kim, G.",
        TITLE = "A Joint Sequence Fusion Model for Video Question Answering and
Retrieval",
        BOOKTITLE = ECCV18,
        YEAR = "2018",
        PAGES = "VII: 487--503",
        BIBSOURCE = "http://www.visionbib.com/bibliography/applicat803vqa1.html#TT152725"}

@inproceedings{bb157196,
        AUTHOR = "Gu, J. X. and Cai, J. F. and Joty, S. and Niu, L. and Wang, G.",
        TITLE = "Look, Imagine and Match: Improving Textual-Visual Cross-Modal
Retrieval with Generative Models",
        BOOKTITLE = CVPR18,
        YEAR = "2018",
        PAGES = "7181--7189",
        BIBSOURCE = "http://www.visionbib.com/bibliography/applicat803vqa1.html#TT152726"}

@inproceedings{bb157197,
        AUTHOR = "Li, Q. and Tao, Q. Y. and Joty, S. and Cai, J. F. and Luo, J. B.",
        TITLE = "{VQA-E}: Explaining, Elaborating, and Enhancing Your Answers for Visual
Questions",
        BOOKTITLE = ECCV18,
        YEAR = "2018",
        PAGES = "VII: 570--586",
        BIBSOURCE = "http://www.visionbib.com/bibliography/applicat803vqa1.html#TT152727"}

@inproceedings{bb157198,
        AUTHOR = "Bai, Y. L. and Fu, J. L. and Zhao, T. J. and Mei, T.",
        TITLE = "Deep Attention Neural Tensor Network for Visual Question Answering",
        BOOKTITLE = ECCV18,
        YEAR = "2018",
        PAGES = "XII: 21--37",
        BIBSOURCE = "http://www.visionbib.com/bibliography/applicat803vqa1.html#TT152728"}

@inproceedings{bb157199,
        AUTHOR = "Sinha, A. and Ayush, K.",
        TITLE = "Towards Mathematical Reasoning: A Multimodal Deep Learning Approach",
        BOOKTITLE = ICIP18,
        YEAR = "2018",
        PAGES = "4028--4032",
        BIBSOURCE = "http://www.visionbib.com/bibliography/applicat803vqa1.html#TT152729"}

Last update: Dec 23, 2019 at 15:47:08