@inproceedings{bb239000,
        AUTHOR = "Qi, Y.G. and Zhang, K. and Sain, A. and Song, Y.Z.",
        TITLE = "PQA: Perceptual Question Answering",
        BOOKTITLE = CVPR21,
        YEAR = "2021",
        PAGES = "12051-12059",
        BIBSOURCE = "http://www.visionbib.com/bibliography/applicat803vqa1.html#TT233916"}

@inproceedings{bb239001,
        AUTHOR = "Yuan, Y.Y. and Wang, S. and Jiang, M.Y. and Chen, T.Y.",
        TITLE = "Perception Matters: Detecting Perception Failures of VQA Models Using
Metamorphic Testing",
        BOOKTITLE = CVPR21,
        YEAR = "2021",
        PAGES = "16903-16912",
        BIBSOURCE = "http://www.visionbib.com/bibliography/applicat803vqa1.html#TT233917"}

@inproceedings{bb239002,
        AUTHOR = "Marino, K. and Chen, X.L. and Parikh, D. and Gupta, A. and Rohrbach, M.",
        TITLE = "KRISP: Integrating Implicit and Symbolic Knowledge for Open-Domain
Knowledge-Based VQA",
        BOOKTITLE = CVPR21,
        YEAR = "2021",
        PAGES = "14106-14116",
        BIBSOURCE = "http://www.visionbib.com/bibliography/applicat803vqa1.html#TT233918"}

@inproceedings{bb239003,
        AUTHOR = "Niu, Y. and Tang, K. and Zhang, H.W. and Lu, Z.W. and Hua, X.S. and Wen, J.R.",
        TITLE = "Counterfactual VQA: A Cause-Effect Look at Language Bias",
        BOOKTITLE = CVPR21,
        YEAR = "2021",
        PAGES = "12695-12705",
        BIBSOURCE = "http://www.visionbib.com/bibliography/applicat803vqa1.html#TT233919"}

@inproceedings{bb239004,
        AUTHOR = "Yang, Z.Y. and Lu, Y.J. and Wang, J.F. and Yin, X. and Florencio, D. and Wang, L.J. and Zhang, C. and Zhang, L. and Luo, J.B.",
        TITLE = "TAP: Text-Aware Pre-training for Text-VQA and Text-Caption",
        BOOKTITLE = CVPR21,
        YEAR = "2021",
        PAGES = "8747-8757",
        BIBSOURCE = "http://www.visionbib.com/bibliography/applicat803vqa1.html#TT233920"}

@inproceedings{bb239005,
        AUTHOR = "Kervadec, C. and Jaunet, T. and Antipov, G. and Baccouche, M. and Vuillemot, R. and Wolf, C.",
        TITLE = "How Transferable are Reasoning Patterns in VQA?",
        BOOKTITLE = CVPR21,
        YEAR = "2021",
        PAGES = "4205-4214",
        BIBSOURCE = "http://www.visionbib.com/bibliography/applicat803vqa1.html#TT233921"}

@inproceedings{bb239006,
        AUTHOR = "Kervadec, C. and Antipov, G. and Baccouche, M. and Wolf, C.",
        TITLE = "Roses are Red, Violets are Blue... But Should VQA expect Them To?",
        BOOKTITLE = CVPR21,
        YEAR = "2021",
        PAGES = "2775-2784",
        BIBSOURCE = "http://www.visionbib.com/bibliography/applicat803vqa1.html#TT233922"}

@inproceedings{bb239007,
        AUTHOR = "Dua, R. and Kancheti, S.S. and Balasubramanian, V.N.",
        TITLE = "Beyond VQA: Generating Multi-word Answers and Rationales to Visual
Questions",
        BOOKTITLE = MULA21,
        YEAR = "2021",
        PAGES = "1623-1632",
        BIBSOURCE = "http://www.visionbib.com/bibliography/applicat803vqa1.html#TT233923"}

@inproceedings{bb239008,
        AUTHOR = "Rahman, T. and Chou, S.H. and Sigal, L. and Carenini, G.",
        TITLE = "An Improved Attention for Visual Question Answering",
        BOOKTITLE = MULA21,
        YEAR = "2021",
        PAGES = "1653-1662",
        BIBSOURCE = "http://www.visionbib.com/bibliography/applicat803vqa1.html#TT233924"}

@inproceedings{bb239009,
        AUTHOR = "Jolly, S. and Palacio, S. and Folz, J. and Raue, F. and Hees, J. and Dengel, A.",
        TITLE = "P {$\approx$} NP, at least in Visual Question Answering",
        BOOKTITLE = ICPR21,
        YEAR = "2021",
        PAGES = "2748-2754",
        BIBSOURCE = "http://www.visionbib.com/bibliography/applicat803vqa1.html#TT233925"}

@inproceedings{bb239010,
        AUTHOR = "Mishra, A. and Anand, A. and Guha, P.",
        TITLE = "Multi-stage Attention based Visual Question Answering",
        BOOKTITLE = ICPR21,
        YEAR = "2021",
        PAGES = "9407-9414",
        BIBSOURCE = "http://www.visionbib.com/bibliography/applicat803vqa1.html#TT233926"}

@inproceedings{bb239011,
        AUTHOR = "Bozinis, T. and Passalis, N. and Tefas, A.",
        TITLE = "Improving Visual Question Answering using Active Perception on Static
Images",
        BOOKTITLE = ICPR21,
        YEAR = "2021",
        PAGES = "879-884",
        BIBSOURCE = "http://www.visionbib.com/bibliography/applicat803vqa1.html#TT233927"}

@inproceedings{bb239012,
        AUTHOR = "Sun, Q. and Xie, B.H. and Fu, Y.W.",
        TITLE = "Second Order Enhanced Multi-Glimpse Attention in Visual Question
Answering",
        BOOKTITLE = ACCV20,
        YEAR = "2020",
        PAGES = "IV:87-103",
        BIBSOURCE = "http://www.visionbib.com/bibliography/applicat803vqa1.html#TT233928"}

@inproceedings{bb239013,
        AUTHOR = "Goel, V. and Chandak, M. and Anand, A. and Guha, P.",
        TITLE = "IQ-VQA: Intelligent Visual Question Answering",
        BOOKTITLE = VTIUR20,
        YEAR = "2020",
        PAGES = "357-370",
        BIBSOURCE = "http://www.visionbib.com/bibliography/applicat803vqa1.html#TT233929"}

@inproceedings{bb239014,
        AUTHOR = "Qiao, Y. and Yu, Z. and Liu, J.",
        TITLE = "VC-VQA: Visual Calibration Mechanism For Visual Question Answering",
        BOOKTITLE = ICIP20,
        YEAR = "2020",
        PAGES = "1481-1485",
        BIBSOURCE = "http://www.visionbib.com/bibliography/applicat803vqa1.html#TT233930"}

@inproceedings{bb239015,
        AUTHOR = "Tang, R.X. and Ma, C. and Zhang, W.E. and Wu, Q. and Yang, X.K.",
        TITLE = "Semantic Equivalent Adversarial Data Augmentation for Visual Question
Answering",
        BOOKTITLE = ECCV20,
        YEAR = "2020",
        PAGES = "XIX:437-453",
        BIBSOURCE = "http://www.visionbib.com/bibliography/applicat803vqa1.html#TT233931"}

@inproceedings{bb239016,
        AUTHOR = "Gokhale, T. and Banerjee, P. and Baral, C. and Yang, Y.Z.",
        TITLE = "VQA-LOL: Visual Question Answering Under the Lens of Logic",
        BOOKTITLE = ECCV20,
        YEAR = "2020",
        PAGES = "XXI:379-396",
        BIBSOURCE = "http://www.visionbib.com/bibliography/applicat803vqa1.html#TT233932"}

@inproceedings{bb239017,
        AUTHOR = "Yang, X.F. and Lin, G.S. and Lv, F.M. and Liu, F.Y.",
        TITLE = "{TRRNet}: Tiered Relation Reasoning for Compositional Visual Question Answering",
        BOOKTITLE = ECCV20,
        YEAR = "2020",
        PAGES = "XXI:414-430",
        BIBSOURCE = "http://www.visionbib.com/bibliography/applicat803vqa1.html#TT233933"}

@inproceedings{bb239018,
        AUTHOR = "Bansal, A. and Zhang, Y. and Chellappa, R.",
        TITLE = "Visual Question Answering on Image Sets",
        BOOKTITLE = ECCV20,
        YEAR = "2020",
        PAGES = "XXI:51-67",
        BIBSOURCE = "http://www.visionbib.com/bibliography/applicat803vqa1.html#TT233934"}

@inproceedings{bb239019,
        AUTHOR = "Han, X.Z. and Wang, S.H. and Su, C. and Zhang, W.G. and Huang, Q.M. and Tian, Q.",
        TITLE = "Interpretable Visual Reasoning via Probabilistic Formulation Under
Natural Supervision",
        BOOKTITLE = ECCV20,
        YEAR = "2020",
        PAGES = "IX:553-570",
        BIBSOURCE = "http://www.visionbib.com/bibliography/applicat803vqa1.html#TT233935"}

@inproceedings{bb239020,
        AUTHOR = "Li, Q. and Huang, S.Y. and Hong, Y. and Zhu, S.C.",
        TITLE = "A Competence-aware Curriculum for Visual Concepts Learning via Question
Answering",
        BOOKTITLE = ECCV20,
        YEAR = "2020",
        PAGES = "II:141-157",
        BIBSOURCE = "http://www.visionbib.com/bibliography/applicat803vqa1.html#TT233936"}

@inproceedings{bb239021,
        AUTHOR = "Bajaj, G. and Bandyopadhyay, B. and Schmidt, D. and Maneriker, P. and Myers, C. and Parthasarathy, S.",
        TITLE = "Understanding Knowledge Gaps in Visual Question Answering:
Implications for Gap Identification and Testing",
        BOOKTITLE = MVM20,
        YEAR = "2020",
        PAGES = "1563-1566",
        BIBSOURCE = "http://www.visionbib.com/bibliography/applicat803vqa1.html#TT233937"}

@inproceedings{bb239022,
        AUTHOR = "Vatashsky, B. and Ullman, S.",
        TITLE = "VQA With No Questions-Answers Training",
        BOOKTITLE = CVPR20,
        YEAR = "2020",
        PAGES = "10373-10383",
        BIBSOURCE = "http://www.visionbib.com/bibliography/applicat803vqa1.html#TT233938"}

@inproceedings{bb239023,
        AUTHOR = "Jiang, H. and Misra, I. and Rohrbach, M. and Learned-Miller, E.G. and Chen, X.",
        TITLE = "In Defense of Grid Features for Visual Question Answering",
        BOOKTITLE = CVPR20,
        YEAR = "2020",
        PAGES = "10264-10273",
        BIBSOURCE = "http://www.visionbib.com/bibliography/applicat803vqa1.html#TT233939"}

@inproceedings{bb239024,
        AUTHOR = "Wang, X. and Liu, Y. and Shen, C. and Ng, C.C. and Luo, C. and Jin, L. and Chan, C.S. and van den Hengel, A. and Wang, L.",
        TITLE = "On the General Value of Evidence, and Bilingual Scene-Text Visual
Question Answering",
        BOOKTITLE = CVPR20,
        YEAR = "2020",
        PAGES = "10123-10132",
        BIBSOURCE = "http://www.visionbib.com/bibliography/applicat803vqa1.html#TT233940"}

@inproceedings{bb239025,
        AUTHOR = "Xiong, P. and Wu, Y.",
        TITLE = "TA-Student VQA: Multi-Agents Training by Self-Questioning",
        BOOKTITLE = CVPR20,
        YEAR = "2020",
        PAGES = "10062-10072",
        BIBSOURCE = "http://www.visionbib.com/bibliography/applicat803vqa1.html#TT233941"}

@inproceedings{bb239026,
        AUTHOR = "Agarwal, V. and Shetty, R. and Fritz, M.",
        TITLE = "Towards Causal VQA: Revealing and Reducing Spurious Correlations by
Invariant and Covariant Semantic Editing",
        BOOKTITLE = CVPR20,
        YEAR = "2020",
        PAGES = "9687-9695",
        BIBSOURCE = "http://www.visionbib.com/bibliography/applicat803vqa1.html#TT233942"}

@inproceedings{bb239027,
        AUTHOR = "Kafle, K. and Shrestha, R. and Price, B. and Cohen, S. and Kanan, C.",
        TITLE = "Answering Questions about Data Visualizations using Efficient Bimodal
Fusion",
        BOOKTITLE = WACV20,
        YEAR = "2020",
        PAGES = "1487-1496",
        BIBSOURCE = "http://www.visionbib.com/bibliography/applicat803vqa1.html#TT233943"}

@inproceedings{bb239028,
        AUTHOR = "Patro, B.N. and Patel, S. and Namboodiri, V.P.",
        TITLE = "Robust Explanations for Visual Question Answering",
        BOOKTITLE = WACV20,
        YEAR = "2020",
        PAGES = "1566-1575",
        BIBSOURCE = "http://www.visionbib.com/bibliography/applicat803vqa1.html#TT233944"}

@inproceedings{bb239029,
        AUTHOR = "Chou, S. and Chao, W. and Lai, W. and Sun, M. and Yang, M.",
        TITLE = "Visual Question Answering on 360{$^\circ$} Images",
        BOOKTITLE = WACV20,
        YEAR = "2020",
        PAGES = "1596-1605",
        BIBSOURCE = "http://www.visionbib.com/bibliography/applicat803vqa1.html#TT233945"}

@inproceedings{bb239030,
        AUTHOR = "Chaudhry, R. and Shekhar, S. and Gupta, U. and Maneriker, P. and Bansal, P. and Joshi, A.",
        TITLE = "LEAF-QA: Locate, Encode \& Attend for Figure Question Answering",
        BOOKTITLE = WACV20,
        YEAR = "2020",
        PAGES = "3501-3510",
        BIBSOURCE = "http://www.visionbib.com/bibliography/applicat803vqa1.html#TT233946"}

@inproceedings{bb239031,
        AUTHOR = "Liang, Y.Z. and Bai, Y.L. and Zhang, W. and Qian, X.M. and Zhu, L. and Mei, T.",
        TITLE = "VrR-VG: Refocusing Visually-Relevant Relationships",
        BOOKTITLE = ICCV19,
        YEAR = "2019",
        PAGES = "10402-10411",
        BIBSOURCE = "http://www.visionbib.com/bibliography/applicat803vqa1.html#TT233947"}

@inproceedings{bb239032,
        AUTHOR = "Bhattacharya, N. and Li, Q. and Gurari, D.",
        TITLE = "Why Does a Visual Question Have Different Answers?",
        BOOKTITLE = ICCV19,
        YEAR = "2019",
        PAGES = "4270-4279",
        BIBSOURCE = "http://www.visionbib.com/bibliography/applicat803vqa1.html#TT233948"}

@inproceedings{bb239033,
        AUTHOR = "Li, L.J. and Gan, Z. and Cheng, Y. and Liu, J.J.",
        TITLE = "Relation-Aware Graph Attention Network for Visual Question Answering",
        BOOKTITLE = ICCV19,
        YEAR = "2019",
        PAGES = "10312-10321",
        BIBSOURCE = "http://www.visionbib.com/bibliography/applicat803vqa1.html#TT233949"}

@inproceedings{bb239034,
        AUTHOR = "Do, T. and Tran, H. and Do, T. and Tjiputra, E. and Tran, Q.",
        TITLE = "Compact Trilinear Interaction for Visual Question Answering",
        BOOKTITLE = ICCV19,
        YEAR = "2019",
        PAGES = "392-401",
        BIBSOURCE = "http://www.visionbib.com/bibliography/applicat803vqa1.html#TT233950"}

@inproceedings{bb239035,
        AUTHOR = "Schwartz, I. and Yu, S. and Hazan, T. and Schwing, A.G.",
        TITLE = "Factor Graph Attention",
        BOOKTITLE = CVPR19,
        YEAR = "2019",
        PAGES = "2039-2048",
        BIBSOURCE = "http://www.visionbib.com/bibliography/applicat803vqa1.html#TT233951"}

@inproceedings{bb239036,
        AUTHOR = "Kolesnikov, A. and Beyer, L. and Zhai, X.H. and Puigcerver, J. and Yung, J. and Gelly, S. and Houlsby, N.",
        TITLE = "Big Transfer ({BiT}): General Visual Representation Learning",
        BOOKTITLE = ECCV20,
        YEAR = "2020",
        PAGES = "V:491-507",
        BIBSOURCE = "http://www.visionbib.com/bibliography/applicat803vqa1.html#TT233952"}

@inproceedings{bb239037,
        AUTHOR = "Kolesnikov, A. and Zhai, X.H. and Beyer, L.",
        TITLE = "Revisiting Self-Supervised Visual Representation Learning",
        BOOKTITLE = CVPR19,
        YEAR = "2019",
        PAGES = "1920-1929",
        BIBSOURCE = "http://www.visionbib.com/bibliography/applicat803vqa1.html#TT233953"}

@inproceedings{bb239038,
        AUTHOR = "Xiong, P.X. and Zhan, H.Y. and Wang, X. and Sinha, B. and Wu, Y.",
        TITLE = "Visual Query Answering by Entity-Attribute Graph Matching and Reasoning",
        BOOKTITLE = CVPR19,
        YEAR = "2019",
        PAGES = "8349-8358",
        BIBSOURCE = "http://www.visionbib.com/bibliography/applicat803vqa1.html#TT233954"}

@inproceedings{bb239039,
        AUTHOR = "Singh, A. and Natarajan, V. and Shah, M. and Jiang, Y. and Chen, X.L. and Batra, D. and Parikh, D. and Rohrbach, M.",
        TITLE = "Towards VQA Models That Can Read",
        BOOKTITLE = CVPR19,
        YEAR = "2019",
        PAGES = "8309-8318",
        BIBSOURCE = "http://www.visionbib.com/bibliography/applicat803vqa1.html#TT233955"}

@inproceedings{bb239040,
        AUTHOR = "Manjunatha, V. and Saini, N. and Davis, L.S.",
        TITLE = "Explicit Bias Discovery in Visual Question Answering Models",
        BOOKTITLE = CVPR19,
        YEAR = "2019",
        PAGES = "9554-9563",
        BIBSOURCE = "http://www.visionbib.com/bibliography/applicat803vqa1.html#TT233956"}

@inproceedings{bb239041,
        AUTHOR = "Shrestha, R. and Kafle, K. and Kanan, C.",
        TITLE = "Answer Them All! Toward Universal Visual Question Answering Models",
        BOOKTITLE = CVPR19,
        YEAR = "2019",
        PAGES = "10464-10473",
        BIBSOURCE = "http://www.visionbib.com/bibliography/applicat803vqa1.html#TT233957"}

@inproceedings{bb239042,
        AUTHOR = "Noh, H. and Kim, T. and Mun, J. and Han, B.H.",
        TITLE = "Transfer Learning via Unsupervised Task Discovery for Visual Question
Answering",
        BOOKTITLE = CVPR19,
        YEAR = "2019",
        PAGES = "8377-8386",
        BIBSOURCE = "http://www.visionbib.com/bibliography/applicat803vqa1.html#TT233958"}

@inproceedings{bb239043,
        AUTHOR = "Wijmans, E. and Datta, S. and Maksymets, O. and Das, A. and Gkioxari, G. and Lee, S. and Essa, I. and Parikh, D. and Batra, D.",
        TITLE = "Embodied Question Answering in Photorealistic Environments With Point
Cloud Perception",
        BOOKTITLE = CVPR19,
        YEAR = "2019",
        PAGES = "6652-6661",
        BIBSOURCE = "http://www.visionbib.com/bibliography/applicat803vqa1.html#TT233959"}

@inproceedings{bb239044,
        AUTHOR = "Shah, M. and Chen, X.L. and Rohrbach, M. and Parikh, D.",
        TITLE = "Cycle-Consistency for Robust Visual Question Answering",
        BOOKTITLE = CVPR19,
        YEAR = "2019",
        PAGES = "6642-6651",
        BIBSOURCE = "http://www.visionbib.com/bibliography/applicat803vqa1.html#TT233960"}

@inproceedings{bb239045,
        AUTHOR = "Li, H. and Wang, P. and Shen, C.H. and van den Hengel, A.",
        TITLE = "Visual Question Answering as Reading Comprehension",
        BOOKTITLE = CVPR19,
        YEAR = "2019",
        PAGES = "6312-6321",
        BIBSOURCE = "http://www.visionbib.com/bibliography/applicat803vqa1.html#TT233961"}

@inproceedings{bb239046,
        AUTHOR = "Yu, L.C. and Chen, X.L. and Gkioxari, G. and Bansal, M. and Berg, T.L. and Batra, D.",
        TITLE = "Multi-Target Embodied Question Answering",
        BOOKTITLE = CVPR19,
        YEAR = "2019",
        PAGES = "6302-6311",
        BIBSOURCE = "http://www.visionbib.com/bibliography/applicat803vqa1.html#TT233962"}

@inproceedings{bb239047,
        AUTHOR = "Yu, Z. and Yu, J. and Cui, Y.H. and Tao, D.C. and Tian, Q.",
        TITLE = "Deep Modular Co-Attention Networks for Visual Question Answering",
        BOOKTITLE = CVPR19,
        YEAR = "2019",
        PAGES = "6274-6283",
        BIBSOURCE = "http://www.visionbib.com/bibliography/applicat803vqa1.html#TT233963"}

@inproceedings{bb239048,
        AUTHOR = "Abbasnejad, E. and Wu, Q. and Shi, Q.F. and van den Hengel, A.",
        TITLE = "What's to Know? Uncertainty as a Guide to Asking Goal-Oriented
Questions",
        BOOKTITLE = CVPR19,
        YEAR = "2019",
        PAGES = "4150-4159",
        BIBSOURCE = "http://www.visionbib.com/bibliography/applicat803vqa1.html#TT233964"}

@inproceedings{bb239049,
        AUTHOR = "Schwenk, D. and Khandelwal, A. and Clark, C. and Marino, K. and Mottaghi, R.",
        TITLE = "A-OKVQA: A Benchmark for Visual Question Answering Using World
Knowledge",
        BOOKTITLE = ECCV22,
        YEAR = "2022",
        PAGES = "VIII:146-162",
        BIBSOURCE = "http://www.visionbib.com/bibliography/applicat803vqa1.html#TT233965"}

@inproceedings{bb239050,
        AUTHOR = "Marino, K. and Rastegari, M. and Farhadi, A. and Mottaghi, R.",
        TITLE = "OK-VQA: A Visual Question Answering Benchmark Requiring External
Knowledge",
        BOOKTITLE = CVPR19,
        YEAR = "2019",
        PAGES = "3190-3199",
        BIBSOURCE = "http://www.visionbib.com/bibliography/applicat803vqa1.html#TT233966"}

@inproceedings{bb239051,
        AUTHOR = "Krishna, R. and Bernstein, M. and Fei-Fei, L.",
        TITLE = "Information Maximizing Visual Question Generation",
        BOOKTITLE = CVPR19,
        YEAR = "2019",
        PAGES = "2008-2018",
        BIBSOURCE = "http://www.visionbib.com/bibliography/applicat803vqa1.html#TT233967"}

@inproceedings{bb239052,
        AUTHOR = "Haurilet, M. and Roitberg, A. and Stiefelhagen, R.",
        TITLE = "It's Not About the Journey; It's About the Destination: Following Soft
Paths Under Question-Guidance for Visual Reasoning",
        BOOKTITLE = CVPR19,
        YEAR = "2019",
        PAGES = "1930-1939",
        BIBSOURCE = "http://www.visionbib.com/bibliography/applicat803vqa1.html#TT233968"}

@inproceedings{bb239053,
        AUTHOR = "Qiu, Y. and Satoh, Y. and Suzuki, R. and Kataoka, H.",
        TITLE = "Incorporating 3D Information Into Visual Question Answering",
        BOOKTITLE = "3DV19",
        YEAR = "2019",
        PAGES = "756-765",
        BIBSOURCE = "http://www.visionbib.com/bibliography/applicat803vqa1.html#TT233969"}

@inproceedings{bb239054,
        AUTHOR = "Liu, F. and Liu, J. and Fang, Z. and Lu, H.",
        TITLE = "Language and Visual Relations Encoding for Visual Question Answering",
        BOOKTITLE = ICIP19,
        YEAR = "2019",
        PAGES = "3307-3311",
        BIBSOURCE = "http://www.visionbib.com/bibliography/applicat803vqa1.html#TT233970"}

@inproceedings{bb239055,
        AUTHOR = "Fang, Z.W. and Liu, J. and Tang, Q. and Li, Y. and Lu, H.Q.",
        TITLE = "Answer Distillation for Visual Question Answering",
        BOOKTITLE = ACCV18,
        YEAR = "2018",
        PAGES = "I:72-87",
        BIBSOURCE = "http://www.visionbib.com/bibliography/applicat803vqa1.html#TT233971"}

@inproceedings{bb239056,
        AUTHOR = "Kuhnle, A. and Xie, H.Y. and Copestake, A.",
        TITLE = "How Clever Is the FiLM Model, and How Clever Can it Be?",
        BOOKTITLE = VL18,
        YEAR = "2018",
        PAGES = "IV:162-172",
        BIBSOURCE = "http://www.visionbib.com/bibliography/applicat803vqa1.html#TT233972"}

@inproceedings{bb239057,
        AUTHOR = "Li, W. and Yuan, Z.H. and Fang, X.Z. and Wang, C.",
        TITLE = "Knowing Where to Look? Analysis on Attention of Visual Question
Answering System",
        BOOKTITLE = VL18,
        YEAR = "2018",
        PAGES = "IV:145-152",
        BIBSOURCE = "http://www.visionbib.com/bibliography/applicat803vqa1.html#TT233973"}

@inproceedings{bb239058,
        AUTHOR = "Wagner, M. and Basevi, H. and Shetty, R. and Li, W.B. and Malinowski, M. and Fritz, M. and Leonardis, A.",
        TITLE = "Answering Visual What-If Questions: From Actions to Predicted Scene
Descriptions",
        BOOKTITLE = VLEASE18,
        YEAR = "2018",
        PAGES = "I:521-537",
        BIBSOURCE = "http://www.visionbib.com/bibliography/applicat803vqa1.html#TT233974"}

@inproceedings{bb239059,
        AUTHOR = "Duke, B. and Taylor, G.W.",
        TITLE = "Generalized Hadamard-Product Fusion Operators for Visual Question
Answering",
        BOOKTITLE = CRV18,
        YEAR = "2018",
        PAGES = "39-46",
        BIBSOURCE = "http://www.visionbib.com/bibliography/applicat803vqa1.html#TT233975"}

@inproceedings{bb239060,
        AUTHOR = "Das, A. and Datta, S. and Gkioxari, G. and Lee, S. and Parikh, D. and Batra, D.",
        TITLE = "Embodied Question Answering",
        BOOKTITLE = CVPR18,
        YEAR = "2018",
        PAGES = "1-10",
        BIBSOURCE = "http://www.visionbib.com/bibliography/applicat803vqa1.html#TT233976"}

@inproceedings{bb239061,
        AUTHOR = "Misra, I. and Girshick, R. and Fergus, R. and Hebert, M. and Gupta, A. and van der Maaten, L.",
        TITLE = "Learning by Asking Questions",
        BOOKTITLE = CVPR18,
        YEAR = "2018",
        PAGES = "11-20",
        BIBSOURCE = "http://www.visionbib.com/bibliography/applicat803vqa1.html#TT233977"}

@inproceedings{bb239062,
        AUTHOR = "Gurari, D. and Li, Q. and Stangl, A.J. and Guo, A. and Lin, C. and Grauman, K. and Luo, J. and Bigham, J.P.",
        TITLE = "VizWiz Grand Challenge: Answering Visual Questions from Blind People",
        BOOKTITLE = CVPR18,
        YEAR = "2018",
        PAGES = "3608-3617",
        BIBSOURCE = "http://www.visionbib.com/bibliography/applicat803vqa1.html#TT233978"}

@inproceedings{bb239063,
        AUTHOR = "Li, J. and Su, H. and Zhu, J. and Wang, S. and Zhang, B.",
        TITLE = "Textbook Question Answering Under Instructor Guidance with Memory
Networks",
        BOOKTITLE = CVPR18,
        YEAR = "2018",
        PAGES = "3655-3663",
        BIBSOURCE = "http://www.visionbib.com/bibliography/applicat803vqa1.html#TT233979"}

@inproceedings{bb239064,
        AUTHOR = "Gordon, D. and Kembhavi, A. and Rastegari, M. and Redmon, J. and Fox, D. and Farhadi, A.",
        TITLE = "IQA: Visual Question Answering in Interactive Environments",
        BOOKTITLE = CVPR18,
        YEAR = "2018",
        PAGES = "4089-4098",
        BIBSOURCE = "http://www.visionbib.com/bibliography/applicat803vqa1.html#TT233980"}

@inproceedings{bb239065,
        AUTHOR = "Agrawal, A. and Batra, D. and Parikh, D. and Kembhavi, A.",
        TITLE = "Don't Just Assume; Look and Answer: Overcoming Priors for Visual
Question Answering",
        BOOKTITLE = CVPR18,
        YEAR = "2018",
        PAGES = "4971-4980",
        BIBSOURCE = "http://www.visionbib.com/bibliography/applicat803vqa1.html#TT233981"}

@inproceedings{bb239066,
        AUTHOR = "Hu, H. and Chao, W. and Sha, F.",
        TITLE = "Learning Answer Embeddings for Visual Question Answering",
        BOOKTITLE = CVPR18,
        YEAR = "2018",
        PAGES = "5428-5436",
        BIBSOURCE = "http://www.visionbib.com/bibliography/applicat803vqa1.html#TT233982"}

@inproceedings{bb239067,
        AUTHOR = "Kafle, K. and Price, B. and Cohen, S. and Kanan, C.",
        TITLE = "DVQA: Understanding Data Visualizations via Question Answering",
        BOOKTITLE = CVPR18,
        YEAR = "2018",
        PAGES = "5648-5656",
        BIBSOURCE = "http://www.visionbib.com/bibliography/applicat803vqa1.html#TT233983"}

@inproceedings{bb239068,
        AUTHOR = "Chao, W. and Hu, H. and Sha, F.",
        TITLE = "Cross-Dataset Adaptation for Visual Question Answering",
        BOOKTITLE = CVPR18,
        YEAR = "2018",
        PAGES = "5716-5725",
        BIBSOURCE = "http://www.visionbib.com/bibliography/applicat803vqa1.html#TT233984"}

@inproceedings{bb239069,
        AUTHOR = "Anderson, P. and He, X. and Buehler, C. and Teney, D. and Johnson, M. and Gould, S. and Zhang, L.",
        TITLE = "Bottom-Up and Top-Down Attention for Image Captioning and Visual
Question Answering",
        BOOKTITLE = CVPR18,
        YEAR = "2018",
        PAGES = "6077-6086",
        BIBSOURCE = "http://www.visionbib.com/bibliography/applicat803vqa1.html#TT233985"}

@inproceedings{bb239070,
        AUTHOR = "Nguyen, D. and Okatani, T.",
        TITLE = "Improved Fusion of Visual and Language Representations by Dense
Symmetric Co-attention for Visual Question Answering",
        BOOKTITLE = CVPR18,
        YEAR = "2018",
        PAGES = "6087-6096",
        BIBSOURCE = "http://www.visionbib.com/bibliography/applicat803vqa1.html#TT233986"}

@inproceedings{bb239071,
        AUTHOR = "Patro, B.N. and Namboodiri, V.P.",
        TITLE = "Differential Attention for Visual Question Answering",
        BOOKTITLE = CVPR18,
        YEAR = "2018",
        PAGES = "7680-7688",
        BIBSOURCE = "http://www.visionbib.com/bibliography/applicat803vqa1.html#TT233987"}

@inproceedings{bb239072,
        AUTHOR = "Su, Z. and Zhu, C. and Dong, Y.P. and Cai, D.Q. and Chen, Y.R. and Li, J.G.",
        TITLE = "Learning Visual Knowledge Memory Networks for Visual Question
Answering",
        BOOKTITLE = CVPR18,
        YEAR = "2018",
        PAGES = "7736-7745",
        BIBSOURCE = "http://www.visionbib.com/bibliography/applicat803vqa1.html#TT233988"}

@inproceedings{bb239073,
        AUTHOR = "Das, A. and Datta, S. and Gkioxari, G. and Lee, S. and Parikh, D. and Batra, D.",
        TITLE = "Embodied Question Answering",
        BOOKTITLE = DeepLearnRV18,
        YEAR = "2018",
        PAGES = "2135-213509",
        BIBSOURCE = "http://www.visionbib.com/bibliography/applicat803vqa1.html#TT233989"}

@inproceedings{bb239074,
        AUTHOR = "Cheng, W. and Huang, Y. and Wang, L.",
        TITLE = "Towards Unconstrained Pointing Problem of Visual Question Answering:
A Retrieval-based Method",
        BOOKTITLE = ICPR18,
        YEAR = "2018",
        PAGES = "3303-3308",
        BIBSOURCE = "http://www.visionbib.com/bibliography/applicat803vqa1.html#TT233990"}

@inproceedings{bb239075,
        AUTHOR = "Zhou, B. and Sun, Y.Y. and Bau, D. and Torralba, A.B.",
        TITLE = "Interpretable Basis Decomposition for Visual Explanation",
        BOOKTITLE = ECCV18,
        YEAR = "2018",
        PAGES = "VIII:122-138",
        BIBSOURCE = "http://www.visionbib.com/bibliography/applicat803vqa1.html#TT233991"}

@inproceedings{bb239076,
        AUTHOR = "Shi, Y. and Furlanello, T. and Zha, S. and Anandkumar, A.",
        TITLE = "Question Type Guided Attention in Visual Question Answering",
        BOOKTITLE = ECCV18,
        YEAR = "2018",
        PAGES = "II:158-175",
        BIBSOURCE = "http://www.visionbib.com/bibliography/applicat803vqa1.html#TT233992"}

@inproceedings{bb239077,
        AUTHOR = "Narasimhan, M. and Schwing, A.G.",
        TITLE = "Straight to the Facts: Learning Knowledge Base Retrieval for Factual
Visual Question Answering",
        BOOKTITLE = ECCV18,
        YEAR = "2018",
        PAGES = "VIII:460-477",
        BIBSOURCE = "http://www.visionbib.com/bibliography/applicat803vqa1.html#TT233993"}

@inproceedings{bb239078,
        AUTHOR = "Malinowski, M. and Doersch, C. and Santoro, A. and Battaglia, P.",
        TITLE = "Learning Visual Question Answering by Bootstrapping Hard Attention",
        BOOKTITLE = ECCV18,
        YEAR = "2018",
        PAGES = "VI:3-20",
        BIBSOURCE = "http://www.visionbib.com/bibliography/applicat803vqa1.html#TT233994"}

@inproceedings{bb239079,
        AUTHOR = "Li, Q. and Tao, Q.Y. and Joty, S. and Cai, J.F. and Luo, J.B.",
        TITLE = "VQA-E: Explaining, Elaborating, and Enhancing Your Answers for Visual
Questions",
        BOOKTITLE = ECCV18,
        YEAR = "2018",
        PAGES = "VII:570-586",
        BIBSOURCE = "http://www.visionbib.com/bibliography/applicat803vqa1.html#TT233995"}

@inproceedings{bb239080,
        AUTHOR = "Yu, D. and Gao, X. and Xiong, H.",
        TITLE = "Structured Semantic Representation for Visual Question Answering",
        BOOKTITLE = ICIP18,
        YEAR = "2018",
        PAGES = "2286-2290",
        BIBSOURCE = "http://www.visionbib.com/bibliography/applicat803vqa1.html#TT233996"}

@inproceedings{bb239081,
        AUTHOR = "Huang, L. and Kulkarni, K. and Jha, A. and Lohit, S. and Jayasuriya, S. and Turaga, P.K.",
        TITLE = "CS-VQA: Visual Question Answering with Compressively Sensed Images",
        BOOKTITLE = ICIP18,
        YEAR = "2018",
        PAGES = "1283-1287",
        BIBSOURCE = "http://www.visionbib.com/bibliography/applicat803vqa1.html#TT233997"}

@inproceedings{bb239082,
        AUTHOR = "Desta, M.T. and Chen, L. and Kornuta, T.",
        TITLE = "Object-Based Reasoning in VQA",
        BOOKTITLE = WACV18,
        YEAR = "2018",
        PAGES = "1814-1823",
        BIBSOURCE = "http://www.visionbib.com/bibliography/applicat803vqa1.html#TT233998"}

@inproceedings{bb239083,
        AUTHOR = "Zhao, H. and Fan, Q. and Gutfreund, D. and Fu, Y.",
        TITLE = "Semantically Guided Visual Question Answering",
        BOOKTITLE = WACV18,
        YEAR = "2018",
        PAGES = "1852-1860",
        BIBSOURCE = "http://www.visionbib.com/bibliography/applicat803vqa1.html#TT233999"}

@inproceedings{bb239084,
        AUTHOR = "Wang, Z. and Liu, X. and Wang, L. and Qiao, Y. and Xie, X. and Fowlkes, C.C.",
        TITLE = "Structured Triplet Learning with POS-Tag Guided Attention for Visual
Question Answering",
        BOOKTITLE = WACV18,
        YEAR = "2018",
        PAGES = "1888-1896",
        BIBSOURCE = "http://www.visionbib.com/bibliography/applicat803vqa1.html#TT234000"}

@inproceedings{bb239085,
        AUTHOR = "Chowdhury, I. and Nguyen, K. and Fookes, C. and Sridharan, S.",
        TITLE = "A cascaded long short-term memory (LSTM) driven generic visual
question answering (VQA)",
        BOOKTITLE = ICIP17,
        YEAR = "2017",
        PAGES = "1842-1846",
        BIBSOURCE = "http://www.visionbib.com/bibliography/applicat803vqa1.html#TT234001"}

@inproceedings{bb239086,
        AUTHOR = "Jain, U. and Zhang, Z.Y. and Schwing, A.G.",
        TITLE = "Creativity: Generating Diverse Questions Using Variational
Autoencoders",
        BOOKTITLE = CVPR17,
        YEAR = "2017",
        PAGES = "5415-5424",
        BIBSOURCE = "http://www.visionbib.com/bibliography/applicat803vqa1.html#TT234002"}

@inproceedings{bb239087,
        AUTHOR = "Zhu, Y. and Lim, J.J. and Fei-Fei, L.",
        TITLE = "Knowledge Acquisition for Visual Question Answering via Iterative
Querying",
        BOOKTITLE = CVPR17,
        YEAR = "2017",
        PAGES = "6146-6155",
        BIBSOURCE = "http://www.visionbib.com/bibliography/applicat803vqa1.html#TT234003"}

@inproceedings{bb239088,
        AUTHOR = "Lin, Y. T. and Pang, Z. Y. and Li, Y. and Wang, D. H.",
        TITLE = "Simple and effective visual question answering in a single modality",
        BOOKTITLE = ICIP16,
        YEAR = "2016",
        PAGES = "2276--2280",
        BIBSOURCE = "http://www.visionbib.com/bibliography/applicat803vqa1.html#TT234004"}

@inproceedings{bb239089,
        AUTHOR = "Ganju, S. and Russakovsky, O. and Gupta, A.",
        TITLE = "What's in a Question:
Using Visual Questions as a Form of Supervision",
        BOOKTITLE = CVPR17,
        YEAR = "2017",
        PAGES = "6422--6431",
        BIBSOURCE = "http://www.visionbib.com/bibliography/applicat803vqa1.html#TT234005"}

@inproceedings{bb239090,
        AUTHOR = "Xu, H. J. and Saenko, K.",
        TITLE = "Ask, Attend and Answer:
Exploring Question-Guided Spatial Attention for Visual Question Answering",
        BOOKTITLE = ECCV16,
        VOLUME = "VII",
        YEAR = "2016",
        PAGES = "451--466",
        BIBSOURCE = "http://www.visionbib.com/bibliography/applicat803vqa1.html#TT234006"}

@inproceedings{bb239091,
        AUTHOR = "Jabri, A. and Joulin, A. and van der Maaten, L.",
        TITLE = "Revisiting Visual Question Answering Baselines",
        BOOKTITLE = ECCV16,
        VOLUME = "VIII",
        YEAR = "2016",
        PAGES = "727--739",
        BIBSOURCE = "http://www.visionbib.com/bibliography/applicat803vqa1.html#TT234007"}

@inproceedings{bb239092,
        AUTHOR = "Yang, Z. C. and He, X. D. and Gao, J. F. and Deng, L. and Smola, A.",
        TITLE = "Stacked Attention Networks for Image Question Answering",
        BOOKTITLE = CVPR16,
        YEAR = "2016",
        PAGES = "21--29",
        BIBSOURCE = "http://www.visionbib.com/bibliography/applicat803vqa1.html#TT234008"}

@inproceedings{bb239093,
        AUTHOR = "Sadeghi, F. and Divvala, S. K. and Farhadi, A.",
        TITLE = "{VisKE}: Visual knowledge extraction and question answering by visual
verification of relation phrases",
        BOOKTITLE = CVPR15,
        YEAR = "2015",
        PAGES = "1456--1464",
        BIBSOURCE = "http://www.visionbib.com/bibliography/applicat803vqa1.html#TT234009"}

@inproceedings{bb239094,
        AUTHOR = "Liu, Y. and Liu, J. and Wang, D. and Cheng, J.",
        TITLE = "A robust multivariate reranking algorithm for Question Answering
enrichment",
        BOOKTITLE = ICIP12,
        YEAR = "2012",
        PAGES = "1917--1920",
        BIBSOURCE = "http://www.visionbib.com/bibliography/applicat803vqa1.html#TT234010"}

@inproceedings{bb239095,
        AUTHOR = "Varekamp, C. and van de Walle, P. and de Putter, M.",
        TITLE = "Question interface for {3D} picture creation on an autostereoscopic
digital picture frame",
        BOOKTITLE = "3DTV09",
        YEAR = "2009",
        PAGES = "1--4",
        BIBSOURCE = "http://www.visionbib.com/bibliography/applicat803vqa1.html#TT234011"}

@article{bb239096,
        AUTHOR = "Osman, A. and Samek, W.",
        TITLE = "{DRAU}: Dual Recurrent Attention Units for Visual Question Answering",
        JOURNAL = CVIU,
        VOLUME = "185",
        YEAR = "2019",
        PAGES = "24--30",
        BIBSOURCE = "http://www.visionbib.com/bibliography/applicat803mmovqa5.html#TT234012"}

@article{bb239097,
        AUTHOR = "Li, W. and Sun, J. H. and Liu, G. and Zhao, L. L. and Fang, X. Z.",
        TITLE = "Visual question answering with attention transfer and a cross-modal
gating mechanism",
        JOURNAL = PRL,
        VOLUME = "133",
        YEAR = "2020",
        PAGES = "334--340",
        BIBSOURCE = "http://www.visionbib.com/bibliography/applicat803mmovqa5.html#TT234013"}

@article{bb239098,
        AUTHOR = "Yu, J. and Zhu, Z. H. and Wang, Y. J. and Zhang, W. F. and Hu, Y. and Tan, J. L.",
        TITLE = "Cross-modal knowledge reasoning for knowledge-based visual question
answering",
        JOURNAL = PR,
        VOLUME = "108",
        YEAR = "2020",
        PAGES = "107563",
        BIBSOURCE = "http://www.visionbib.com/bibliography/applicat803mmovqa5.html#TT234014"}

@inproceedings{bb239099,
        AUTHOR = "Yang, Z. Q. and Qin, Z. C. and Yu, J. and Wan, T.",
        TITLE = "Prior Visual Relationship Reasoning For Visual Question Answering",
        BOOKTITLE = ICIP20,
        YEAR = "2020",
        PAGES = "1411--1415",
        BIBSOURCE = "http://www.visionbib.com/bibliography/applicat803mmovqa5.html#TT234015"}

Last update: Jan 23, 2026 at 20:54:10