@inproceedings{bb239000,
AUTHOR = "Qi, Y. G. and Zhang, K. and Sain, A. and Song, Y. Z.",
TITLE = "{PQA}: Perceptual Question Answering",
BOOKTITLE = CVPR21,
YEAR = "2021",
PAGES = "12051--12059",
BIBSOURCE = "http://www.visionbib.com/bibliography/applicat803vqa1.html#TT233916"}
@inproceedings{bb239001,
AUTHOR = "Yuan, Y. Y. and Wang, S. and Jiang, M. Y. and Chen, T. Y.",
TITLE = "Perception Matters: Detecting Perception Failures of {VQA} Models Using
Metamorphic Testing",
BOOKTITLE = CVPR21,
YEAR = "2021",
PAGES = "16903--16912",
BIBSOURCE = "http://www.visionbib.com/bibliography/applicat803vqa1.html#TT233917"}
@inproceedings{bb239002,
AUTHOR = "Marino, K. and Chen, X. L. and Parikh, D. and Gupta, A. and Rohrbach, M.",
TITLE = "{KRISP}: Integrating Implicit and Symbolic Knowledge for Open-Domain
Knowledge-Based {VQA}",
BOOKTITLE = CVPR21,
YEAR = "2021",
PAGES = "14106--14116",
BIBSOURCE = "http://www.visionbib.com/bibliography/applicat803vqa1.html#TT233918"}
@inproceedings{bb239003,
AUTHOR = "Niu, Y. and Tang, K. and Zhang, H. W. and Lu, Z. W. and Hua, X. S. and Wen, J. R.",
TITLE = "Counterfactual {VQA}: A Cause-Effect Look at Language Bias",
BOOKTITLE = CVPR21,
YEAR = "2021",
PAGES = "12695--12705",
BIBSOURCE = "http://www.visionbib.com/bibliography/applicat803vqa1.html#TT233919"}
@inproceedings{bb239004,
AUTHOR = "Yang, Z. Y. and Lu, Y. J. and Wang, J. F. and Yin, X. and Florencio, D. and Wang, L. J. and Zhang, C. and Zhang, L. and Luo, J. B.",
TITLE = "{TAP}: Text-Aware Pre-training for Text-{VQA} and Text-Caption",
BOOKTITLE = CVPR21,
YEAR = "2021",
PAGES = "8747--8757",
BIBSOURCE = "http://www.visionbib.com/bibliography/applicat803vqa1.html#TT233920"}
@inproceedings{bb239005,
AUTHOR = "Kervadec, C. and Jaunet, T. and Antipov, G. and Baccouche, M. and Vuillemot, R. and Wolf, C.",
TITLE = "How Transferable are Reasoning Patterns in {VQA}?",
BOOKTITLE = CVPR21,
YEAR = "2021",
PAGES = "4205--4214",
BIBSOURCE = "http://www.visionbib.com/bibliography/applicat803vqa1.html#TT233921"}
% The Unicode ellipsis is written as a LaTeX macro so classic 8-bit BibTeX handles it.
@inproceedings{bb239006,
AUTHOR = "Kervadec, C. and Antipov, G. and Baccouche, M. and Wolf, C.",
TITLE = "Roses are Red, Violets are Blue{\ldots} But Should {VQA} expect Them To?",
BOOKTITLE = CVPR21,
YEAR = "2021",
PAGES = "2775--2784",
BIBSOURCE = "http://www.visionbib.com/bibliography/applicat803vqa1.html#TT233922"}
@inproceedings{bb239007,
AUTHOR = "Dua, R. and Kancheti, S. S. and Balasubramanian, V. N.",
TITLE = "Beyond {VQA}: Generating Multi-word Answers and Rationales to Visual
Questions",
BOOKTITLE = MULA21,
YEAR = "2021",
PAGES = "1623--1632",
BIBSOURCE = "http://www.visionbib.com/bibliography/applicat803vqa1.html#TT233923"}
@inproceedings{bb239008,
AUTHOR = "Rahman, T. and Chou, S. H. and Sigal, L. and Carenini, G.",
TITLE = "An Improved Attention for Visual Question Answering",
BOOKTITLE = MULA21,
YEAR = "2021",
PAGES = "1653--1662",
BIBSOURCE = "http://www.visionbib.com/bibliography/applicat803vqa1.html#TT233924"}
% NOTE(review): the source had a stray spacing tilde between P and NP; this is
% presumably a mis-encoded "approximately equal" sign. Confirm against the paper.
@inproceedings{bb239009,
AUTHOR = "Jolly, S. and Palacio, S. and Folz, J. and Raue, F. and Hees, J. and Dengel, A.",
TITLE = "{P} {$\approx$} {NP}, at least in Visual Question Answering",
BOOKTITLE = ICPR21,
YEAR = "2021",
PAGES = "2748--2754",
BIBSOURCE = "http://www.visionbib.com/bibliography/applicat803vqa1.html#TT233925"}
@inproceedings{bb239010,
AUTHOR = "Mishra, A. and Anand, A. and Guha, P.",
TITLE = "Multi-stage Attention based Visual Question Answering",
BOOKTITLE = ICPR21,
YEAR = "2021",
PAGES = "9407--9414",
BIBSOURCE = "http://www.visionbib.com/bibliography/applicat803vqa1.html#TT233926"}
@inproceedings{bb239011,
AUTHOR = "Bozinis, T. and Passalis, N. and Tefas, A.",
TITLE = "Improving Visual Question Answering using Active Perception on Static
Images",
BOOKTITLE = ICPR21,
YEAR = "2021",
PAGES = "879--884",
BIBSOURCE = "http://www.visionbib.com/bibliography/applicat803vqa1.html#TT233927"}
@inproceedings{bb239012,
AUTHOR = "Sun, Q. and Xie, B. H. and Fu, Y. W.",
TITLE = "Second Order Enhanced Multi-Glimpse Attention in Visual Question
Answering",
BOOKTITLE = ACCV20,
YEAR = "2020",
PAGES = "IV:87--103",
BIBSOURCE = "http://www.visionbib.com/bibliography/applicat803vqa1.html#TT233928"}
@inproceedings{bb239013,
AUTHOR = "Goel, V. and Chandak, M. and Anand, A. and Guha, P.",
TITLE = "{IQ-VQA}: Intelligent Visual Question Answering",
BOOKTITLE = VTIUR20,
YEAR = "2020",
PAGES = "357--370",
BIBSOURCE = "http://www.visionbib.com/bibliography/applicat803vqa1.html#TT233929"}
@inproceedings{bb239014,
AUTHOR = "Qiao, Y. and Yu, Z. and Liu, J.",
TITLE = "{VC-VQA}: Visual Calibration Mechanism For Visual Question Answering",
BOOKTITLE = ICIP20,
YEAR = "2020",
PAGES = "1481--1485",
BIBSOURCE = "http://www.visionbib.com/bibliography/applicat803vqa1.html#TT233930"}
@inproceedings{bb239015,
AUTHOR = "Tang, R. X. and Ma, C. and Zhang, W. E. and Wu, Q. and Yang, X. K.",
TITLE = "Semantic Equivalent Adversarial Data Augmentation for Visual Question
Answering",
BOOKTITLE = ECCV20,
YEAR = "2020",
PAGES = "XIX:437--453",
BIBSOURCE = "http://www.visionbib.com/bibliography/applicat803vqa1.html#TT233931"}
@inproceedings{bb239016,
AUTHOR = "Gokhale, T. and Banerjee, P. and Baral, C. and Yang, Y. Z.",
TITLE = "{VQA-LOL}: Visual Question Answering Under the Lens of Logic",
BOOKTITLE = ECCV20,
YEAR = "2020",
PAGES = "XXI:379--396",
BIBSOURCE = "http://www.visionbib.com/bibliography/applicat803vqa1.html#TT233932"}
@inproceedings{bb239017,
AUTHOR = "Yang, X. F. and Lin, G. S. and Lv, F. M. and Liu, F. Y.",
TITLE = "{TRRNET}:
Tiered Relation Reasoning for Compositional Visual Question Answering",
BOOKTITLE = ECCV20,
YEAR = "2020",
PAGES = "XXI:414--430",
BIBSOURCE = "http://www.visionbib.com/bibliography/applicat803vqa1.html#TT233933"}
@inproceedings{bb239018,
AUTHOR = "Bansal, A. and Zhang, Y. and Chellappa, R.",
TITLE = "Visual Question Answering on Image Sets",
BOOKTITLE = ECCV20,
YEAR = "2020",
PAGES = "XXI:51--67",
BIBSOURCE = "http://www.visionbib.com/bibliography/applicat803vqa1.html#TT233934"}
@inproceedings{bb239019,
AUTHOR = "Han, X. Z. and Wang, S. H. and Su, C. and Zhang, W. G. and Huang, Q. M. and Tian, Q.",
TITLE = "Interpretable Visual Reasoning via Probabilistic Formulation Under
Natural Supervision",
BOOKTITLE = ECCV20,
YEAR = "2020",
PAGES = "IX:553--570",
BIBSOURCE = "http://www.visionbib.com/bibliography/applicat803vqa1.html#TT233935"}
@inproceedings{bb239020,
AUTHOR = "Li, Q. and Huang, S. Y. and Hong, Y. and Zhu, S. C.",
TITLE = "A Competence-aware Curriculum for Visual Concepts Learning via Question
Answering",
BOOKTITLE = ECCV20,
YEAR = "2020",
PAGES = "II:141--157",
BIBSOURCE = "http://www.visionbib.com/bibliography/applicat803vqa1.html#TT233936"}
@inproceedings{bb239021,
AUTHOR = "Bajaj, G. and Bandyopadhyay, B. and Schmidt, D. and Maneriker, P. and Myers, C. and Parthasarathy, S.",
TITLE = "Understanding Knowledge Gaps in Visual Question Answering:
Implications for Gap Identification and Testing",
BOOKTITLE = MVM20,
YEAR = "2020",
PAGES = "1563--1566",
BIBSOURCE = "http://www.visionbib.com/bibliography/applicat803vqa1.html#TT233937"}
@inproceedings{bb239022,
AUTHOR = "Vatashsky, B. and Ullman, S.",
TITLE = "{VQA} With No Questions-Answers Training",
BOOKTITLE = CVPR20,
YEAR = "2020",
PAGES = "10373--10383",
BIBSOURCE = "http://www.visionbib.com/bibliography/applicat803vqa1.html#TT233938"}
% The compound surname Learned-Miller is hyphenated; the source had dropped the hyphen.
@inproceedings{bb239023,
AUTHOR = "Jiang, H. and Misra, I. and Rohrbach, M. and Learned-Miller, E. G. and Chen, X.",
TITLE = "In Defense of Grid Features for Visual Question Answering",
BOOKTITLE = CVPR20,
YEAR = "2020",
PAGES = "10264--10273",
BIBSOURCE = "http://www.visionbib.com/bibliography/applicat803vqa1.html#TT233939"}
@inproceedings{bb239024,
AUTHOR = "Wang, X. and Liu, Y. and Shen, C. and Ng, C. C. and Luo, C. and Jin, L. and Chan, C. S. and van den Hengel, A. and Wang, L.",
TITLE = "On the General Value of Evidence, and Bilingual Scene-Text Visual
Question Answering",
BOOKTITLE = CVPR20,
YEAR = "2020",
PAGES = "10123--10132",
BIBSOURCE = "http://www.visionbib.com/bibliography/applicat803vqa1.html#TT233940"}
@inproceedings{bb239025,
AUTHOR = "Xiong, P. and Wu, Y.",
TITLE = "{TA}-Student {VQA}: Multi-Agents Training by Self-Questioning",
BOOKTITLE = CVPR20,
YEAR = "2020",
PAGES = "10062--10072",
BIBSOURCE = "http://www.visionbib.com/bibliography/applicat803vqa1.html#TT233941"}
@inproceedings{bb239026,
AUTHOR = "Agarwal, V. and Shetty, R. and Fritz, M.",
TITLE = "Towards Causal {VQA}: Revealing and Reducing Spurious Correlations by
Invariant and Covariant Semantic Editing",
BOOKTITLE = CVPR20,
YEAR = "2020",
PAGES = "9687--9695",
BIBSOURCE = "http://www.visionbib.com/bibliography/applicat803vqa1.html#TT233942"}
@inproceedings{bb239027,
AUTHOR = "Kafle, K. and Shrestha, R. and Price, B. and Cohen, S. and Kanan, C.",
TITLE = "Answering Questions about Data Visualizations using Efficient Bimodal
Fusion",
BOOKTITLE = WACV20,
YEAR = "2020",
PAGES = "1487--1496",
BIBSOURCE = "http://www.visionbib.com/bibliography/applicat803vqa1.html#TT233943"}
@inproceedings{bb239028,
AUTHOR = "Patro, B. N. and Patel, S. and Namboodiri, V. P.",
TITLE = "Robust Explanations for Visual Question Answering",
BOOKTITLE = WACV20,
YEAR = "2020",
PAGES = "1566--1575",
BIBSOURCE = "http://www.visionbib.com/bibliography/applicat803vqa1.html#TT233944"}
% The degree sign is written in math mode so classic 8-bit BibTeX handles it.
@inproceedings{bb239029,
AUTHOR = "Chou, S. and Chao, W. and Lai, W. and Sun, M. and Yang, M.",
TITLE = "Visual Question Answering on {$360^{\circ}$} Images",
BOOKTITLE = WACV20,
YEAR = "2020",
PAGES = "1596--1605",
BIBSOURCE = "http://www.visionbib.com/bibliography/applicat803vqa1.html#TT233945"}
@inproceedings{bb239030,
AUTHOR = "Chaudhry, R. and Shekhar, S. and Gupta, U. and Maneriker, P. and Bansal, P. and Joshi, A.",
TITLE = "{LEAF-QA}: Locate, Encode Attend for Figure Question Answering",
BOOKTITLE = WACV20,
YEAR = "2020",
PAGES = "3501--3510",
BIBSOURCE = "http://www.visionbib.com/bibliography/applicat803vqa1.html#TT233946"}
@inproceedings{bb239031,
AUTHOR = "Liang, Y. Z. and Bai, Y. L. and Zhang, W. and Qian, X. M. and Zhu, L. and Mei, T.",
TITLE = "{VrR-VG}: Refocusing Visually-Relevant Relationships",
BOOKTITLE = ICCV19,
YEAR = "2019",
PAGES = "10402--10411",
BIBSOURCE = "http://www.visionbib.com/bibliography/applicat803vqa1.html#TT233947"}
@inproceedings{bb239032,
AUTHOR = "Bhattacharya, N. and Li, Q. and Gurari, D.",
TITLE = "Why Does a Visual Question Have Different Answers?",
BOOKTITLE = ICCV19,
YEAR = "2019",
PAGES = "4270--4279",
BIBSOURCE = "http://www.visionbib.com/bibliography/applicat803vqa1.html#TT233948"}
@inproceedings{bb239033,
AUTHOR = "Li, L. J. and Gan, Z. and Cheng, Y. and Liu, J. J.",
TITLE = "Relation-Aware Graph Attention Network for Visual Question Answering",
BOOKTITLE = ICCV19,
YEAR = "2019",
PAGES = "10312--10321",
BIBSOURCE = "http://www.visionbib.com/bibliography/applicat803vqa1.html#TT233949"}
@inproceedings{bb239034,
AUTHOR = "Do, T. and Tran, H. and Do, T. and Tjiputra, E. and Tran, Q.",
TITLE = "Compact Trilinear Interaction for Visual Question Answering",
BOOKTITLE = ICCV19,
YEAR = "2019",
PAGES = "392--401",
BIBSOURCE = "http://www.visionbib.com/bibliography/applicat803vqa1.html#TT233950"}
@inproceedings{bb239035,
AUTHOR = "Schwartz, I. and Yu, S. and Hazan, T. and Schwing, A. G.",
TITLE = "Factor Graph Attention",
BOOKTITLE = CVPR19,
YEAR = "2019",
PAGES = "2039--2048",
BIBSOURCE = "http://www.visionbib.com/bibliography/applicat803vqa1.html#TT233951"}
@inproceedings{bb239036,
AUTHOR = "Kolesnikov, A. and Beyer, L. and Zhai, X. H. and Puigcerver, J. and Yung, J. and Gelly, S. and Houlsby, N.",
TITLE = "Big Transfer ({BIT}): General Visual Representation Learning",
BOOKTITLE = ECCV20,
YEAR = "2020",
PAGES = "V:491--507",
BIBSOURCE = "http://www.visionbib.com/bibliography/applicat803vqa1.html#TT233952"}
@inproceedings{bb239037,
AUTHOR = "Kolesnikov, A. and Zhai, X. H. and Beyer, L.",
TITLE = "Revisiting Self-Supervised Visual Representation Learning",
BOOKTITLE = CVPR19,
YEAR = "2019",
PAGES = "1920--1929",
BIBSOURCE = "http://www.visionbib.com/bibliography/applicat803vqa1.html#TT233953"}
@inproceedings{bb239038,
AUTHOR = "Xiong, P. X. and Zhan, H. Y. and Wang, X. and Sinha, B. and Wu, Y.",
TITLE = "Visual Query Answering by Entity-Attribute Graph Matching and Reasoning",
BOOKTITLE = CVPR19,
YEAR = "2019",
PAGES = "8349--8358",
BIBSOURCE = "http://www.visionbib.com/bibliography/applicat803vqa1.html#TT233954"}
@inproceedings{bb239039,
AUTHOR = "Singh, A. and Natarajan, V. and Shah, M. and Jiang, Y. and Chen, X. L. and Batra, D. and Parikh, D. and Rohrbach, M.",
TITLE = "Towards {VQA} Models That Can Read",
BOOKTITLE = CVPR19,
YEAR = "2019",
PAGES = "8309--8318",
BIBSOURCE = "http://www.visionbib.com/bibliography/applicat803vqa1.html#TT233955"}
@inproceedings{bb239040,
AUTHOR = "Manjunatha, V. and Saini, N. and Davis, L. S.",
TITLE = "Explicit Bias Discovery in Visual Question Answering Models",
BOOKTITLE = CVPR19,
YEAR = "2019",
PAGES = "9554--9563",
BIBSOURCE = "http://www.visionbib.com/bibliography/applicat803vqa1.html#TT233956"}
@inproceedings{bb239041,
AUTHOR = "Shrestha, R. and Kafle, K. and Kanan, C.",
TITLE = "Answer Them All! Toward Universal Visual Question Answering Models",
BOOKTITLE = CVPR19,
YEAR = "2019",
PAGES = "10464--10473",
BIBSOURCE = "http://www.visionbib.com/bibliography/applicat803vqa1.html#TT233957"}
@inproceedings{bb239042,
AUTHOR = "Noh, H. and Kim, T. and Mun, J. and Han, B. H.",
TITLE = "Transfer Learning via Unsupervised Task Discovery for Visual Question
Answering",
BOOKTITLE = CVPR19,
YEAR = "2019",
PAGES = "8377--8386",
BIBSOURCE = "http://www.visionbib.com/bibliography/applicat803vqa1.html#TT233958"}
@inproceedings{bb239043,
AUTHOR = "Wijmans, E. and Datta, S. and Maksymets, O. and Das, A. and Gkioxari, G. and Lee, S. and Essa, I. and Parikh, D. and Batra, D.",
TITLE = "Embodied Question Answering in Photorealistic Environments With Point
Cloud Perception",
BOOKTITLE = CVPR19,
YEAR = "2019",
PAGES = "6652--6661",
BIBSOURCE = "http://www.visionbib.com/bibliography/applicat803vqa1.html#TT233959"}
@inproceedings{bb239044,
AUTHOR = "Shah, M. and Chen, X. L. and Rohrbach, M. and Parikh, D.",
TITLE = "Cycle-Consistency for Robust Visual Question Answering",
BOOKTITLE = CVPR19,
YEAR = "2019",
PAGES = "6642--6651",
BIBSOURCE = "http://www.visionbib.com/bibliography/applicat803vqa1.html#TT233960"}
@inproceedings{bb239045,
AUTHOR = "Li, H. and Wang, P. and Shen, C. H. and van den Hengel, A.",
TITLE = "Visual Question Answering as Reading Comprehension",
BOOKTITLE = CVPR19,
YEAR = "2019",
PAGES = "6312--6321",
BIBSOURCE = "http://www.visionbib.com/bibliography/applicat803vqa1.html#TT233961"}
@inproceedings{bb239046,
AUTHOR = "Yu, L. C. and Chen, X. L. and Gkioxari, G. and Bansal, M. and Berg, T. L. and Batra, D.",
TITLE = "Multi-Target Embodied Question Answering",
BOOKTITLE = CVPR19,
YEAR = "2019",
PAGES = "6302--6311",
BIBSOURCE = "http://www.visionbib.com/bibliography/applicat803vqa1.html#TT233962"}
@inproceedings{bb239047,
AUTHOR = "Yu, Z. and Yu, J. and Cui, Y. H. and Tao, D. C. and Tian, Q.",
TITLE = "Deep Modular Co-Attention Networks for Visual Question Answering",
BOOKTITLE = CVPR19,
YEAR = "2019",
PAGES = "6274--6283",
BIBSOURCE = "http://www.visionbib.com/bibliography/applicat803vqa1.html#TT233963"}
@inproceedings{bb239048,
AUTHOR = "Abbasnejad, E. and Wu, Q. and Shi, Q. F. and van den Hengel, A.",
TITLE = "What's to Know? Uncertainty as a Guide to Asking Goal-Oriented
Questions",
BOOKTITLE = CVPR19,
YEAR = "2019",
PAGES = "4150--4159",
BIBSOURCE = "http://www.visionbib.com/bibliography/applicat803vqa1.html#TT233964"}
@inproceedings{bb239049,
AUTHOR = "Schwenk, D. and Khandelwal, A. and Clark, C. and Marino, K. and Mottaghi, R.",
TITLE = "{A-OKVQA}: A Benchmark for Visual Question Answering Using World
Knowledge",
BOOKTITLE = ECCV22,
YEAR = "2022",
PAGES = "VIII:146--162",
BIBSOURCE = "http://www.visionbib.com/bibliography/applicat803vqa1.html#TT233965"}
@inproceedings{bb239050,
AUTHOR = "Marino, K. and Rastegari, M. and Farhadi, A. and Mottaghi, R.",
TITLE = "{OK-VQA}: A Visual Question Answering Benchmark Requiring External
Knowledge",
BOOKTITLE = CVPR19,
YEAR = "2019",
PAGES = "3190--3199",
BIBSOURCE = "http://www.visionbib.com/bibliography/applicat803vqa1.html#TT233966"}
% The surname Fei-Fei is hyphenated; the source had dropped the hyphen.
@inproceedings{bb239051,
AUTHOR = "Krishna, R. and Bernstein, M. and Fei-Fei, L.",
TITLE = "Information Maximizing Visual Question Generation",
BOOKTITLE = CVPR19,
YEAR = "2019",
PAGES = "2008--2018",
BIBSOURCE = "http://www.visionbib.com/bibliography/applicat803vqa1.html#TT233967"}
@inproceedings{bb239052,
AUTHOR = "Haurilet, M. and Roitberg, A. and Stiefelhagen, R.",
TITLE = "It's Not About the Journey; It's About the Destination: Following Soft
Paths Under Question-Guidance for Visual Reasoning",
BOOKTITLE = CVPR19,
YEAR = "2019",
PAGES = "1930--1939",
BIBSOURCE = "http://www.visionbib.com/bibliography/applicat803vqa1.html#TT233968"}
@inproceedings{bb239053,
AUTHOR = "Qiu, Y. and Satoh, Y. and Suzuki, R. and Kataoka, H.",
TITLE = "Incorporating {3D} Information Into Visual Question Answering",
BOOKTITLE = "3DV19",
YEAR = "2019",
PAGES = "756--765",
BIBSOURCE = "http://www.visionbib.com/bibliography/applicat803vqa1.html#TT233969"}
@inproceedings{bb239054,
AUTHOR = "Liu, F. and Liu, J. and Fang, Z. and Lu, H.",
TITLE = "Language and Visual Relations Encoding for Visual Question Answering",
BOOKTITLE = ICIP19,
YEAR = "2019",
PAGES = "3307--3311",
BIBSOURCE = "http://www.visionbib.com/bibliography/applicat803vqa1.html#TT233970"}
@inproceedings{bb239055,
AUTHOR = "Fang, Z. W. and Liu, J. and Tang, Q. and Li, Y. and Lu, H. Q.",
TITLE = "Answer Distillation for Visual Question Answering",
BOOKTITLE = ACCV18,
YEAR = "2018",
PAGES = "I:72--87",
BIBSOURCE = "http://www.visionbib.com/bibliography/applicat803vqa1.html#TT233971"}
@inproceedings{bb239056,
AUTHOR = "Kuhnle, A. and Xie, H. Y. and Copestake, A.",
TITLE = "How Clever Is the {FiLM} Model, and How Clever Can it Be?",
BOOKTITLE = VL18,
YEAR = "2018",
PAGES = "IV:162--172",
BIBSOURCE = "http://www.visionbib.com/bibliography/applicat803vqa1.html#TT233972"}
@inproceedings{bb239057,
AUTHOR = "Li, W. and Yuan, Z. H. and Fang, X. Z. and Wang, C.",
TITLE = "Knowing Where to Look? Analysis on Attention of Visual Question
Answering System",
BOOKTITLE = VL18,
YEAR = "2018",
PAGES = "IV:145--152",
BIBSOURCE = "http://www.visionbib.com/bibliography/applicat803vqa1.html#TT233973"}
@inproceedings{bb239058,
AUTHOR = "Wagner, M. and Basevi, H. and Shetty, R. and Li, W. B. and Malinowski, M. and Fritz, M. and Leonardis, A.",
TITLE = "Answering Visual What-If Questions: From Actions to Predicted Scene
Descriptions",
BOOKTITLE = VLEASE18,
YEAR = "2018",
PAGES = "I:521--537",
BIBSOURCE = "http://www.visionbib.com/bibliography/applicat803vqa1.html#TT233974"}
@inproceedings{bb239059,
AUTHOR = "Duke, B. and Taylor, G. W.",
TITLE = "Generalized {Hadamard}-Product Fusion Operators for Visual Question
Answering",
BOOKTITLE = CRV18,
YEAR = "2018",
PAGES = "39--46",
BIBSOURCE = "http://www.visionbib.com/bibliography/applicat803vqa1.html#TT233975"}
@inproceedings{bb239060,
AUTHOR = "Das, A. and Datta, S. and Gkioxari, G. and Lee, S. and Parikh, D. and Batra, D.",
TITLE = "Embodied Question Answering",
BOOKTITLE = CVPR18,
YEAR = "2018",
PAGES = "1--10",
BIBSOURCE = "http://www.visionbib.com/bibliography/applicat803vqa1.html#TT233976"}
@inproceedings{bb239061,
AUTHOR = "Misra, I. and Girshick, R. and Fergus, R. and Hebert, M. and Gupta, A. and van der Maaten, L.",
TITLE = "Learning by Asking Questions",
BOOKTITLE = CVPR18,
YEAR = "2018",
PAGES = "11--20",
BIBSOURCE = "http://www.visionbib.com/bibliography/applicat803vqa1.html#TT233977"}
@inproceedings{bb239062,
AUTHOR = "Gurari, D. and Li, Q. and Stangl, A. J. and Guo, A. and Lin, C. and Grauman, K. and Luo, J. and Bigham, J. P.",
TITLE = "{VizWiz} Grand Challenge: Answering Visual Questions from Blind People",
BOOKTITLE = CVPR18,
YEAR = "2018",
PAGES = "3608--3617",
BIBSOURCE = "http://www.visionbib.com/bibliography/applicat803vqa1.html#TT233978"}
@inproceedings{bb239063,
AUTHOR = "Li, J. and Su, H. and Zhu, J. and Wang, S. and Zhang, B.",
TITLE = "Textbook Question Answering Under Instructor Guidance with Memory
Networks",
BOOKTITLE = CVPR18,
YEAR = "2018",
PAGES = "3655--3663",
BIBSOURCE = "http://www.visionbib.com/bibliography/applicat803vqa1.html#TT233979"}
@inproceedings{bb239064,
AUTHOR = "Gordon, D. and Kembhavi, A. and Rastegari, M. and Redmon, J. and Fox, D. and Farhadi, A.",
TITLE = "{IQA}: Visual Question Answering in Interactive Environments",
BOOKTITLE = CVPR18,
YEAR = "2018",
PAGES = "4089--4098",
BIBSOURCE = "http://www.visionbib.com/bibliography/applicat803vqa1.html#TT233980"}
@inproceedings{bb239065,
AUTHOR = "Agrawal, A. and Batra, D. and Parikh, D. and Kembhavi, A.",
TITLE = "Don't Just Assume; Look and Answer: Overcoming Priors for Visual
Question Answering",
BOOKTITLE = CVPR18,
YEAR = "2018",
PAGES = "4971--4980",
BIBSOURCE = "http://www.visionbib.com/bibliography/applicat803vqa1.html#TT233981"}
@inproceedings{bb239066,
AUTHOR = "Sha, F. and Chao, W. and Hu, H.",
TITLE = "Learning Answer Embeddings for Visual Question Answering",
BOOKTITLE = CVPR18,
YEAR = "2018",
PAGES = "5428--5436",
BIBSOURCE = "http://www.visionbib.com/bibliography/applicat803vqa1.html#TT233982"}
@inproceedings{bb239067,
AUTHOR = "Kafle, K. and Price, B. and Cohen, S. and Kanan, C.",
TITLE = "{DVQA}: Understanding Data Visualizations via Question Answering",
BOOKTITLE = CVPR18,
YEAR = "2018",
PAGES = "5648--5656",
BIBSOURCE = "http://www.visionbib.com/bibliography/applicat803vqa1.html#TT233983"}
@inproceedings{bb239068,
AUTHOR = "Sha, F. and Hu, H. and Chao, W.",
TITLE = "Cross-Dataset Adaptation for Visual Question Answering",
BOOKTITLE = CVPR18,
YEAR = "2018",
PAGES = "5716--5725",
BIBSOURCE = "http://www.visionbib.com/bibliography/applicat803vqa1.html#TT233984"}
@inproceedings{bb239069,
AUTHOR = "Anderson, P. and He, X. and Buehler, C. and Teney, D. and Johnson, M. and Gould, S. and Zhang, L.",
TITLE = "Bottom-Up and Top-Down Attention for Image Captioning and Visual
Question Answering",
BOOKTITLE = CVPR18,
YEAR = "2018",
PAGES = "6077--6086",
BIBSOURCE = "http://www.visionbib.com/bibliography/applicat803vqa1.html#TT233985"}
@inproceedings{bb239070,
AUTHOR = "Nguyen, D. and Okatani, T.",
TITLE = "Improved Fusion of Visual and Language Representations by Dense
Symmetric Co-attention for Visual Question Answering",
BOOKTITLE = CVPR18,
YEAR = "2018",
PAGES = "6087--6096",
BIBSOURCE = "http://www.visionbib.com/bibliography/applicat803vqa1.html#TT233986"}
@inproceedings{bb239071,
AUTHOR = "Patro, B. and Namboodiri, V. P.",
TITLE = "Differential Attention for Visual Question Answering",
BOOKTITLE = CVPR18,
YEAR = "2018",
PAGES = "7680--7688",
BIBSOURCE = "http://www.visionbib.com/bibliography/applicat803vqa1.html#TT233987"}
@inproceedings{bb239072,
AUTHOR = "Su, Z. and Zhu, C. and Dong, Y. P. and Cai, D. Q. and Chen, Y. R. and Li, J. G.",
TITLE = "Learning Visual Knowledge Memory Networks for Visual Question
Answering",
BOOKTITLE = CVPR18,
YEAR = "2018",
PAGES = "7736--7745",
BIBSOURCE = "http://www.visionbib.com/bibliography/applicat803vqa1.html#TT233988"}
% NOTE(review): the end page 213509 looks malformed (longer than the start page
% 2135); value kept from the source -- verify against the proceedings.
@inproceedings{bb239073,
AUTHOR = "Das, A. and Datta, S. and Gkioxari, G. and Lee, S. and Parikh, D. and Batra, D.",
TITLE = "Embodied Question Answering",
BOOKTITLE = DeepLearnRV18,
YEAR = "2018",
PAGES = "2135--213509",
BIBSOURCE = "http://www.visionbib.com/bibliography/applicat803vqa1.html#TT233989"}
@inproceedings{bb239074,
AUTHOR = "Cheng, W. and Huang, Y. and Wang, L.",
TITLE = "Towards Unconstrained Pointing Problem of Visual Question Answering:
A Retrieval-based Method",
BOOKTITLE = ICPR18,
YEAR = "2018",
PAGES = "3303--3308",
BIBSOURCE = "http://www.visionbib.com/bibliography/applicat803vqa1.html#TT233990"}
@inproceedings{bb239075,
AUTHOR = "Zhou, B. and Sun, Y. Y. and Bau, D. and Torralba, A. B.",
TITLE = "Interpretable Basis Decomposition for Visual Explanation",
BOOKTITLE = ECCV18,
YEAR = "2018",
PAGES = "VIII:122--138",
BIBSOURCE = "http://www.visionbib.com/bibliography/applicat803vqa1.html#TT233991"}
@inproceedings{bb239076,
AUTHOR = "Shi, Y. and Furlanello, T. and Zha, S. and Anandkumar, A.",
TITLE = "Question Type Guided Attention in Visual Question Answering",
BOOKTITLE = ECCV18,
YEAR = "2018",
PAGES = "II:158--175",
BIBSOURCE = "http://www.visionbib.com/bibliography/applicat803vqa1.html#TT233992"}
@inproceedings{bb239077,
AUTHOR = "Narasimhan, M. and Schwing, A. G.",
TITLE = "Straight to the Facts: Learning Knowledge Base Retrieval for Factual
Visual Question Answering",
BOOKTITLE = ECCV18,
YEAR = "2018",
PAGES = "VIII:460--477",
BIBSOURCE = "http://www.visionbib.com/bibliography/applicat803vqa1.html#TT233993"}
@inproceedings{bb239078,
AUTHOR = "Malinowski, M. and Doersch, C. and Santoro, A. and Battaglia, P.",
TITLE = "Learning Visual Question Answering by Bootstrapping Hard Attention",
BOOKTITLE = ECCV18,
YEAR = "2018",
PAGES = "VI:3--20",
BIBSOURCE = "http://www.visionbib.com/bibliography/applicat803vqa1.html#TT233994"}
@inproceedings{bb239079,
AUTHOR = "Li, Q. and Tao, Q. Y. and Joty, S. and Cai, J. F. and Luo, J. B.",
TITLE = "{VQA-E}: Explaining, Elaborating, and Enhancing Your Answers for Visual
Questions",
BOOKTITLE = ECCV18,
YEAR = "2018",
PAGES = "VII:570--586",
BIBSOURCE = "http://www.visionbib.com/bibliography/applicat803vqa1.html#TT233995"}
@inproceedings{bb239080,
AUTHOR = "Yu, D. and Gao, X. and Xiong, H.",
TITLE = "Structured Semantic Representation for Visual Question Answering",
BOOKTITLE = ICIP18,
YEAR = "2018",
PAGES = "2286--2290",
BIBSOURCE = "http://www.visionbib.com/bibliography/applicat803vqa1.html#TT233996"}
@inproceedings{bb239081,
AUTHOR = "Huang, L. and Kulkarni, K. and Jha, A. and Lohit, S. and Jayasuriya, S. and Turaga, P. K.",
TITLE = "{CS-VQA}: Visual Question Answering with Compressively Sensed Images",
BOOKTITLE = ICIP18,
YEAR = "2018",
PAGES = "1283--1287",
BIBSOURCE = "http://www.visionbib.com/bibliography/applicat803vqa1.html#TT233997"}
@inproceedings{bb239082,
AUTHOR = "Desta, M. T. and Chen, L. and Kornuta, T.",
TITLE = "Object-Based Reasoning in {VQA}",
BOOKTITLE = WACV18,
YEAR = "2018",
PAGES = "1814--1823",
BIBSOURCE = "http://www.visionbib.com/bibliography/applicat803vqa1.html#TT233998"}
@inproceedings{bb239083,
AUTHOR = "Zhao, H. and Fan, Q. and Gutfreund, D. and Fu, Y.",
TITLE = "Semantically Guided Visual Question Answering",
BOOKTITLE = WACV18,
YEAR = "2018",
PAGES = "1852--1860",
BIBSOURCE = "http://www.visionbib.com/bibliography/applicat803vqa1.html#TT233999"}
@inproceedings{bb239084,
AUTHOR = "Wang, Z. and Liu, X. and Wang, L. and Qiao, Y. and Xie, X. and Fowlkes, C. C.",
TITLE = "Structured Triplet Learning with {POS}-Tag Guided Attention for Visual
Question Answering",
BOOKTITLE = WACV18,
YEAR = "2018",
PAGES = "1888--1896",
BIBSOURCE = "http://www.visionbib.com/bibliography/applicat803vqa1.html#TT234000"}
@inproceedings{bb239085,
AUTHOR = "Chowdhury, I. and Nguyen, K. and Fookes, C. and Sridharan, S.",
TITLE = "A cascaded long short-term memory ({LSTM}) driven generic visual
question answering ({VQA})",
BOOKTITLE = ICIP17,
YEAR = "2017",
PAGES = "1842--1846",
BIBSOURCE = "http://www.visionbib.com/bibliography/applicat803vqa1.html#TT234001"}
@inproceedings{bb239086,
AUTHOR = "Jain, U. and Zhang, Z. Y. and Schwing, A.",
TITLE = "Creativity: Generating Diverse Questions Using Variational
Autoencoders",
BOOKTITLE = CVPR17,
YEAR = "2017",
PAGES = "5415--5424",
BIBSOURCE = "http://www.visionbib.com/bibliography/applicat803vqa1.html#TT234002"}
% The surname Fei-Fei is hyphenated; the source had dropped the hyphen.
@inproceedings{bb239087,
AUTHOR = "Zhu, Y. and Lim, J. J. and Fei-Fei, L.",
TITLE = "Knowledge Acquisition for Visual Question Answering via Iterative
Querying",
BOOKTITLE = CVPR17,
YEAR = "2017",
PAGES = "6146--6155",
BIBSOURCE = "http://www.visionbib.com/bibliography/applicat803vqa1.html#TT234003"}
@inproceedings{bb239088,
AUTHOR = "Lin, Y. T. and Pang, Z. Y. and Li, Y. and Wang, D. H.",
TITLE = "Simple and effective visual question answering in a single modality",
BOOKTITLE = ICIP16,
YEAR = "2016",
PAGES = "2276--2280",
BIBSOURCE = "http://www.visionbib.com/bibliography/applicat803vqa1.html#TT234004"}
@inproceedings{bb239089,
AUTHOR = "Ganju, S. and Russakovsky, O. and Gupta, A.",
TITLE = "What's in a Question:
Using Visual Questions as a Form of Supervision",
BOOKTITLE = CVPR17,
YEAR = "2017",
PAGES = "6422--6431",
BIBSOURCE = "http://www.visionbib.com/bibliography/applicat803vqa1.html#TT234005"}
@inproceedings{bb239090,
AUTHOR = "Xu, H. J. and Saenko, K.",
TITLE = "Ask, Attend and Answer:
Exploring Question-Guided Spatial Attention for Visual Question Answering",
BOOKTITLE = ECCV16,
YEAR = "2016",
PAGES = "VII:451--466",
BIBSOURCE = "http://www.visionbib.com/bibliography/applicat803vqa1.html#TT234006"}
@inproceedings{bb239091,
AUTHOR = "Jabri, A. and Joulin, A. and van der Maaten, L.",
TITLE = "Revisiting Visual Question Answering Baselines",
BOOKTITLE = ECCV16,
YEAR = "2016",
PAGES = "VIII:727--739",
BIBSOURCE = "http://www.visionbib.com/bibliography/applicat803vqa1.html#TT234007"}
@inproceedings{bb239092,
AUTHOR = "Yang, Z. C. and He, X. D. and Gao, J. F. and Deng, L. and Smola, A.",
TITLE = "Stacked Attention Networks for Image Question Answering",
BOOKTITLE = CVPR16,
YEAR = "2016",
PAGES = "21--29",
BIBSOURCE = "http://www.visionbib.com/bibliography/applicat803vqa1.html#TT234008"}
@inproceedings{bb239093,
AUTHOR = "Sadeghi, F. and Divvala, S. K. and Farhadi, A.",
TITLE = "{VisKE}: Visual knowledge extraction and question answering by visual
verification of relation phrases",
BOOKTITLE = CVPR15,
YEAR = "2015",
PAGES = "1456--1464",
BIBSOURCE = "http://www.visionbib.com/bibliography/applicat803vqa1.html#TT234009"}
@inproceedings{bb239094,
AUTHOR = "Liu, Y. and Liu, J. and Wang, D. and Cheng, J.",
TITLE = "A robust multivariate reranking algorithm for Question Answering
enrichment",
BOOKTITLE = ICIP12,
YEAR = "2012",
PAGES = "1917--1920",
BIBSOURCE = "http://www.visionbib.com/bibliography/applicat803vqa1.html#TT234010"}
@inproceedings{bb239095,
AUTHOR = "Varekamp, C. and van de Walle, P. and de Putter, M.",
TITLE = "Question interface for {3D} picture creation on an autostereoscopic
digital picture frame",
BOOKTITLE = "3DTV09",
YEAR = "2009",
PAGES = "1--4",
BIBSOURCE = "http://www.visionbib.com/bibliography/applicat803vqa1.html#TT234011"}
@article{bb239096,
AUTHOR = "Osman, A. and Samek, W.",
TITLE = "{DRAU}: Dual Recurrent Attention Units for Visual Question Answering",
JOURNAL = CVIU,
VOLUME = "185",
YEAR = "2019",
PAGES = "24--30",
BIBSOURCE = "http://www.visionbib.com/bibliography/applicat803mmovqa5.html#TT234012"}
@article{bb239097,
AUTHOR = "Li, W. and Sun, J. H. and Liu, G. and Zhao, L. L. and Fang, X. Z.",
TITLE = "Visual question answering with attention transfer and a cross-modal
gating mechanism",
JOURNAL = PRL,
VOLUME = "133",
YEAR = "2020",
PAGES = "334--340",
BIBSOURCE = "http://www.visionbib.com/bibliography/applicat803mmovqa5.html#TT234013"}
% PAGES holds a single number with no range; presumably an article number -- left as is.
@article{bb239098,
AUTHOR = "Yu, J. and Zhu, Z. H. and Wang, Y. J. and Zhang, W. F. and Hu, Y. and Tan, J. L.",
TITLE = "Cross-modal knowledge reasoning for knowledge-based visual question
answering",
JOURNAL = PR,
VOLUME = "108",
YEAR = "2020",
PAGES = "107563",
BIBSOURCE = "http://www.visionbib.com/bibliography/applicat803mmovqa5.html#TT234014"}
@inproceedings{bb239099,
AUTHOR = "Yang, Z. Q. and Qin, Z. C. and Yu, J. and Wan, T.",
TITLE = "Prior Visual Relationship Reasoning For Visual Question Answering",
BOOKTITLE = ICIP20,
YEAR = "2020",
PAGES = "1411--1415",
BIBSOURCE = "http://www.visionbib.com/bibliography/applicat803mmovqa5.html#TT234015"}
Last update: Jan 23, 2026 at 20:54:10