@inproceedings{bb239700,
AUTHOR = "Wang, H. B. and Ge, W. F.",
TITLE = "{Q\&A} Prompts: Discovering Rich Visual Clues through Mining
Question-answer Prompts for {VQA} requiring Diverse World Knowledge",
BOOKTITLE = ECCV24,
YEAR = "2024",
PAGES = "XLII: 274--292",
BIBSOURCE = "http://www.visionbib.com/bibliography/applicat803vqa1.html#TT234616"}
@inproceedings{bb239701,
AUTHOR = "Liu, H. and Ma, X. and Zhong, C. and Zhang, Y. and Lin, W. Y.",
TITLE = "Timecraft: Navigate Weakly-supervised Temporal Grounded Video Question
Answering via Bi-directional Reasoning",
BOOKTITLE = ECCV24,
YEAR = "2024",
PAGES = "V: 92--107",
BIBSOURCE = "http://www.visionbib.com/bibliography/applicat803vqa1.html#TT234617"}
@inproceedings{bb239702,
AUTHOR = "Zhang, Y. F. and Jiang, M. and Zhao, Q.",
TITLE = "Grace: Graph-based Contextual Debiasing for Fair Visual Question
Answering",
BOOKTITLE = ECCV24,
YEAR = "2024",
PAGES = "XVII: 176--194",
BIBSOURCE = "http://www.visionbib.com/bibliography/applicat803vqa1.html#TT234618"}
@inproceedings{bb239703,
AUTHOR = "Liu, X. L. and Dong, Z. K. and Zhang, P.",
TITLE = "Tackling Data Bias in {MUSIC-AVQA}: Crafting a Balanced Dataset for
Unbiased Question-Answering",
BOOKTITLE = WACV24,
YEAR = "2024",
PAGES = "4466--4475",
BIBSOURCE = "http://www.visionbib.com/bibliography/applicat803vqa1.html#TT234619"}
@inproceedings{bb239704,
AUTHOR = "Shi, X. X. and Lee, S.",
TITLE = "Benchmarking Out-of-Distribution Detection in Visual Question
Answering",
BOOKTITLE = WACV24,
YEAR = "2024",
PAGES = "5473--5483",
BIBSOURCE = "http://www.visionbib.com/bibliography/applicat803vqa1.html#TT234620"}
@inproceedings{bb239705,
AUTHOR = "Venkataraman, S. R. and Rao, R. S. and Balasubramanian, S. and Sarma, R. R. and Vorugunti, C. S.",
TITLE = "Can you even tell left from right? {Presenting} a new challenge for {VQA}",
BOOKTITLE = WACV24,
YEAR = "2024",
PAGES = "4486--4495",
BIBSOURCE = "http://www.visionbib.com/bibliography/applicat803vqa1.html#TT234621"}
@inproceedings{bb239706,
AUTHOR = "Sahu, P. P. and Raut, A. and Samant, J. S. and Gorijala, M. and Lakshminarayanan, V. and Bhaskar, P.",
TITLE = "{POP-VQA}: Privacy preserving, On-device, Personalized Visual Question
Answering",
BOOKTITLE = WACV24,
YEAR = "2024",
PAGES = "8455--8464",
BIBSOURCE = "http://www.visionbib.com/bibliography/applicat803vqa1.html#TT234622"}
@inproceedings{bb239707,
AUTHOR = "Li, J. P. and Wei, P. and Han, W. J. and Fan, L. F.",
TITLE = "{IntentQA}: Context-aware Video Intent Reasoning",
BOOKTITLE = ICCV23,
YEAR = "2023",
PAGES = "11929--11940",
BIBSOURCE = "http://www.visionbib.com/bibliography/applicat803vqa1.html#TT234623"}
@inproceedings{bb239708,
AUTHOR = "Hu, Y. S. and Hua, H. and Yang, Z. Y. and Shi, W. J. and Smith, N. A. and Luo, J. B.",
TITLE = "{PromptCap}: Prompt-Guided Image Captioning for {VQA} with {GPT-3}",
BOOKTITLE = ICCV23,
YEAR = "2023",
PAGES = "2951--2963",
BIBSOURCE = "http://www.visionbib.com/bibliography/applicat803vqa1.html#TT234624"}
@inproceedings{bb239709,
AUTHOR = "Naik, N. and Potts, C. and Kreiss, E.",
TITLE = "{Context-VQA}: Towards Context-Aware and Purposeful Visual Question
Answering",
BOOKTITLE = CLVL23,
YEAR = "2023",
PAGES = "2813--2817",
BIBSOURCE = "http://www.visionbib.com/bibliography/applicat803vqa1.html#TT234625"}
@inproceedings{bb239710,
AUTHOR = "Hu, Y. S. and Liu, B. and Kasai, J. and Wang, Y. Z. and Ostendorf, M. and Krishna, R. and Smith, N. A.",
TITLE = "{TIFA}: Accurate and Interpretable Text-to-Image Faithfulness
Evaluation with Question Answering",
BOOKTITLE = ICCV23,
YEAR = "2023",
PAGES = "20349--20360",
BIBSOURCE = "http://www.visionbib.com/bibliography/applicat803vqa1.html#TT234626"}
@inproceedings{bb239711,
AUTHOR = "Zhang, Y. W. and Ho, C. H. and Vasconcelos, N. M.",
TITLE = "Toward Unsupervised Realistic Visual Question Answering",
BOOKTITLE = ICCV23,
YEAR = "2023",
PAGES = "15567--15578",
BIBSOURCE = "http://www.visionbib.com/bibliography/applicat803vqa1.html#TT234627"}
@inproceedings{bb239712,
AUTHOR = "Liang, K. and Albanie, S.",
TITLE = "Simple Baselines for Interactive Video Retrieval with Questions and
Answers",
BOOKTITLE = ICCV23,
YEAR = "2023",
PAGES = "11057--11067",
BIBSOURCE = "http://www.visionbib.com/bibliography/applicat803vqa1.html#TT234628"}
@inproceedings{bb239713,
AUTHOR = "Mensink, T. and Uijlings, J. and Castrejon, L. and Goel, A. and Cadar, F. and Zhou, H. and Sha, F. and Araujo, A. and Ferrari, V.",
TITLE = "Encyclopedic {VQA}: Visual questions about detailed properties of
fine-grained categories",
BOOKTITLE = ICCV23,
YEAR = "2023",
PAGES = "3090--3101",
BIBSOURCE = "http://www.visionbib.com/bibliography/applicat803vqa1.html#TT234629"}
@inproceedings{bb239714,
AUTHOR = "Bruni, P. and Falcon, A. and Radeva, P.",
TITLE = "Time-aware Circulant Matrices for Question-based Temporal Localization",
BOOKTITLE = CIAP23,
YEAR = "2023",
PAGES = "II:182--195",
BIBSOURCE = "http://www.visionbib.com/bibliography/applicat803vqa1.html#TT234630"}
@inproceedings{bb239715,
AUTHOR = "Ferreira, B. C. L. and Oliveira, H. G. and Silva, C.",
TITLE = "Leveraging Question Answering for Domain-Agnostic Information
Extraction",
BOOKTITLE = CIARP23,
YEAR = "2023",
PAGES = "I:244--256",
BIBSOURCE = "http://www.visionbib.com/bibliography/applicat803vqa1.html#TT234631"}
@inproceedings{bb239716,
AUTHOR = "Wu, Z. H. and Shu, X. Y. and Yan, S. Y. and Lu, Z. Y.",
TITLE = "{FGCVQA}: Fine-Grained Cross-Attention for Medical {VQA}",
BOOKTITLE = ICIP23,
YEAR = "2023",
PAGES = "975--979",
BIBSOURCE = "http://www.visionbib.com/bibliography/applicat803vqa1.html#TT234632"}
@inproceedings{bb239717,
AUTHOR = "Zhu, H. and Togo, R. and Ogawa, T. and Haseyama, M.",
TITLE = "Interpretable Visual Question Answering Referring to Outside
Knowledge",
BOOKTITLE = ICIP23,
YEAR = "2023",
PAGES = "2140--2144",
BIBSOURCE = "http://www.visionbib.com/bibliography/applicat803vqa1.html#TT234633"}
@inproceedings{bb239718,
AUTHOR = "Parelli, M. and Mallis, D. and Diomataris, M. and Pitsikalis, V.",
TITLE = "Interpretable Visual Question Answering Via Reasoning Supervision",
BOOKTITLE = ICIP23,
YEAR = "2023",
PAGES = "2525--2529",
BIBSOURCE = "http://www.visionbib.com/bibliography/applicat803vqa1.html#TT234634"}
@inproceedings{bb239719,
AUTHOR = "Hegde, S. and Jahagirdar, S. and Gangisetty, S.",
TITLE = "Making the {V} in {Text-VQA} Matter",
BOOKTITLE = ODRUM23,
YEAR = "2023",
PAGES = "5580--5588",
BIBSOURCE = "http://www.visionbib.com/bibliography/applicat803vqa1.html#TT234635"}
@inproceedings{bb239720,
AUTHOR = "Suo, W. and Sun, M. Y. and Liu, W. S. and Gao, Y. Q. and Wang, P. and Zhang, Y. N. and Wu, Q.",
TITLE = "{S3C}: Semi-Supervised {VQA} Natural Language Explanation via
Self-Critical Learning",
BOOKTITLE = CVPR23,
YEAR = "2023",
PAGES = "2646--2656",
BIBSOURCE = "http://www.visionbib.com/bibliography/applicat803vqa1.html#TT234636"}
@inproceedings{bb239721,
AUTHOR = "Alampalle, C. and Hegde, S. and Jahagirdar, S. and Gangisetty, S.",
TITLE = "Weakly Supervised Visual Question Answer Generation",
BOOKTITLE = ODRUM23,
YEAR = "2023",
PAGES = "5589--5597",
BIBSOURCE = "http://www.visionbib.com/bibliography/applicat803vqa1.html#TT234637"}
@inproceedings{bb239722,
AUTHOR = "Jiang, J. J. and Zheng, N. N.",
TITLE = "{MixPHM}: Redundancy-Aware Parameter-Efficient Tuning for Low-Resource
Visual Question Answering",
BOOKTITLE = CVPR23,
YEAR = "2023",
PAGES = "24203--24213",
BIBSOURCE = "http://www.visionbib.com/bibliography/applicat803vqa1.html#TT234638"}
@inproceedings{bb239723,
AUTHOR = "Wang, Y. and Pfeiffer, J. and Carion, N. and Le Cun, Y. L. and Kamath, A.",
TITLE = "Adapting Grounded Visual Question Answering Models to Low Resource
Languages",
BOOKTITLE = MULA23,
YEAR = "2023",
PAGES = "2596--2605",
BIBSOURCE = "http://www.visionbib.com/bibliography/applicat803vqa1.html#TT234639"}
@inproceedings{bb239724,
AUTHOR = "Wang, M. and Mahjoubfar, A. and Joshi, A.",
TITLE = "{FashionVQA}: A Domain-Specific Visual Question Answering System",
BOOKTITLE = CVFAD23,
YEAR = "2023",
PAGES = "3514--3519",
BIBSOURCE = "http://www.visionbib.com/bibliography/applicat803vqa1.html#TT234640"}
@inproceedings{bb239725,
AUTHOR = "Tascon Morales, S. and Marquez Neila, P. and Sznitman, R.",
TITLE = "Logical Implications for Visual Question Answering Consistency",
BOOKTITLE = CVPR23,
YEAR = "2023",
PAGES = "6725--6735",
BIBSOURCE = "http://www.visionbib.com/bibliography/applicat803vqa1.html#TT234641"}
@inproceedings{bb239726,
AUTHOR = "Chen, S. and Zhao, Q.",
TITLE = "Divide and Conquer: Answering Questions with Object Factorization and
Compositional Reasoning",
BOOKTITLE = CVPR23,
YEAR = "2023",
PAGES = "6736--6745",
BIBSOURCE = "http://www.visionbib.com/bibliography/applicat803vqa1.html#TT234642"}
@inproceedings{bb239727,
AUTHOR = "Basu, A. and Addepalli, S. and Babu, R. V.",
TITLE = "{RMLVQA}: A Margin Loss Approach For Visual Question Answering with
Language Biases",
BOOKTITLE = CVPR23,
YEAR = "2023",
PAGES = "11671--11680",
BIBSOURCE = "http://www.visionbib.com/bibliography/applicat803vqa1.html#TT234643"}
@inproceedings{bb239728,
AUTHOR = "Vivoli, E. and Biten, A. F. and Mafla, A. and Karatzas, D. and Gomez, L.",
TITLE = "{MUST-VQA}: Multilingual Scene-Text {VQA}",
BOOKTITLE = TextEvery22,
YEAR = "2022",
PAGES = "345--358",
BIBSOURCE = "http://www.visionbib.com/bibliography/applicat803vqa1.html#TT234644"}
@inproceedings{bb239729,
AUTHOR = "Bongini, P. and Becattini, F. and del Bimbo, A.",
TITLE = "Is {GPT-3} All You Need for Visual Question Answering in Cultural
Heritage?",
BOOKTITLE = VisArt22,
YEAR = "2022",
PAGES = "268--281",
BIBSOURCE = "http://www.visionbib.com/bibliography/applicat803vqa1.html#TT234645"}
@inproceedings{bb239730,
AUTHOR = "Jha, A. and Patro, B. and Van Gool, L. J. and Tuytelaars, T.",
TITLE = "Barlow constrained optimization for Visual Question Answering",
BOOKTITLE = WACV23,
YEAR = "2023",
PAGES = "1084--1093",
BIBSOURCE = "http://www.visionbib.com/bibliography/applicat803vqa1.html#TT234646"}
@inproceedings{bb239731,
AUTHOR = "Ravi, S. and Chinchure, A. and Sigal, L. and Liao, R. J. and Shwartz, V.",
TITLE = "{VLC-BERT}: Visual Question Answering with Contextualized Commonsense
Knowledge",
BOOKTITLE = WACV23,
YEAR = "2023",
PAGES = "1155--1165",
BIBSOURCE = "http://www.visionbib.com/bibliography/applicat803vqa1.html#TT234647"}
@inproceedings{bb239732,
AUTHOR = "Etesam, Y. and Kochiev, L. and Chang, A. X.",
TITLE = "{3DVQA}: Visual Question Answering for {3D} Environments",
BOOKTITLE = CRV22,
YEAR = "2022",
PAGES = "233--240",
BIBSOURCE = "http://www.visionbib.com/bibliography/applicat803vqa1.html#TT234648"}
@inproceedings{bb239733,
AUTHOR = "Ramamurthy, P. and Aakur, S. N.",
TITLE = "{ISD-QA}: Iterative Distillation of Commonsense Knowledge from General
Language Models for Unsupervised Question Answering",
BOOKTITLE = "ICPR22",
YEAR = "2022",
PAGES = "1229--1235",
BIBSOURCE = "http://www.visionbib.com/bibliography/applicat803vqa1.html#TT234649"}
@inproceedings{bb239734,
AUTHOR = "Liu, L. and Su, X. D. and Guo, H. and Zhu, D.",
TITLE = "A Transformer-based Medical Visual Question Answering Model",
BOOKTITLE = "ICPR22",
YEAR = "2022",
PAGES = "1712--1718",
BIBSOURCE = "http://www.visionbib.com/bibliography/applicat803vqa1.html#TT234650"}
@inproceedings{bb239735,
AUTHOR = "Wu, X. Y. and Lu, J. F. and Li, Z. F. and Xiong, F. C.",
TITLE = "Ques-to-Visual Guided Visual Question Answering",
BOOKTITLE = ICIP22,
YEAR = "2022",
PAGES = "4193--4197",
BIBSOURCE = "http://www.visionbib.com/bibliography/applicat803vqa1.html#TT234651"}
@inproceedings{bb239736,
AUTHOR = "Sarkar, A. and Rahnemoonfar, M.",
TITLE = "{Grad-Cam} Aware Supervised Attention for Visual Question Answering for
Post-Disaster Damage Assessment",
BOOKTITLE = ICIP22,
YEAR = "2022",
PAGES = "3783--3787",
BIBSOURCE = "http://www.visionbib.com/bibliography/applicat803vqa1.html#TT234652"}
@inproceedings{bb239737,
AUTHOR = "Whitehead, S. and Petryk, S. and Shakib, V. and Gonzalez, J. and Darrell, T. J. and Rohrbach, A. and Rohrbach, M.",
TITLE = "Reliable Visual Question Answering: Abstain Rather Than Answer
Incorrectly",
BOOKTITLE = ECCV22,
YEAR = "2022",
PAGES = "XXXVI:148--166",
BIBSOURCE = "http://www.visionbib.com/bibliography/applicat803vqa1.html#TT234653"}
@inproceedings{bb239738,
AUTHOR = "Chen, L. and Zheng, Y. H. and Xiao, J.",
TITLE = "Rethinking Data Augmentation for Robust Visual Question Answering",
BOOKTITLE = ECCV22,
YEAR = "2022",
PAGES = "XXXVI:95--112",
BIBSOURCE = "http://www.visionbib.com/bibliography/applicat803vqa1.html#TT234654"}
@inproceedings{bb239739,
AUTHOR = "Zhang, H. T. and Wu, W.",
TITLE = "Context Relation Fusion Model for Visual Question Answering",
BOOKTITLE = ICIP22,
YEAR = "2022",
PAGES = "2112--2116",
BIBSOURCE = "http://www.visionbib.com/bibliography/applicat803vqa1.html#TT234655"}
@inproceedings{bb239740,
AUTHOR = "Biten, A. F. and Litman, R. and Xie, Y. S. and Appalaraju, S. and Manmatha, R.",
TITLE = "{LaTr}: Layout-Aware Transformer for Scene-Text {VQA}",
BOOKTITLE = CVPR22,
YEAR = "2022",
PAGES = "16527--16537",
BIBSOURCE = "http://www.visionbib.com/bibliography/applicat803vqa1.html#TT234656"}
@inproceedings{bb239741,
AUTHOR = "Lu, J. Y. and Ye, X. and Ren, Y. and Yang, Y. Z.",
TITLE = "Good, Better, Best: Textual Distractors Generation for
Multiple-Choice Visual Question Answering via Reinforcement Learning",
BOOKTITLE = ODRUM22,
YEAR = "2022",
PAGES = "4917--4926",
BIBSOURCE = "http://www.visionbib.com/bibliography/applicat803vqa1.html#TT234657"}
@inproceedings{bb239742,
AUTHOR = "Ding, Y. H. and Huang, Z. and Wang, R. and Zhang, Y. H. and Chen, X. and Ma, Y. Z. and Chung, H. and Han, S. C.",
TITLE = "{V-Doc}: Visual questions answers with Documents",
BOOKTITLE = CVPR22,
YEAR = "2022",
PAGES = "21460--21466",
BIBSOURCE = "http://www.visionbib.com/bibliography/applicat803vqa1.html#TT234658"}
@inproceedings{bb239743,
AUTHOR = "Azuma, D. and Miyanishi, T. and Kurita, S. H. and Kawanabe, M.",
TITLE = "{ScanQA}: {3D} Question Answering for Spatial Scene Understanding",
BOOKTITLE = CVPR22,
YEAR = "2022",
PAGES = "19107--19117",
BIBSOURCE = "http://www.visionbib.com/bibliography/applicat803vqa1.html#TT234659"}
@inproceedings{bb239744,
AUTHOR = "Li, G. Y. and Wei, Y. and Tian, Y. P. and Xu, C. L. and Wen, J. R. and Hu, D.",
TITLE = "Learning to Answer Questions in Dynamic Audio-Visual Scenarios",
BOOKTITLE = CVPR22,
YEAR = "2022",
PAGES = "19086--19096",
BIBSOURCE = "http://www.visionbib.com/bibliography/applicat803vqa1.html#TT234660"}
@inproceedings{bb239745,
AUTHOR = "Chen, C. Y. and Anjum, S. and Gurari, D.",
TITLE = "Grounding Answers for Visual Questions Asked by Visually Impaired
People",
BOOKTITLE = CVPR22,
YEAR = "2022",
PAGES = "19076--19085",
BIBSOURCE = "http://www.visionbib.com/bibliography/applicat803vqa1.html#TT234661"}
@inproceedings{bb239746,
AUTHOR = "Li, C. H. and Li, Z. and Jing, C. C. and Wu, Y. W. and Zhai, M. L. and Jia, Y. D.",
TITLE = "Compositional Substitutivity of Visual Reasoning for Visual Question
Answering",
BOOKTITLE = ECCV24,
YEAR = "2024",
PAGES = "XLVIII: 143--160",
BIBSOURCE = "http://www.visionbib.com/bibliography/applicat803vqa1.html#TT234662"}
@inproceedings{bb239747,
AUTHOR = "Jing, C. C. and Jia, Y. D. and Wu, Y. W. and Liu, X. Y. and Wu, Q.",
TITLE = "Maintaining Reasoning Consistency in Compositional Visual Question
Answering",
BOOKTITLE = CVPR22,
YEAR = "2022",
PAGES = "5089--5098",
BIBSOURCE = "http://www.visionbib.com/bibliography/applicat803vqa1.html#TT234663"}
@inproceedings{bb239748,
AUTHOR = "Cascante Bonilla, P. and Wu, H. and Wang, L. and Feris, R. S. and Ordonez, V.",
TITLE = "Sim {VQA}: Exploring Simulated Environments for Visual Question
Answering",
BOOKTITLE = CVPR22,
YEAR = "2022",
PAGES = "5046--5056",
BIBSOURCE = "http://www.visionbib.com/bibliography/applicat803vqa1.html#TT234664"}
@inproceedings{bb239749,
AUTHOR = "Gupta, V. and Li, Z. W. and Kortylewski, A. and Zhang, C. Y. and Li, Y. W. and Yuille, A. L.",
TITLE = "{SwapMix}: Diagnosing and Regularizing the Over-Reliance on Visual
Context in Visual Question Answering",
BOOKTITLE = CVPR22,
YEAR = "2022",
PAGES = "5068--5078",
BIBSOURCE = "http://www.visionbib.com/bibliography/applicat803vqa1.html#TT234665"}
@inproceedings{bb239750,
AUTHOR = "Burghouts, G. J. and Huizinga, W.",
TITLE = "Coarse-to-Fine Visual Question Answering by Iterative, Conditional
Refinement",
BOOKTITLE = CIAP22,
YEAR = "2022",
PAGES = "II:418--428",
BIBSOURCE = "http://www.visionbib.com/bibliography/applicat803vqa1.html#TT234666"}
@inproceedings{bb239751,
AUTHOR = "Kant, Y. and Moudgil, A. and Batra, D. and Parikh, D. and Agrawal, H.",
TITLE = "Contrast and Classify: Training Robust {VQA} Models",
BOOKTITLE = ICCV21,
YEAR = "2021",
PAGES = "1584--1593",
BIBSOURCE = "http://www.visionbib.com/bibliography/applicat803vqa1.html#TT234667"}
@inproceedings{bb239752,
AUTHOR = "Han, X. Z. and Wang, S. H. and Su, C. and Huang, Q. M. and Tian, Q.",
TITLE = "Greedy Gradient Ensemble for Robust Visual Question Answering",
BOOKTITLE = ICCV21,
YEAR = "2021",
PAGES = "1564--1573",
BIBSOURCE = "http://www.visionbib.com/bibliography/applicat803vqa1.html#TT234668"}
@inproceedings{bb239753,
AUTHOR = "Zhou, Y. Y. and Ren, T. H. and Zhu, C. Y. and Sun, X. S. and Liu, J. Z. and Ding, X. H. and Xu, M. L. and Ji, R. R.",
TITLE = "{TRAR}: Routing the Attention Spans in Transformer for Visual Question
Answering",
BOOKTITLE = ICCV21,
YEAR = "2021",
PAGES = "2054--2064",
BIBSOURCE = "http://www.visionbib.com/bibliography/applicat803vqa1.html#TT234669"}
@inproceedings{bb239754,
AUTHOR = "Yang, X. and Gao, C. Y. and Zhang, H. W. and Cai, J. F.",
TITLE = "Auto-Parsing Network for Image Captioning and Visual Question
Answering",
BOOKTITLE = ICCV21,
YEAR = "2021",
PAGES = "2177--2187",
BIBSOURCE = "http://www.visionbib.com/bibliography/applicat803vqa1.html#TT234670"}
@inproceedings{bb239755,
AUTHOR = "Banerjee, P. and Gokhale, T. and Yang, Y. Z. and Baral, C.",
TITLE = "Weakly Supervised Relative Spatial Reasoning for Visual Question
Answering",
BOOKTITLE = ICCV21,
YEAR = "2021",
PAGES = "1888--1898",
BIBSOURCE = "http://www.visionbib.com/bibliography/applicat803vqa1.html#TT234671"}
@inproceedings{bb239756,
AUTHOR = "Li, L. J. and Lei, J. and Gan, Z. and Liu, J. J.",
TITLE = "Adversarial {VQA}:
A New Benchmark for Evaluating the Robustness of {VQA} Models",
BOOKTITLE = ICCV21,
YEAR = "2021",
PAGES = "2022--2031",
BIBSOURCE = "http://www.visionbib.com/bibliography/applicat803vqa1.html#TT234672"}
@inproceedings{bb239757,
AUTHOR = "Askarian, N. and Abbasnejad, E. and Zukerman, I. and Buntine, W. and Haffari, G.",
TITLE = "Inductive Biases for Low Data {VQA}: A Data Augmentation Approach",
BOOKTITLE = Novelty22,
YEAR = "2022",
PAGES = "231--240",
BIBSOURCE = "http://www.visionbib.com/bibliography/applicat803vqa1.html#TT234673"}
@inproceedings{bb239758,
AUTHOR = "Mathew, M. and Bagal, V. and Tito, R. and Karatzas, D. and Valveny, E. and Jawahar, C. V.",
TITLE = "{InfographicVQA}",
BOOKTITLE = WACV22,
YEAR = "2022",
PAGES = "2582--2591",
BIBSOURCE = "http://www.visionbib.com/bibliography/applicat803vqa1.html#TT234674"}
@inproceedings{bb239759,
AUTHOR = "Kumar, S. and Patro, B. N. and Namboodiri, V. P.",
TITLE = "Auto {QA}: The Question Is Not Only What, but Also Where",
BOOKTITLE = Novelty22,
YEAR = "2022",
PAGES = "272--281",
BIBSOURCE = "http://www.visionbib.com/bibliography/applicat803vqa1.html#TT234675"}
@inproceedings{bb239760,
AUTHOR = "Kolling, C. and More, M. and Gavenski, N. and Pooch, E. and Parraga, O. and Barros, R. C.",
TITLE = "Efficient Counterfactual Debiasing for Visual Question Answering",
BOOKTITLE = WACV22,
YEAR = "2022",
PAGES = "2572--2581",
BIBSOURCE = "http://www.visionbib.com/bibliography/applicat803vqa1.html#TT234676"}
@inproceedings{bb239761,
AUTHOR = "Jung, S. J. and Byun, J. Y. and Shim, K. and Hwang, S. Y. and Kim, C.",
TITLE = "Understanding {VQA} for Negative Answers Through Visual and Linguistic
Inference",
BOOKTITLE = ICIP21,
YEAR = "2021",
PAGES = "2873--2877",
BIBSOURCE = "http://www.visionbib.com/bibliography/applicat803vqa1.html#TT234677"}
@inproceedings{bb239762,
AUTHOR = "Le, T. and Nguyen, H. T. and Nguyen, M. L.",
TITLE = "Vision and Text Transformer for Predicting Answerability on Visual
Question Answering",
BOOKTITLE = ICIP21,
YEAR = "2021",
PAGES = "934--938",
BIBSOURCE = "http://www.visionbib.com/bibliography/applicat803vqa1.html#TT234678"}
@inproceedings{bb239763,
AUTHOR = "Huang, Z. Q. and Zhu, H. Y. and Sun, Y. and Choi, D. and Tan, C. and Lim, J. H.",
TITLE = "A Diagnostic Study of Visual Question Answering With Analogical
Reasoning",
BOOKTITLE = ICIP21,
YEAR = "2021",
PAGES = "2463--2467",
BIBSOURCE = "http://www.visionbib.com/bibliography/applicat803vqa1.html#TT234679"}
@inproceedings{bb239764,
AUTHOR = "Wang, Z. X. and Miao, Y. and Specia, L.",
TITLE = "Latent Variable Models for Visual Question Answering",
BOOKTITLE = CLVL21,
YEAR = "2021",
PAGES = "3137--3141",
BIBSOURCE = "http://www.visionbib.com/bibliography/applicat803vqa1.html#TT234680"}
@inproceedings{bb239765,
AUTHOR = "Hirota, Y. and Garcia, N. and Otani, M. and Chu, C. and Nakashima, Y. and Taniguchi, I. and Onoye, T.",
TITLE = "Visual Question Answering with Textual Representations for Images",
BOOKTITLE = CLVL21,
YEAR = "2021",
PAGES = "3147--3150",
BIBSOURCE = "http://www.visionbib.com/bibliography/applicat803vqa1.html#TT234681"}
@inproceedings{bb239766,
AUTHOR = "Ye, K. and Kovashka, A.",
TITLE = "Linguistic Structures as Weak Supervision for Visual Scene Graph
Generation",
BOOKTITLE = CVPR21,
YEAR = "2021",
PAGES = "8285--8295",
BIBSOURCE = "http://www.visionbib.com/bibliography/applicat803vqa1.html#TT234682"}
@inproceedings{bb239767,
AUTHOR = "Xiao, J. B. and Shang, X. and Yao, A. and Chua, T. S.",
TITLE = "{NExT-QA}: Next Phase of Question-Answering to Explaining Temporal
Actions",
BOOKTITLE = CVPR21,
YEAR = "2021",
PAGES = "9772--9781",
BIBSOURCE = "http://www.visionbib.com/bibliography/applicat803vqa1.html#TT234683"}
@inproceedings{bb239768,
AUTHOR = "Chen, X. Y. and Jiang, M. and Zhao, Q.",
TITLE = "Predicting Human Scanpaths in Visual Question Answering",
BOOKTITLE = CVPR21,
YEAR = "2021",
PAGES = "10871--10880",
BIBSOURCE = "http://www.visionbib.com/bibliography/applicat803vqa1.html#TT234684"}
@inproceedings{bb239769,
AUTHOR = "Qi, Y. G. and Zhang, K. and Sain, A. and Song, Y. Z.",
TITLE = "{PQA}: Perceptual Question Answering",
BOOKTITLE = CVPR21,
YEAR = "2021",
PAGES = "12051--12059",
BIBSOURCE = "http://www.visionbib.com/bibliography/applicat803vqa1.html#TT234685"}
@inproceedings{bb239770,
AUTHOR = "Yuan, Y. Y. and Wang, S. and Jiang, M. Y. and Chen, T. Y.",
TITLE = "Perception Matters: Detecting Perception Failures of {VQA} Models Using
Metamorphic Testing",
BOOKTITLE = CVPR21,
YEAR = "2021",
PAGES = "16903--16912",
BIBSOURCE = "http://www.visionbib.com/bibliography/applicat803vqa1.html#TT234686"}
@inproceedings{bb239771,
AUTHOR = "Marino, K. and Chen, X. L. and Parikh, D. and Gupta, A. and Rohrbach, M.",
TITLE = "{KRISP}: Integrating Implicit and Symbolic Knowledge for Open-Domain
Knowledge-Based {VQA}",
BOOKTITLE = CVPR21,
YEAR = "2021",
PAGES = "14106--14116",
BIBSOURCE = "http://www.visionbib.com/bibliography/applicat803vqa1.html#TT234687"}
@inproceedings{bb239772,
AUTHOR = "Niu, Y. and Tang, K. and Zhang, H. W. and Lu, Z. W. and Hua, X. S. and Wen, J. R.",
TITLE = "Counterfactual {VQA}: A Cause-Effect Look at Language Bias",
BOOKTITLE = CVPR21,
YEAR = "2021",
PAGES = "12695--12705",
BIBSOURCE = "http://www.visionbib.com/bibliography/applicat803vqa1.html#TT234688"}
@inproceedings{bb239773,
AUTHOR = "Yang, Z. Y. and Lu, Y. J. and Wang, J. F. and Yin, X. and Florencio, D. and Wang, L. J. and Zhang, C. and Zhang, L. and Luo, J. B.",
TITLE = "{TAP}: Text-Aware Pre-training for {Text-VQA} and {Text-Caption}",
BOOKTITLE = CVPR21,
YEAR = "2021",
PAGES = "8747--8757",
BIBSOURCE = "http://www.visionbib.com/bibliography/applicat803vqa1.html#TT234689"}
@inproceedings{bb239774,
AUTHOR = "Kervadec, C. and Jaunet, T. and Antipov, G. and Baccouche, M. and Vuillemot, R. and Wolf, C.",
TITLE = "How Transferable are Reasoning Patterns in {VQA}?",
BOOKTITLE = CVPR21,
YEAR = "2021",
PAGES = "4205--4214",
BIBSOURCE = "http://www.visionbib.com/bibliography/applicat803vqa1.html#TT234690"}
@inproceedings{bb239775,
AUTHOR = "Kervadec, C. and Antipov, G. and Baccouche, M. and Wolf, C.",
TITLE = "Roses are Red, Violets are Blue{\ldots} But Should {VQA} expect Them To?",
BOOKTITLE = CVPR21,
YEAR = "2021",
PAGES = "2775--2784",
BIBSOURCE = "http://www.visionbib.com/bibliography/applicat803vqa1.html#TT234691"}
@inproceedings{bb239776,
AUTHOR = "Dua, R. and Kancheti, S. S. and Balasubramanian, V. N.",
TITLE = "Beyond {VQA}: Generating Multi-word Answers and Rationales to Visual
Questions",
BOOKTITLE = MULA21,
YEAR = "2021",
PAGES = "1623--1632",
BIBSOURCE = "http://www.visionbib.com/bibliography/applicat803vqa1.html#TT234692"}
@inproceedings{bb239777,
AUTHOR = "Rahman, T. and Chou, S. H. and Sigal, L. and Carenini, G.",
TITLE = "An Improved Attention for Visual Question Answering",
BOOKTITLE = MULA21,
YEAR = "2021",
PAGES = "1653--1662",
BIBSOURCE = "http://www.visionbib.com/bibliography/applicat803vqa1.html#TT234693"}
@inproceedings{bb239778,
AUTHOR = "Jolly, S. and Palacio, S. and Folz, J. and Raue, F. and Hees, J. and Dengel, A.",
TITLE = "{P $\approx$ NP}, at least in Visual Question Answering",
BOOKTITLE = ICPR21,
YEAR = "2021",
PAGES = "2748--2754",
BIBSOURCE = "http://www.visionbib.com/bibliography/applicat803vqa1.html#TT234694"}
@inproceedings{bb239779,
AUTHOR = "Mishra, A. and Anand, A. and Guha, P.",
TITLE = "Multi-stage Attention based Visual Question Answering",
BOOKTITLE = ICPR21,
YEAR = "2021",
PAGES = "9407--9414",
BIBSOURCE = "http://www.visionbib.com/bibliography/applicat803vqa1.html#TT234695"}
@inproceedings{bb239780,
AUTHOR = "Bozinis, T. and Passalis, N. and Tefas, A.",
TITLE = "Improving Visual Question Answering using Active Perception on Static
Images",
BOOKTITLE = ICPR21,
YEAR = "2021",
PAGES = "879--884",
BIBSOURCE = "http://www.visionbib.com/bibliography/applicat803vqa1.html#TT234696"}
@inproceedings{bb239781,
AUTHOR = "Sun, Q. and Xie, B. H. and Fu, Y. W.",
TITLE = "Second Order Enhanced Multi-Glimpse Attention in Visual Question
Answering",
BOOKTITLE = ACCV20,
YEAR = "2020",
PAGES = "IV:87--103",
BIBSOURCE = "http://www.visionbib.com/bibliography/applicat803vqa1.html#TT234697"}
@inproceedings{bb239782,
AUTHOR = "Goel, V. and Chandak, M. and Anand, A. and Guha, P.",
TITLE = "{IQ-VQA}: Intelligent Visual Question Answering",
BOOKTITLE = VTIUR20,
YEAR = "2020",
PAGES = "357--370",
BIBSOURCE = "http://www.visionbib.com/bibliography/applicat803vqa1.html#TT234698"}
@inproceedings{bb239783,
AUTHOR = "Qiao, Y. and Yu, Z. and Liu, J.",
TITLE = "{VC-VQA}: Visual Calibration Mechanism For Visual Question Answering",
BOOKTITLE = ICIP20,
YEAR = "2020",
PAGES = "1481--1485",
BIBSOURCE = "http://www.visionbib.com/bibliography/applicat803vqa1.html#TT234699"}
@inproceedings{bb239784,
AUTHOR = "Tang, R. X. and Ma, C. and Zhang, W. E. and Wu, Q. and Yang, X. K.",
TITLE = "Semantic Equivalent Adversarial Data Augmentation for Visual Question
Answering",
BOOKTITLE = ECCV20,
YEAR = "2020",
PAGES = "XIX:437--453",
BIBSOURCE = "http://www.visionbib.com/bibliography/applicat803vqa1.html#TT234700"}
@inproceedings{bb239785,
AUTHOR = "Gokhale, T. and Banerjee, P. and Baral, C. and Yang, Y. Z.",
TITLE = "{VQA-LOL}: Visual Question Answering Under the Lens of Logic",
BOOKTITLE = ECCV20,
YEAR = "2020",
PAGES = "XXI:379--396",
BIBSOURCE = "http://www.visionbib.com/bibliography/applicat803vqa1.html#TT234701"}
@inproceedings{bb239786,
AUTHOR = "Yang, X. F. and Lin, G. S. and Lv, F. M. and Liu, F. Y.",
TITLE = "{TRRNET}:
Tiered Relation Reasoning for Compositional Visual Question Answering",
BOOKTITLE = ECCV20,
YEAR = "2020",
PAGES = "XXI:414--430",
BIBSOURCE = "http://www.visionbib.com/bibliography/applicat803vqa1.html#TT234702"}
@inproceedings{bb239787,
AUTHOR = "Bansal, A. and Zhang, Y. and Chellappa, R.",
TITLE = "Visual Question Answering on Image Sets",
BOOKTITLE = ECCV20,
YEAR = "2020",
PAGES = "XXI:51--67",
BIBSOURCE = "http://www.visionbib.com/bibliography/applicat803vqa1.html#TT234703"}
@inproceedings{bb239788,
AUTHOR = "Han, X. Z. and Wang, S. H. and Su, C. and Zhang, W. G. and Huang, Q. M. and Tian, Q.",
TITLE = "Interpretable Visual Reasoning via Probabilistic Formulation Under
Natural Supervision",
BOOKTITLE = ECCV20,
YEAR = "2020",
PAGES = "IX:553--570",
BIBSOURCE = "http://www.visionbib.com/bibliography/applicat803vqa1.html#TT234704"}
@inproceedings{bb239789,
AUTHOR = "Li, Q. and Huang, S. Y. and Hong, Y. and Zhu, S. C.",
TITLE = "A Competence-aware Curriculum for Visual Concepts Learning via Question
Answering",
BOOKTITLE = ECCV20,
YEAR = "2020",
PAGES = "II:141--157",
BIBSOURCE = "http://www.visionbib.com/bibliography/applicat803vqa1.html#TT234705"}
@inproceedings{bb239790,
AUTHOR = "Bajaj, G. and Bandyopadhyay, B. and Schmidt, D. and Maneriker, P. and Myers, C. and Parthasarathy, S.",
TITLE = "Understanding Knowledge Gaps in Visual Question Answering:
Implications for Gap Identification and Testing",
BOOKTITLE = MVM20,
YEAR = "2020",
PAGES = "1563--1566",
BIBSOURCE = "http://www.visionbib.com/bibliography/applicat803vqa1.html#TT234706"}
@inproceedings{bb239791,
AUTHOR = "Vatashsky, B. and Ullman, S.",
TITLE = "{VQA} With No Questions-Answers Training",
BOOKTITLE = CVPR20,
YEAR = "2020",
PAGES = "10373--10383",
BIBSOURCE = "http://www.visionbib.com/bibliography/applicat803vqa1.html#TT234707"}
@inproceedings{bb239792,
AUTHOR = "Jiang, H. and Misra, I. and Rohrbach, M. and Learned Miller, E. G. and Chen, X.",
TITLE = "In Defense of Grid Features for Visual Question Answering",
BOOKTITLE = CVPR20,
YEAR = "2020",
PAGES = "10264--10273",
BIBSOURCE = "http://www.visionbib.com/bibliography/applicat803vqa1.html#TT234708"}
@inproceedings{bb239793,
AUTHOR = "Wang, X. and Liu, Y. and Shen, C. and Ng, C. C. and Luo, C. and Jin, L. and Chan, C. S. and van den Hengel, A. and Wang, L.",
TITLE = "On the General Value of Evidence, and Bilingual Scene-Text Visual
Question Answering",
BOOKTITLE = CVPR20,
YEAR = "2020",
PAGES = "10123--10132",
BIBSOURCE = "http://www.visionbib.com/bibliography/applicat803vqa1.html#TT234709"}
@inproceedings{bb239794,
AUTHOR = "Xiong, P. and Wu, Y.",
TITLE = "{TA-Student} {VQA}: Multi-Agents Training by Self-Questioning",
BOOKTITLE = CVPR20,
YEAR = "2020",
PAGES = "10062--10072",
BIBSOURCE = "http://www.visionbib.com/bibliography/applicat803vqa1.html#TT234710"}
@inproceedings{bb239795,
AUTHOR = "Agarwal, V. and Shetty, R. and Fritz, M.",
TITLE = "Towards Causal {VQA}: Revealing and Reducing Spurious Correlations by
Invariant and Covariant Semantic Editing",
BOOKTITLE = CVPR20,
YEAR = "2020",
PAGES = "9687--9695",
BIBSOURCE = "http://www.visionbib.com/bibliography/applicat803vqa1.html#TT234711"}
@inproceedings{bb239796,
AUTHOR = "Kafle, K. and Shrestha, R. and Price, B. and Cohen, S. and Kanan, C.",
TITLE = "Answering Questions about Data Visualizations using Efficient Bimodal
Fusion",
BOOKTITLE = WACV20,
YEAR = "2020",
PAGES = "1487--1496",
BIBSOURCE = "http://www.visionbib.com/bibliography/applicat803vqa1.html#TT234712"}
@inproceedings{bb239797,
AUTHOR = "Patro, B. N. and Patel, S. and Namboodiri, V. P.",
TITLE = "Robust Explanations for Visual Question Answering",
BOOKTITLE = WACV20,
YEAR = "2020",
PAGES = "1566--1575",
BIBSOURCE = "http://www.visionbib.com/bibliography/applicat803vqa1.html#TT234713"}
@inproceedings{bb239798,
AUTHOR = "Chou, S. and Chao, W. and Lai, W. and Sun, M. and Yang, M.",
TITLE = "Visual Question Answering on {$360^{\circ}$} Images",
BOOKTITLE = WACV20,
YEAR = "2020",
PAGES = "1596--1605",
BIBSOURCE = "http://www.visionbib.com/bibliography/applicat803vqa1.html#TT234714"}
@inproceedings{bb239799,
AUTHOR = "Chaudhry, R. and Shekhar, S. and Gupta, U. and Maneriker, P. and Bansal, P. and Joshi, A.",
TITLE = "{LEAF-QA}: Locate, Encode Attend for Figure Question Answering",
BOOKTITLE = WACV20,
YEAR = "2020",
PAGES = "3501--3510",
BIBSOURCE = "http://www.visionbib.com/bibliography/applicat803vqa1.html#TT234715"}
Last update: Feb 26, 2026 at 10:58:24