@inproceedings{5dbb7787bad24365855e5ce710c9d57c,
title = "PLMVQA: Applying Pseudo Labels for Medical Visual Question Answering with Limited Data",
abstract = "Different from Visual Question Answering (VQA) in the general domain, Medical VQA is more challenging due to the lack of large-scale labeled datasets. In addition, Medical VQA requires high interpretability when making decisions to answer clinical questions. Thus, it should be clear which visual elements within the medical image such as organs or abnormalities are essential for answering clinical questions. To overcome these challenges, we propose a novel method based on Vision Transformer (ViT), which reformulates Medical VQA as a multi-task learning task. We first construct soft pseudo labels of logits for essential selected visual elements from limited annotation data of the existing Medical VQA dataset. Then, we apply these pseudo labels in our proposed Medical VQA model by predicting the answer and pseudo labels at the same time, which not only improves the performance of the proposed model but also presents better interpretability. Extensive experiments on two Medical VQA datasets demonstrate the effectiveness of our proposed method.",
keywords = "Medical Visual Question Answering, Multi-task Learning, Pseudo Label, Vision Transformer",
author = "Zheng Yu and Yutong Xie and Yong Xia and Qi Wu",
note = "Publisher Copyright: {\textcopyright} The Author(s), under exclusive license to Springer Nature Switzerland AG 2023.; 26th International Conference on Medical Image Computing and Computer-Assisted Intervention , MICCAI 2023 ; Conference date: 08-10-2023 Through 12-10-2023",
year = "2023",
doi = "10.1007/978-3-031-47425-5\_32",
language = "英语",
isbn = "9783031474248",
series = "Lecture Notes in Computer Science (including subseries Lecture Notes in Artificial Intelligence and Lecture Notes in Bioinformatics)",
publisher = "Springer Science and Business Media Deutschland GmbH",
pages = "357--367",
editor = "Jonghye Woo and Alessa Hering and Wilson Silva and Xiang Li and Huazhu Fu and Xiaofeng Liu and Fangxu Xing and Sanjay Purushotham and T.S. Mathai and Pritam Mukherjee and \{De Grauw\}, Max and \{Beets Tan\}, Regina and Valentina Corbetta and Elmar Kotter and Mauricio Reyes and C.F. Baumgartner and Quanzheng Li and Richard Leahy and Bin Dong and Hao Chen and Yuankai Huo and Jinglei Lv and Xinxing Xu and Xiaomeng Li and Dwarikanath Mahapatra and Li Cheng and Caroline Petitjean and Beno{\^i}t Presles",
booktitle = "Medical Image Computing and Computer Assisted Intervention – MICCAI 2023 Workshops - MTSAIL 2023, LEAF 2023, AI4Treat 2023, MMMI 2023, REMIA 2023, Held in Conjunction with MICCAI 2023, Proceedings",
}