% IJCAI-25 main-track conference paper (see the note field).
% The month is given as the predefined macro (aug) rather than a braced
% numeral so that bibliography styles can render and localize it.
% The url is the DOI resolver link; it is kept alongside doi for styles
% that only print the url field.
@inproceedings{ijcai2025p853,
  author    = {Nguyen, Dung and Ho, Minh Khoi and Ta, Huy and Nguyen, Thanh Tam and Chen, Qi and Rav, Kumar and Dang, Quy Duong and Ramchandre, Satwik and Phung, Son Lam and Liao, Zhibin and To, Minh-Son and Verjans, Johan and Nguyen, Phi Le and Phan, Vu Minh Hieu},
  title     = {Localizing Before Answering: A Benchmark for Grounded Medical Visual Question Answering},
  booktitle = {Proceedings of the Thirty-Fourth International Joint Conference on Artificial Intelligence, {IJCAI-25}},
  editor    = {Kwok, James},
  publisher = {International Joint Conferences on Artificial Intelligence Organization},
  pages     = {7670--7678},
  year      = {2025},
  month     = aug,
  note      = {Main Track},
  doi       = {10.24963/ijcai.2025/853},
  url       = {https://doi.org/10.24963/ijcai.2025/853},
}