Multimodal Algorithmic Reasoning Workshop


Exemplar Masking for Multimodal Incremental Learning
Yi-Lun Lee,
Chen-Yu Lee,
Wei-Chen Chiu,
Yi-Hsuan Tsai
[pdf] [supp] [arXiv]
[bibtex]
@inproceedings{Lee_2025_CVPR,
  author    = {Lee, Yi-Lun and Lee, Chen-Yu and Chiu, Wei-Chen and Tsai, Yi-Hsuan},
  title     = {Exemplar Masking for Multimodal Incremental Learning},
  booktitle = {Proceedings of the Computer Vision and Pattern Recognition Conference ({CVPR}) Workshops},
  month     = jun,
  year      = {2025},
  pages     = {2942--2951},
}

Comparison Visual Instruction Tuning
Wei Lin,
Muhammad Jehanzeb Mirza,
Sivan Doveh,
Rogerio Feris,
Raja Giryes,
Sepp Hochreiter,
Leonid Karlinsky
[pdf] [supp] [arXiv]
[bibtex]
@inproceedings{Lin_2025_CVPR,
  author    = {Lin, Wei and Mirza, Muhammad Jehanzeb and Doveh, Sivan and Feris, Rogerio and Giryes, Raja and Hochreiter, Sepp and Karlinsky, Leonid},
  title     = {Comparison Visual Instruction Tuning},
  booktitle = {Proceedings of the Computer Vision and Pattern Recognition Conference ({CVPR}) Workshops},
  month     = jun,
  year      = {2025},
  pages     = {2973--2983},
}

Human vs. Machine Minds: Ego-Centric Action Recognition Compared
Sadegh Rahmaniboldaji,
Filip Rybansky,
Quoc Vuong,
Frank Guerin,
Andrew Gilbert
[pdf]
[bibtex]
@inproceedings{Rahmaniboldaji_2025_CVPR,
  author    = {Rahmaniboldaji, Sadegh and Rybansky, Filip and Vuong, Quoc and Guerin, Frank and Gilbert, Andrew},
  title     = {Human vs. Machine Minds: Ego-Centric Action Recognition Compared},
  booktitle = {Proceedings of the Computer Vision and Pattern Recognition Conference ({CVPR}) Workshops},
  month     = jun,
  year      = {2025},
  pages     = {2952--2962},
}

SilVar-Med: A Speech-Driven Visual Language Model for Explainable Abnormality Detection in Medical Imaging
Tan-Hanh Pham,
Trong-Duong Bui,
Minh Luu Quang,
Tan Huong Pham,
Chris Ngo,
Truong Son Hy
[pdf]
[bibtex]
@inproceedings{Pham_2025_CVPR,
  author    = {Pham, Tan-Hanh and Bui, Trong-Duong and Quang, Minh Luu and Pham, Tan Huong and Ngo, Chris and Hy, Truong Son},
  title     = {{SilVar-Med}: A Speech-Driven Visual Language Model for Explainable Abnormality Detection in Medical Imaging},
  booktitle = {Proceedings of the Computer Vision and Pattern Recognition Conference ({CVPR}) Workshops},
  month     = jun,
  year      = {2025},
  pages     = {2984--2994},
}

Autonomous Multimodal Reasoning via Implicit Chain-of-Vision
Yiqiao Huang,
Qi He,
Zhaorun Chen,
Haopeng Zhang,
Hanchao Yu,
Zhuokai Zhao
[pdf]
[bibtex]
@inproceedings{Huang_2025_CVPR,
  author    = {Huang, Yiqiao and He, Qi and Chen, Zhaorun and Zhang, Haopeng and Yu, Hanchao and Zhao, Zhuokai},
  title     = {Autonomous Multimodal Reasoning via Implicit Chain-of-Vision},
  booktitle = {Proceedings of the Computer Vision and Pattern Recognition Conference ({CVPR}) Workshops},
  month     = jun,
  year      = {2025},
  pages     = {2963--2972},
}

Illusory VQA: Benchmarking and Enhancing Multimodal Models on Visual Illusions
Mohammadmostafa Rostamkhani,
Baktash Ansari,
Hoorieh Sabzevari,
Farzan Rahmani,
Sauleh Eetemadi
[pdf] [supp] [arXiv]
[bibtex]
@inproceedings{Rostamkhani_2025_CVPR,
  author    = {Rostamkhani, Mohammadmostafa and Ansari, Baktash and Sabzevari, Hoorieh and Rahmani, Farzan and Eetemadi, Sauleh},
  title     = {Illusory {VQA}: Benchmarking and Enhancing Multimodal Models on Visual Illusions},
  booktitle = {Proceedings of the Computer Vision and Pattern Recognition Conference ({CVPR}) Workshops},
  month     = jun,
  year      = {2025},
  pages     = {2995--3004},
}