CVPR 2025 Open Access Repository

Multimodal Algorithmic Reasoning Workshop

Exemplar Masking for Multimodal Incremental Learning: Yi-Lun Lee,

Chen-Yu Lee,

Wei-Chen Chiu,

Yi-Hsuan Tsai; [pdf] [supp] [arXiv]
[bibtex]
% Workshop paper from the CVPR 2025 listing (Multimodal Algorithmic Reasoning Workshop).
@InProceedings{Lee_2025_CVPR,
  author    = {Lee, Yi-Lun and Lee, Chen-Yu and Chiu, Wei-Chen and Tsai, Yi-Hsuan},
  title     = {Exemplar Masking for Multimodal Incremental Learning},
  booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR) Workshops},
  month     = jun,
  year      = {2025},
  pages     = {2967--2976},
}
Comparison Visual Instruction Tuning: Wei Lin,

Muhammad Jehanzeb Mirza,

Sivan Doveh,

Rogerio Feris,

Raja Giryes,

Sepp Hochreiter,

Leonid Karlinsky; [pdf] [supp] [arXiv]
[bibtex]
% Workshop paper from the CVPR 2025 listing (Multimodal Algorithmic Reasoning Workshop).
@InProceedings{Lin_2025_CVPR,
  author    = {Lin, Wei and Mirza, Muhammad Jehanzeb and Doveh, Sivan and Feris, Rogerio and Giryes, Raja and Hochreiter, Sepp and Karlinsky, Leonid},
  title     = {Comparison Visual Instruction Tuning},
  booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR) Workshops},
  month     = jun,
  year      = {2025},
  pages     = {2998--3008},
}
Human vs. Machine Minds: Ego-Centric Action Recognition Compared: Sadegh Rahmaniboldaji,

Filip Rybansky,

Quoc Vuong,

Frank Guerin,

Andrew Gilbert; [pdf]
[bibtex]
% Workshop paper from the CVPR 2025 listing (Multimodal Algorithmic Reasoning Workshop).
@InProceedings{Rahmaniboldaji_2025_CVPR,
  author    = {Rahmaniboldaji, Sadegh and Rybansky, Filip and Vuong, Quoc and Guerin, Frank and Gilbert, Andrew},
  title     = {Human vs. Machine Minds: Ego-Centric Action Recognition Compared},
  booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR) Workshops},
  month     = jun,
  year      = {2025},
  pages     = {2977--2987},
}
SilVar-Med: A Speech-Driven Visual Language Model for Explainable Abnormality Detection in Medical Imaging: Tan-Hanh Pham,

Trong-Duong Bui,

Minh Luu Quang,

Tan Huong Pham,

Chris Ngo,

Truong Son Hy; [pdf] [arXiv]
[bibtex]
% Workshop paper from the CVPR 2025 listing (Multimodal Algorithmic Reasoning Workshop).
% The braces around SilVar-Med keep its mixed-case spelling under styles that recase titles.
@InProceedings{Pham_2025_CVPR,
  author    = {Pham, Tan-Hanh and Bui, Trong-Duong and Quang, Minh Luu and Pham, Tan Huong and Ngo, Chris and Hy, Truong Son},
  title     = {{SilVar-Med}: A Speech-Driven Visual Language Model for Explainable Abnormality Detection in Medical Imaging},
  booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR) Workshops},
  month     = jun,
  year      = {2025},
  pages     = {3009--3019},
}
Autonomous Multimodal Reasoning via Implicit Chain-of-Vision: Yiqiao Huang,

Qi He,

Zhaorun Chen,

Haopeng Zhang,

Hanchao Yu,

Zhuokai Zhao; [pdf]
[bibtex]
% Workshop paper from the CVPR 2025 listing (Multimodal Algorithmic Reasoning Workshop).
@InProceedings{Huang_2025_CVPR,
  author    = {Huang, Yiqiao and He, Qi and Chen, Zhaorun and Zhang, Haopeng and Yu, Hanchao and Zhao, Zhuokai},
  title     = {Autonomous Multimodal Reasoning via Implicit Chain-of-Vision},
  booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR) Workshops},
  month     = jun,
  year      = {2025},
  pages     = {2988--2997},
}
Illusory VQA: Benchmarking and Enhancing Multimodal Models on Visual Illusions: Mohammadmostafa Rostamkhani,

Baktash Ansari,

Hoorieh Sabzevari,

Farzan Rahmani,

Sauleh Eetemadi; [pdf] [supp] [arXiv]
[bibtex]
% Workshop paper from the CVPR 2025 listing (Multimodal Algorithmic Reasoning Workshop).
% The braces around VQA keep the acronym uppercase under styles that sentence-case titles.
@InProceedings{Rostamkhani_2025_CVPR,
  author    = {Rostamkhani, Mohammadmostafa and Ansari, Baktash and Sabzevari, Hoorieh and Rahmani, Farzan and Eetemadi, Sauleh},
  title     = {Illusory {VQA}: Benchmarking and Enhancing Multimodal Models on Visual Illusions},
  booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR) Workshops},
  month     = jun,
  year      = {2025},
  pages     = {3020--3029},
}