Multimodal Algorithmic Reasoning Workshop
Exemplar Masking for Multimodal Incremental Learning
[pdf]
[supp]
[arXiv]
[bibtex]
@comment{Lee_2025_CVPR: paper in the CVPR 2025 Workshops proceedings. The page range uses "--" and the month uses the standard "jun" macro so that any bibliography style can format them.}
@InProceedings{Lee_2025_CVPR,
  author    = {Lee, Yi-Lun and Lee, Chen-Yu and Chiu, Wei-Chen and Tsai, Yi-Hsuan},
  title     = {Exemplar Masking for Multimodal Incremental Learning},
  booktitle = {Proceedings of the Computer Vision and Pattern Recognition Conference ({CVPR}) Workshops},
  month     = jun,
  year      = {2025},
  pages     = {2942--2951},
}
Comparison Visual Instruction Tuning
[pdf]
[supp]
[arXiv]
[bibtex]
@comment{Lin_2025_CVPR: paper in the CVPR 2025 Workshops proceedings. The page range uses "--" and the month uses the standard "jun" macro so that any bibliography style can format them.}
@InProceedings{Lin_2025_CVPR,
  author    = {Lin, Wei and Mirza, Muhammad Jehanzeb and Doveh, Sivan and Feris, Rogerio and Giryes, Raja and Hochreiter, Sepp and Karlinsky, Leonid},
  title     = {Comparison Visual Instruction Tuning},
  booktitle = {Proceedings of the Computer Vision and Pattern Recognition Conference ({CVPR}) Workshops},
  month     = jun,
  year      = {2025},
  pages     = {2973--2983},
}
Human vs. Machine Minds: Ego-Centric Action Recognition Compared
[pdf]
[bibtex]
@comment{Rahmaniboldaji_2025_CVPR: paper in the CVPR 2025 Workshops proceedings. The page range uses "--" and the month uses the standard "jun" macro so that any bibliography style can format them.}
@InProceedings{Rahmaniboldaji_2025_CVPR,
  author    = {Rahmaniboldaji, Sadegh and Rybansky, Filip and Vuong, Quoc and Guerin, Frank and Gilbert, Andrew},
  title     = {Human vs. Machine Minds: Ego-Centric Action Recognition Compared},
  booktitle = {Proceedings of the Computer Vision and Pattern Recognition Conference ({CVPR}) Workshops},
  month     = jun,
  year      = {2025},
  pages     = {2952--2962},
}
SilVar-Med: A Speech-Driven Visual Language Model for Explainable Abnormality Detection in Medical Imaging
[pdf]
[bibtex]
@comment{Pham_2025_CVPR: paper in the CVPR 2025 Workshops proceedings. The mixed-case name "SilVar-Med" is brace-protected so sentence-casing styles keep its capitalisation; the page range uses "--" and the month uses the "jun" macro.}
@InProceedings{Pham_2025_CVPR,
  author    = {Pham, Tan-Hanh and Bui, Trong-Duong and Quang, Minh Luu and Pham, Tan Huong and Ngo, Chris and Hy, Truong Son},
  title     = {{SilVar-Med}: A Speech-Driven Visual Language Model for Explainable Abnormality Detection in Medical Imaging},
  booktitle = {Proceedings of the Computer Vision and Pattern Recognition Conference ({CVPR}) Workshops},
  month     = jun,
  year      = {2025},
  pages     = {2984--2994},
}
Autonomous Multimodal Reasoning via Implicit Chain-of-Vision
[pdf]
[bibtex]
@comment{Huang_2025_CVPR: paper in the CVPR 2025 Workshops proceedings. The page range uses "--" and the month uses the standard "jun" macro so that any bibliography style can format them.}
@InProceedings{Huang_2025_CVPR,
  author    = {Huang, Yiqiao and He, Qi and Chen, Zhaorun and Zhang, Haopeng and Yu, Hanchao and Zhao, Zhuokai},
  title     = {Autonomous Multimodal Reasoning via Implicit Chain-of-Vision},
  booktitle = {Proceedings of the Computer Vision and Pattern Recognition Conference ({CVPR}) Workshops},
  month     = jun,
  year      = {2025},
  pages     = {2963--2972},
}
Illusory VQA: Benchmarking and Enhancing Multimodal Models on Visual Illusions
[pdf]
[supp]
[arXiv]
[bibtex]
@comment{Rostamkhani_2025_CVPR: paper in the CVPR 2025 Workshops proceedings. The acronym "VQA" is brace-protected so sentence-casing styles keep it upper-case; the page range uses "--" and the month uses the "jun" macro.}
@InProceedings{Rostamkhani_2025_CVPR,
  author    = {Rostamkhani, Mohammadmostafa and Ansari, Baktash and Sabzevari, Hoorieh and Rahmani, Farzan and Eetemadi, Sauleh},
  title     = {Illusory {VQA}: Benchmarking and Enhancing Multimodal Models on Visual Illusions},
  booktitle = {Proceedings of the Computer Vision and Pattern Recognition Conference ({CVPR}) Workshops},
  month     = jun,
  year      = {2025},
  pages     = {2995--3004},
}