Workshop on Any-to-any Multimodal Learning
Neural Surface Reconstruction from Sparse Views Using Epipolar Geometry
[pdf]
[arXiv]
[bibtex]@InProceedings{Chang_2026_CVPR,
  author    = {Chang, Xinhai and Zhou, Kaichen},
  title     = {Neural Surface Reconstruction from Sparse Views Using Epipolar Geometry},
  booktitle = {Proceedings of the {IEEE/CVF} Conference on Computer Vision and Pattern Recognition ({CVPR}) Workshops},
  month     = jun,
  year      = {2026},
  pages     = {7607--7617},
}
VeRVE: Versatile Retrieval for Videos via Unified Embeddings
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Halbe_2026_CVPR,
  author    = {Halbe, Shaunak and Puranik, Bhagyashree and Unnikrishnan, Jayakrishnan and Thakkar, Kushan and Bhat, Vimal and Parag, Toufiq},
  title     = {{VeRVE}: Versatile Retrieval for Videos via Unified Embeddings},
  booktitle = {Proceedings of the {IEEE/CVF} Conference on Computer Vision and Pattern Recognition ({CVPR}) Workshops},
  month     = jun,
  year      = {2026},
  pages     = {7624--7633},
}
On The Application of Linear Attention in Multimodal Transformers
[pdf]
[arXiv]
[bibtex]@InProceedings{Gerami_2026_CVPR,
  author    = {Gerami, Armin and Madani, Seyedehanita and Duraiswami, Ramani},
  title     = {On The Application of Linear Attention in Multimodal Transformers},
  booktitle = {Proceedings of the {IEEE/CVF} Conference on Computer Vision and Pattern Recognition ({CVPR}) Workshops},
  month     = jun,
  year      = {2026},
  pages     = {7618--7623},
}
Purify-then-Align: Towards Robust Human Sensing under Modality Missing with Knowledge Distillation from Noisy Multimodal Teacher
[pdf]
[arXiv]
[bibtex]@InProceedings{Weng_2026_CVPR,
  author    = {Weng, Pengcheng and Qian, Yanyu and Xu, Yangxin and Wang, Fei},
  title     = {Purify-then-Align: Towards Robust Human Sensing under Modality Missing with Knowledge Distillation from Noisy Multimodal Teacher},
  booktitle = {Proceedings of the {IEEE/CVF} Conference on Computer Vision and Pattern Recognition ({CVPR}) Workshops},
  month     = jun,
  year      = {2026},
  pages     = {7634--7643},
}
Beyond Vision: Holistic World Models
[pdf]
[bibtex]@InProceedings{Yang_2026_CVPR,
  author    = {Yang, Qianwen and Kang, Yanni and Ren, Guangkai and Yang, Qingwen and Li, Nan},
  title     = {Beyond Vision: Holistic World Models},
  booktitle = {Proceedings of the {IEEE/CVF} Conference on Computer Vision and Pattern Recognition ({CVPR}) Workshops},
  month     = jun,
  year      = {2026},
  pages     = {7654--7662},
}
CODA-Mask: Contrastive and Adaptive Mask Aware Open-set Semantic Segmentation
[pdf]
[bibtex]@InProceedings{Zhang_2026_CVPR,
  author    = {Zhang, Keying and Zhao, Jiguang},
  title     = {{CODA-Mask}: Contrastive and Adaptive Mask Aware Open-set Semantic Segmentation},
  booktitle = {Proceedings of the {IEEE/CVF} Conference on Computer Vision and Pattern Recognition ({CVPR}) Workshops},
  month     = jun,
  year      = {2026},
  pages     = {7663--7672},
}
Multimodal ELBO with Diffusion Decoders
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Wesego_2026_CVPR,
  author    = {Wesego, Daniel and Rooshenas, Pedram},
  title     = {Multimodal {ELBO} with Diffusion Decoders},
  booktitle = {Proceedings of the {IEEE/CVF} Conference on Computer Vision and Pattern Recognition ({CVPR}) Workshops},
  month     = jun,
  year      = {2026},
  pages     = {7644--7653},
}

