Unified Robotic Vision with Cross-Modal Sensing and Alignment
GeomPrompt: Geometric Prompt Learning for RGB-D Semantic Segmentation Under Missing and Degraded Depth
[pdf]
[arXiv]
[bibtex]@InProceedings{Jaganathan_2026_CVPR,
  author    = {Jaganathan, Krishna and Vela, Patricio},
  title     = {{GeomPrompt}: Geometric Prompt Learning for {RGB-D} Semantic Segmentation Under Missing and Degraded Depth},
  booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR) Workshops},
  month     = jun,
  year      = {2026},
  pages     = {8268--8278}
}
MARVEL: Multimodal Adaptive Reasoning-intensiVe Expand-rerank and retrievaL
[pdf]
[arXiv]
[bibtex]@InProceedings{Kasem_2026_CVPR,
  author    = {Kasem, Mahmoud SalahEldin and Mahmoud, Mohamed and Senussi, Mostafa Farouk and Abdalla, Mahmoud and Abdallah, Abdelrahman and Kang, Hyun-Soo},
  title     = {{MARVEL}: Multimodal Adaptive {Reasoning-intensiVe} Expand-rerank and {retrievaL}},
  booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR) Workshops},
  month     = jun,
  year      = {2026},
  pages     = {8279--8288}
}
Adverse-to-the-eXtreme Panoptic Segmentation: URVIS 2026 Study and Benchmark
[pdf]
[arXiv]
[bibtex]@InProceedings{Wang_2026_CVPR,
  author    = {Wang, Yiting and Peyratout, Nolwenn and Broedermann, Tim and Wang, Jiahui and Cao, Yusi and Cazzola, Michele and Tarassov, Elie and Kobayashi, Takuya and Kasmi, Abderrahim and Allibert, Guillaume and Demonceaux, C{\'e}dric and Donzella, Valentina and Debattista, Kurt and Timofte, Radu and Wu, Zongwei and Sakaridis, Christos},
  title     = {{Adverse-to-the-eXtreme} Panoptic Segmentation: {URVIS} 2026 Study and Benchmark},
  booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR) Workshops},
  month     = jun,
  year      = {2026},
  pages     = {8346--8354}
}
Toward Efficient Visual Gyroscopes: Spherical Moments, Harmonics Filtering, and Masking Techniques for Spherical Camera Applications
[pdf]
[arXiv]
[bibtex]@InProceedings{Du_2026_CVPR,
  author    = {Du, Yao and Mateo, Carlos and Maras, Mirjana and Wang, Tsun-Hsuan and Blanchon, Marc and Amini, Alexander and Rus, Daniela and Tahri, Omar},
  title     = {Toward Efficient Visual Gyroscopes: Spherical Moments, Harmonics Filtering, and Masking Techniques for Spherical Camera Applications},
  booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR) Workshops},
  month     = jun,
  year      = {2026},
  pages     = {8248--8256}
}
Object Tracking in the Real World: URVIS 2026 Study and Benchmark
[pdf]
[supp]
[bibtex]@InProceedings{Lu_2026_CVPR,
  author    = {Lu, Andong and Ding, Zhaodong and Li, Chenglong and Tang, Jin and Wu, Zongwei and Tan, Yuedong and Timofte, Radu and Hu, Xiantao and Wang, He and Tang, Zhangyong and Xu, Tianyang and Wu, Xiaojun and Tai, Ying and Yang, Jian and Zhu, Yabin and Zhang, Chunhui and Liu, Li and Wen, Hao and Zhou, Xi and Wang, Yanfeng and Wang, Shilei and Du, Yipin and Cheng, Yongkang and Lai, Pujian and Gao, Dong and Cheng, Gong and Xi, Jihuan and Zhou, Yong and Zhou, Jinglin and Zhu, Xuefeng},
  title     = {Object Tracking in the Real World: {URVIS} 2026 Study and Benchmark},
  booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR) Workshops},
  month     = jun,
  year      = {2026},
  pages     = {8299--8307}
}
GBG-SLAM: Key-frame Centered Monocular Gaussian SLAM with Scale Consistent Dense Geometry Boosting
[pdf]
[supp]
[bibtex]@InProceedings{Fan_2026_CVPR,
  author    = {Fan, Chuanmao and Zhao, Chenxi and Duan, Ye},
  title     = {{GBG-SLAM}: Key-frame Centered Monocular {Gaussian} {SLAM} with Scale Consistent Dense Geometry Boosting},
  booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR) Workshops},
  month     = jun,
  year      = {2026},
  pages     = {8257--8267}
}
Event-to-Frame Vehicle Re-identification for Heterogeneous Camera Networks: Dataset and Algorithm
[pdf]
[bibtex]@InProceedings{Menon_2026_CVPR,
  author    = {Menon, Nitesh and McCloskey, Scott},
  title     = {Event-to-Frame Vehicle Re-identification for Heterogeneous Camera Networks: Dataset and Algorithm},
  booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR) Workshops},
  month     = jun,
  year      = {2026},
  pages     = {8318--8327}
}
SIR: Structured Image Representations for Explainable Robot Learning
[pdf]
[supp]
[bibtex]@InProceedings{Mattes_2026_CVPR,
  author    = {Mattes, Paul and Schwab, Jan and Bosch, Jens and Blank, Nils and Li, Maximilian Xiling and Tang, Minh-Trung and Haberland, Moritz and Lioutikov, Rudolf},
  title     = {{SIR}: Structured Image Representations for Explainable Robot Learning},
  booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR) Workshops},
  month     = jun,
  year      = {2026},
  pages     = {8308--8317}
}
InfoCalib: Information-Theoretic Collapse Diagnosis and Dynamic Calibration for Robust Multimodal Frequency Fusion
[pdf]
[bibtex]@InProceedings{Li_2026_CVPR,
  author    = {Li, Shenzhi and Qin, Boao and Wang, Peng and Deng, Rangyu},
  title     = {{InfoCalib}: Information-Theoretic Collapse Diagnosis and Dynamic Calibration for Robust Multimodal Frequency Fusion},
  booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR) Workshops},
  month     = jun,
  year      = {2026},
  pages     = {8289--8298}
}
Le MuMo JEPA: Multi-Modal Self-Supervised Representation Learning with Learnable Fusion Tokens
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Cornelissen_2026_CVPR,
  author    = {Cornelissen, Ciem and Leroux, Sam and Simoens, Pieter},
  title     = {Le {MuMo} {JEPA}: Multi-Modal Self-Supervised Representation Learning with Learnable Fusion Tokens},
  booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR) Workshops},
  month     = jun,
  year      = {2026},
  pages     = {8238--8247}
}
Hear2See: Speech-Driven Visual Reasoning under Linguistic Variability
[pdf]
[bibtex]@InProceedings{Santos_2026_CVPR,
  author    = {Santos, Joel and Wu, Zongwei and Timofte, Radu},
  title     = {{Hear2See}: Speech-Driven Visual Reasoning under Linguistic Variability},
  booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR) Workshops},
  month     = jun,
  year      = {2026},
  pages     = {8328--8337}
}
DCTrack: Divide-and-Conquer for Modality-Missing RGBT Tracking
[pdf]
[bibtex]@InProceedings{Wang_2026_CVPR,
  author    = {Wang, Shilei and Du, Yipin and Cheng, Yongkang and Lai, Pujian and Gao, Dong and Cheng, Gong},
  title     = {{DCTrack}: Divide-and-Conquer for Modality-Missing {RGBT} Tracking},
  booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR) Workshops},
  month     = jun,
  year      = {2026},
  pages     = {8338--8345}
}
Joint Multi-Camera LiDAR Extrinsic Calibration via Learned Pairwise Initialization and Geometric Refinement
[pdf]
[bibtex]@InProceedings{Al-Najjar_2026_CVPR,
  author    = {Al-Najjar, Aziz and Amini, Marzieh and Green, James R and Kwamena, Felix},
  title     = {Joint Multi-Camera {LiDAR} Extrinsic Calibration via Learned Pairwise Initialization and Geometric Refinement},
  booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR) Workshops},
  month     = jun,
  year      = {2026},
  pages     = {8229--8237}
}

