CVPR 2026 Open Access Repository

Autonomous Understanding Through Open-world Perception and Integrated Language models for On-road Tasks

Probing the Reliability of Driving VLMs: From Inconsistent Responses to Grounded Temporal Reasoning: Chun-Peng Chang,

Chen-Yu Wang,

Holger Caesar,

Alain Pagani; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Chang_2026_CVPR,
  author    = {Chang, Chun-Peng and Wang, Chen-Yu and Caesar, Holger and Pagani, Alain},
  title     = {Probing the Reliability of Driving {VLMs}: From Inconsistent Responses to Grounded Temporal Reasoning},
  booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR) Workshops},
  month     = jun,
  year      = {2026},
  pages     = {644--654},
}
ACCIDENT: A Benchmark Dataset for Vehicle Accident Detection from Traffic Surveillance Videos: Lukas Picek,

Michal Čermák,

Marek Hanzl,

Vojtěch Čermák; [pdf] [supp]
[bibtex]
@InProceedings{Picek_2026_CVPR,
  author    = {Picek, Lukas and {\v{C}}erm{\'a}k, Michal and Hanzl, Marek and {\v{C}}erm{\'a}k, Vojt{\v{e}}ch},
  title     = {{ACCIDENT}: A Benchmark Dataset for Vehicle Accident Detection from Traffic Surveillance Videos},
  booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR) Workshops},
  month     = jun,
  year      = {2026},
  pages     = {685--694},
}
Drive Like Humans, Plan Like Machines: An Explicit Sense and Safety Aware Autonomous Driving Framework: Xia Wang,

Ziyan An,

Yuhang Zhang,

Meiyi Ma,

Daniel B. Work,

Jonathan Sprinkle; [pdf] [supp]
[bibtex]
@InProceedings{Wang_2026_CVPR,
  author    = {Wang, Xia and An, Ziyan and Zhang, Yuhang and Ma, Meiyi and Work, Daniel B. and Sprinkle, Jonathan},
  title     = {Drive Like Humans, Plan Like Machines: An Explicit Sense and Safety Aware Autonomous Driving Framework},
  booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR) Workshops},
  month     = jun,
  year      = {2026},
  pages     = {695--706},
}
Spatial-aware Vision Language Model for Autonomous Driving: Weijie Wei,

Zhipeng Luo,

Feng Ling,

Venice Erin Liong; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Wei_2026_CVPR,
  author    = {Wei, Weijie and Luo, Zhipeng and Ling, Feng and Liong, Venice Erin},
  title     = {Spatial-aware Vision Language Model for Autonomous Driving},
  booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR) Workshops},
  month     = jun,
  year      = {2026},
  pages     = {707--717},
}
Automingo: Seeing the Unseen - Vision-Language Edge Case Dataset for Detection and Analysis of Autonomous Driving: Vaclav Divis,

Íñigo Barcelo Álvarez,

Alejandro Farinas Nubla,

Enrique Sanchez,

Antonio Hernandez-Ros Briales,

Ondřej Valach,

Ivan Gruber,

Marek Hrúz; [pdf] [supp]
[bibtex]
@InProceedings{Divis_2026_CVPR,
  author    = {Divis, Vaclav and {\'A}lvarez, {\'I}{\~n}igo Barcelo and Nubla, Alejandro Farinas and Sanchez, Enrique and Briales, Antonio Hernandez-Ros and Valach, Ond{\v{r}}ej and Gruber, Ivan and Hr{\'u}z, Marek},
  title     = {{Automingo}: Seeing the Unseen - Vision-Language Edge Case Dataset for Detection and Analysis of Autonomous Driving},
  booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR) Workshops},
  month     = jun,
  year      = {2026},
  pages     = {665--674},
}
TopoMaskV3: 3D Mask Head with Dense Offset and Height Predictions for Road Topology Understanding: Muhammet Esat Kalfaoglu,

Halil Ibrahim Öztürk,

Ozsel Kilinc,

Alptekin Temizel; [pdf] [supp]
[bibtex]
@InProceedings{Kalfaoglu_2026_CVPR,
  author    = {Kalfaoglu, Muhammet Esat and {\"O}zt{\"u}rk, Halil Ibrahim and Kilinc, Ozsel and Temizel, Alptekin},
  title     = {{TopoMaskV3}: {3D} Mask Head with Dense Offset and Height Predictions for Road Topology Understanding},
  booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR) Workshops},
  month     = jun,
  year      = {2026},
  pages     = {675--684},
}
OmniSieve: Query-Guided Adaptive Token Allocation for Efficient Multi-View Vision-Language Reasoning: Preetam Chhimpa,

Indrajit Ghosh; [pdf]
[bibtex]
@InProceedings{Chhimpa_2026_CVPR,
  author    = {Chhimpa, Preetam and Ghosh, Indrajit},
  title     = {{OmniSieve}: Query-Guided Adaptive Token Allocation for Efficient Multi-View Vision-Language Reasoning},
  booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR) Workshops},
  month     = jun,
  year      = {2026},
  pages     = {655--664},
}