Workshop on Distillation of Foundation Models for Autonomous Driving
Cross-Camera Module Training of Raw Sensor Data-Based Automotive Machine Vision: Challenges and Solutions-
[pdf]
[supp]
[bibtex]@InProceedings{Kian_2025_ICCV,
    author    = {Kian, Setareh and Brooks-Lehnert, Shannon and Hirakawa, Keigo},
    title     = {Cross-Camera Module Training of Raw Sensor Data-Based Automotive Machine Vision: Challenges and Solutions},
    booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV) Workshops},
    month     = oct,
    year      = {2025},
    pages     = {4537--4546},
}
NuScenes-SpatialQA: A Spatial Understanding and Reasoning Benchmark for Vision-Language Models in Autonomous Driving-
[pdf]
[supp]
[bibtex]@InProceedings{Tian_2025_ICCV,
    author    = {Tian, Kexin and Mao, Jingrui and Zhang, Yunlong and Jiang, Jiwan and Zhou, Yang and Tu, Zhengzhong},
    title     = {{NuScenes-SpatialQA}: A Spatial Understanding and Reasoning Benchmark for Vision-Language Models in Autonomous Driving},
    booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV) Workshops},
    month     = oct,
    year      = {2025},
    pages     = {4567--4576},
}
A Survey on Vision-Language-Action Models for Autonomous Driving-
[pdf]
[arXiv]
[bibtex]@InProceedings{Jiang_2025_ICCV,
    author    = {Jiang, Sicong and Huang, Zilin and Qian, Kangan and Luo, Ziang and Zhu, Tianze and Zhong, Yang and Tang, Yihong and Kong, Menglin and Wang, Yunlong and Jiao, Siwen and Ye, Hao and Sheng, Zihao and Zhao, Xin and Wen, Tuopu and Fu, Zheng and Chen, Sikai and Jiang, Kun and Yang, Diange and Choi, Seongjin and Sun, Lijun},
    title     = {A Survey on Vision-Language-Action Models for Autonomous Driving},
    booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV) Workshops},
    month     = oct,
    year      = {2025},
    pages     = {4524--4536},
}
TinyBEV: Cross-Modal Knowledge Distillation for Efficient Multi-Task Bird's-Eye-View Perception and Planning-
[pdf]
[bibtex]@InProceedings{Khan_2025_ICCV,
    author    = {Khan, Reeshad and Gauch, John},
    title     = {{TinyBEV}: Cross-Modal Knowledge Distillation for Efficient Multi-Task Bird's-Eye-View Perception and Planning},
    booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV) Workshops},
    month     = oct,
    year      = {2025},
    pages     = {4577--4585},
}
From Static to Dynamic: a Survey of Topology-Aware Perception in Autonomous Driving-
[pdf]
[arXiv]
[bibtex]@InProceedings{Chen_2025_ICCV,
    author    = {Chen, Yixiao and Yang, Ruining and Chen, Xin and He, Jia and Xu, Dongliang and Yao, Yue},
    title     = {From Static to Dynamic: a Survey of Topology-Aware Perception in Autonomous Driving},
    booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV) Workshops},
    month     = oct,
    year      = {2025},
    pages     = {4511--4523},
}
Analyzing Closed-loop Training Techniques for Realistic Traffic Agent Models in Autonomous Highway Driving Simulations-
[pdf]
[arXiv]
[bibtex]@InProceedings{Bitzer_2025_ICCV,
    author    = {Bitzer, Matthias and Cimurs, Reinis and Coors, Benjamin and Goth, Johannes and Ziesche, Sebastian and Geiger, Philipp and Naumann, Maximilian},
    title     = {Analyzing Closed-loop Training Techniques for Realistic Traffic Agent Models in Autonomous Highway Driving Simulations},
    booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV) Workshops},
    month     = oct,
    year      = {2025},
    pages     = {4557--4566},
}
Distillation Improves Visual Place Recognition for Low Quality Images-
[pdf]
[arXiv]
[bibtex]@InProceedings{Yang_2025_ICCV,
    author    = {Yang, Anbang and Jin, Ge and Huang, Junjie and Wang, Yao and Rizzo, John-Ross and Feng, Chen},
    title     = {Distillation Improves Visual Place Recognition for Low Quality Images},
    booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV) Workshops},
    month     = oct,
    year      = {2025},
    pages     = {4501--4510},
}
SafeRoute: Enhancing Traffic Scene Understanding via a Unified Deep Learning and Multimodal LLM-
[pdf]
[supp]
[bibtex]@InProceedings{Shaw_2025_ICCV,
    author    = {Shaw, Ankit Kumar and Sah, Chandan Kumar and Lian, Xiaoli and Baig, Arsalan Shahid and Wen, Tuopu and Jiang, Kun and Yang, Mengmeng and Yang, Diange and Zhang, Li},
    title     = {{SafeRoute}: Enhancing Traffic Scene Understanding via a Unified Deep Learning and Multimodal {LLM}},
    booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV) Workshops},
    month     = oct,
    year      = {2025},
    pages     = {4547--4556},
}
SynSHRP2: A Synthetic Multimodal Benchmark for Driving Safety-critical Events Derived from Real-world Driving Data-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Shi_2025_ICCV,
    author    = {Shi, Liang and Jiang, Boyu and Yuan, Zhenyuan and Perez, Miguel A. and Guo, Feng},
    title     = {{SynSHRP2}: A Synthetic Multimodal Benchmark for Driving Safety-critical Events Derived from Real-world Driving Data},
    booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV) Workshops},
    month     = oct,
    year      = {2025},
    pages     = {4586--4596},
}
