Workshop on Distillation of Foundation Models for Autonomous Driving


Cross-Camera Module Training of Raw Sensor Data-Based Automotive Machine Vision: Challenges and Solutions
Setareh Kian,
Shannon Brooks-Lehnert,
Keigo Hirakawa
[pdf] [supp]
[bibtex]
@InProceedings{Kian_2025_ICCV,
  author    = {Kian, Setareh and Brooks-Lehnert, Shannon and Hirakawa, Keigo},
  title     = {Cross-Camera Module Training of Raw Sensor Data-Based Automotive Machine Vision: Challenges and Solutions},
  booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV) Workshops},
  month     = oct,
  year      = {2025},
  pages     = {4537--4546},
}

NuScenes-SpatialQA: A Spatial Understanding and Reasoning Benchmark for Vision-Language Models in Autonomous Driving
Kexin Tian,
Jingrui Mao,
Yunlong Zhang,
Jiwan Jiang,
Yang Zhou,
Zhengzhong Tu
[pdf] [supp]
[bibtex]
@InProceedings{Tian_2025_ICCV,
  author    = {Tian, Kexin and Mao, Jingrui and Zhang, Yunlong and Jiang, Jiwan and Zhou, Yang and Tu, Zhengzhong},
  title     = {{NuScenes-SpatialQA}: A Spatial Understanding and Reasoning Benchmark for Vision-Language Models in Autonomous Driving},
  booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV) Workshops},
  month     = oct,
  year      = {2025},
  pages     = {4567--4576},
}

A Survey on Vision-Language-Action Models for Autonomous Driving
Sicong Jiang,
Zilin Huang,
Kangan Qian,
Ziang Luo,
Tianze Zhu,
Yang Zhong,
Yihong Tang,
Menglin Kong,
Yunlong Wang,
Siwen Jiao,
Hao Ye,
Zihao Sheng,
Xin Zhao,
Tuopu Wen,
Zheng Fu,
Sikai Chen,
Kun Jiang,
Diange Yang,
Seongjin Choi,
Lijun Sun
[pdf] [arXiv]
[bibtex]
@InProceedings{Jiang_2025_ICCV,
  author    = {Jiang, Sicong and Huang, Zilin and Qian, Kangan and Luo, Ziang
               and Zhu, Tianze and Zhong, Yang and Tang, Yihong and Kong, Menglin
               and Wang, Yunlong and Jiao, Siwen and Ye, Hao and Sheng, Zihao
               and Zhao, Xin and Wen, Tuopu and Fu, Zheng and Chen, Sikai
               and Jiang, Kun and Yang, Diange and Choi, Seongjin and Sun, Lijun},
  title     = {A Survey on Vision-Language-Action Models for Autonomous Driving},
  booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV) Workshops},
  month     = oct,
  year      = {2025},
  pages     = {4524--4536},
}

TinyBEV: Cross-Modal Knowledge Distillation for Efficient Multi-Task Bird's-Eye-View Perception and Planning
Reeshad Khan,
John Gauch
[pdf]
[bibtex]
@InProceedings{Khan_2025_ICCV,
  author    = {Khan, Reeshad and Gauch, John},
  title     = {{TinyBEV}: Cross-Modal Knowledge Distillation for Efficient Multi-Task Bird's-Eye-View Perception and Planning},
  booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV) Workshops},
  month     = oct,
  year      = {2025},
  pages     = {4577--4585},
}

From Static to Dynamic: a Survey of Topology-Aware Perception in Autonomous Driving
Yixiao Chen,
Ruining Yang,
Xin Chen,
Jia He,
Dongliang Xu,
Yue Yao
[pdf] [arXiv]
[bibtex]
@InProceedings{Chen_2025_ICCV,
  author    = {Chen, Yixiao and Yang, Ruining and Chen, Xin and He, Jia and Xu, Dongliang and Yao, Yue},
  title     = {From Static to Dynamic: a Survey of Topology-Aware Perception in Autonomous Driving},
  booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV) Workshops},
  month     = oct,
  year      = {2025},
  pages     = {4511--4523},
}

Analyzing Closed-loop Training Techniques for Realistic Traffic Agent Models in Autonomous Highway Driving Simulations
Matthias Bitzer,
Reinis Cimurs,
Benjamin Coors,
Johannes Goth,
Sebastian Ziesche,
Philipp Geiger,
Maximilian Naumann
[pdf] [arXiv]
[bibtex]
@InProceedings{Bitzer_2025_ICCV,
  author    = {Bitzer, Matthias and Cimurs, Reinis and Coors, Benjamin and Goth, Johannes
               and Ziesche, Sebastian and Geiger, Philipp and Naumann, Maximilian},
  title     = {Analyzing Closed-loop Training Techniques for Realistic Traffic Agent Models in Autonomous Highway Driving Simulations},
  booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV) Workshops},
  month     = oct,
  year      = {2025},
  pages     = {4557--4566},
}

Distillation Improves Visual Place Recognition for Low Quality Images
Anbang Yang,
Ge Jin,
Junjie Huang,
Yao Wang,
John-Ross Rizzo,
Chen Feng
[pdf] [arXiv]
[bibtex]
@InProceedings{Yang_2025_ICCV,
  author    = {Yang, Anbang and Jin, Ge and Huang, Junjie and Wang, Yao and Rizzo, John-Ross and Feng, Chen},
  title     = {Distillation Improves Visual Place Recognition for Low Quality Images},
  booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV) Workshops},
  month     = oct,
  year      = {2025},
  pages     = {4501--4510},
}

SafeRoute: Enhancing Traffic Scene Understanding via a Unified Deep Learning and Multimodal LLM
Ankit Kumar Shaw,
Chandan Kumar Sah,
Xiaoli Lian,
Arsalan Shahid Baig,
Tuopu Wen,
Kun Jiang,
Mengmeng Yang,
Diange Yang,
Li Zhang
[pdf] [supp]
[bibtex]
@InProceedings{Shaw_2025_ICCV,
  author    = {Shaw, Ankit Kumar and Sah, Chandan Kumar and Lian, Xiaoli and Baig, Arsalan Shahid
               and Wen, Tuopu and Jiang, Kun and Yang, Mengmeng and Yang, Diange and Zhang, Li},
  title     = {{SafeRoute}: Enhancing Traffic Scene Understanding via a Unified Deep Learning and Multimodal {LLM}},
  booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV) Workshops},
  month     = oct,
  year      = {2025},
  pages     = {4547--4556},
}

SynSHRP2: A Synthetic Multimodal Benchmark for Driving Safety-critical Events Derived from Real-world Driving Data
Liang Shi,
Boyu Jiang,
Zhenyuan Yuan,
Miguel A. Perez,
Feng Guo
[pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Shi_2025_ICCV,
  author    = {Shi, Liang and Jiang, Boyu and Yuan, Zhenyuan and Perez, Miguel A. and Guo, Feng},
  title     = {{SynSHRP2}: A Synthetic Multimodal Benchmark for Driving Safety-critical Events Derived from Real-world Driving Data},
  booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV) Workshops},
  month     = oct,
  year      = {2025},
  pages     = {4586--4596},
}