Large Language and Vision Models for Autonomous Driving


VLA4CoDrive: Vision-Language-Action Dataset for Cooperative Autonomous Driving
Sayed Pedram Haeri Boroujeni,
Abolfazl Razi
[pdf]
[bibtex]
@InProceedings{Boroujeni_2026_WACV,
  author    = {Boroujeni, Sayed Pedram Haeri and Razi, Abolfazl},
  title     = {{VLA4CoDrive}: Vision-Language-Action Dataset for Cooperative Autonomous Driving},
  booktitle = {Proceedings of the {IEEE/CVF} Winter Conference on Applications of Computer Vision ({WACV}) Workshops},
  month     = mar,
  year      = {2026},
  pages     = {1789--1799},
}

Lightweight Multi-Scale Fusion for Real-Time Autonomous Driving Segmentation
Muhammad Nadeem,
Hyeyoung Lee
[pdf]
[bibtex]
@InProceedings{Nadeem_2026_WACV,
  author    = {Nadeem, Muhammad and Lee, Hyeyoung},
  title     = {Lightweight Multi-Scale Fusion for Real-Time Autonomous Driving Segmentation},
  booktitle = {Proceedings of the {IEEE/CVF} Winter Conference on Applications of Computer Vision ({WACV}) Workshops},
  month     = mar,
  year      = {2026},
  pages     = {1721--1728},
}

Efficient Visual Question Answering Pipeline for Autonomous Driving via Scene Region Compression
Yuliang Cai,
Dongqiangzi Ye,
Zitian Chen,
Chongruo Wu
[pdf] [arXiv]
[bibtex]
@InProceedings{Cai_2026_WACV,
  author    = {Cai, Yuliang and Ye, Dongqiangzi and Chen, Zitian and Wu, Chongruo},
  title     = {Efficient Visual Question Answering Pipeline for Autonomous Driving via Scene Region Compression},
  booktitle = {Proceedings of the {IEEE/CVF} Winter Conference on Applications of Computer Vision ({WACV}) Workshops},
  month     = mar,
  year      = {2026},
  pages     = {1739--1746},
}

FROST-Drive: Scalable and Efficient End-to-End Driving with a Frozen Vision Encoder
Zeyu Dong,
Yimin Zhu,
Yu Wu,
Yu Sun
[pdf] [arXiv]
[bibtex]
@InProceedings{Dong_2026_WACV,
  author    = {Dong, Zeyu and Zhu, Yimin and Wu, Yu and Sun, Yu},
  title     = {{FROST-Drive}: Scalable and Efficient End-to-End Driving with a Frozen Vision Encoder},
  booktitle = {Proceedings of the {IEEE/CVF} Winter Conference on Applications of Computer Vision ({WACV}) Workshops},
  month     = mar,
  year      = {2026},
  pages     = {1729--1738},
}

2COOOL: An Evaluation Benchmark for Generating Incident Reports on Out-of-Distribution Hazards in Autonomous Driving
Ali K. AlShami,
Ryan Rabinowitz,
Terrance E. Boult,
Jugal Kalita
[pdf]
[bibtex]
@InProceedings{AlShami_2026_WACV,
  author    = {AlShami, Ali K. and Rabinowitz, Ryan and Boult, Terrance E. and Kalita, Jugal},
  title     = {{2COOOL}: An Evaluation Benchmark for Generating Incident Reports on Out-of-Distribution Hazards in Autonomous Driving},
  booktitle = {Proceedings of the {IEEE/CVF} Winter Conference on Applications of Computer Vision ({WACV}) Workshops},
  month     = mar,
  year      = {2026},
  pages     = {1800--1809},
}

Role of Language-Guidance in Knowledge Distillation for Semantic Segmentation Under Limited Field-Of-View Autonomous Driving
Yeon Woo Shin,
Keun Hee Park,
Pavan Turaga,
Eun Som Jeon
[pdf] [supp]
[bibtex]
@InProceedings{Shin_2026_WACV,
  author    = {Shin, Yeon Woo and Park, Keun Hee and Turaga, Pavan and Jeon, Eun Som},
  title     = {Role of Language-Guidance in Knowledge Distillation for Semantic Segmentation Under Limited Field-Of-View Autonomous Driving},
  booktitle = {Proceedings of the {IEEE/CVF} Winter Conference on Applications of Computer Vision ({WACV}) Workshops},
  month     = mar,
  year      = {2026},
  pages     = {1761--1771},
}

Benchmarking Vision-Language Models for Traffic Scene Understanding in Inclement Winter Weather: The AWDB Benchmark
Ali Awad,
Tagore Kosireddy,
Krishna Mokkapati,
Nibendra Bajracharya,
Ashraf Saleem,
Vinh Nguyen,
Evan Lucas
[pdf]
[bibtex]
@InProceedings{Awad_2026_WACV,
  author    = {Awad, Ali and Kosireddy, Tagore and Mokkapati, Krishna and Bajracharya, Nibendra and Saleem, Ashraf and Nguyen, Vinh and Lucas, Evan},
  title     = {Benchmarking Vision-Language Models for Traffic Scene Understanding in Inclement Winter Weather: The {AWDB} Benchmark},
  booktitle = {Proceedings of the {IEEE/CVF} Winter Conference on Applications of Computer Vision ({WACV}) Workshops},
  month     = mar,
  year      = {2026},
  pages     = {1747--1760},
}

GATEPose: A Graph Attention Transformer Enhanced with Pose and Orientation Angles for Pedestrian Crossing Intention Prediction
Ali K. AlShami,
Terrance E. Boult,
Jugal Kalita
[pdf]
[bibtex]
@InProceedings{AlShami_2026_WACV_GATEPose,
  author    = {AlShami, Ali K. and Boult, Terrance E. and Kalita, Jugal},
  title     = {{GATEPose}: A Graph Attention Transformer Enhanced with Pose and Orientation Angles for Pedestrian Crossing Intention Prediction},
  booktitle = {Proceedings of the {IEEE/CVF} Winter Conference on Applications of Computer Vision ({WACV}) Workshops},
  month     = mar,
  year      = {2026},
  pages     = {1810--1819},
}

Trust-Guided Multimodal LLM Integration with Reinforcement Learning for Autonomous Driving
Sairam Chennaka,
Jaswanth Nidamanuri
[pdf] [supp]
[bibtex]
@InProceedings{Chennaka_2026_WACV,
  author    = {Chennaka, Sairam and Nidamanuri, Jaswanth},
  title     = {Trust-Guided Multimodal {LLM} Integration with Reinforcement Learning for Autonomous Driving},
  booktitle = {Proceedings of the {IEEE/CVF} Winter Conference on Applications of Computer Vision ({WACV}) Workshops},
  month     = mar,
  year      = {2026},
  pages     = {1780--1788},
}

Less Is More: Agentic Prompt Design for Safe VLM Action Selection
Elahe Yahyapour,
Chengbo Ai
[pdf] [supp]
[bibtex]
@InProceedings{Yahyapour_2026_WACV,
  author    = {Yahyapour, Elahe and Ai, Chengbo},
  title     = {Less Is More: Agentic Prompt Design for Safe {VLM} Action Selection},
  booktitle = {Proceedings of the {IEEE/CVF} Winter Conference on Applications of Computer Vision ({WACV}) Workshops},
  month     = mar,
  year      = {2026},
  pages     = {1772--1779},
}