Large Language and Vision Models for Autonomous Driving


Human-Centric Autonomous Systems With LLMs for User Command Reasoning
Yi Yang,
Qingwen Zhang,
Ci Li,
Daniel Simões Marta,
Nazre Batool,
John Folkesson
[pdf] [arXiv]
[bibtex]
% WACV 2024 Workshops paper. Acronyms in the title are braced so that
% sentence-casing bibliography styles keep their capitalisation.
@InProceedings{Yang_2024_WACV,
  author    = {Yang, Yi and Zhang, Qingwen and Li, Ci and Marta, Daniel Sim{\~o}es and Batool, Nazre and Folkesson, John},
  title     = {Human-Centric Autonomous Systems With {LLMs} for User Command Reasoning},
  booktitle = {Proceedings of the {IEEE/CVF} Winter Conference on Applications of Computer Vision ({WACV}) Workshops},
  month     = jan,
  year      = {2024},
  pages     = {988--994},
}

LIP-Loc: LiDAR Image Pretraining for Cross-Modal Localization
Sai Shubodh,
Mohammad Omama,
Husain Zaidi,
Udit Singh Parihar,
Madhava Krishna
[pdf] [supp]
[bibtex]
% WACV 2024 Workshops paper. The method name and "LiDAR" are braced so that
% sentence-casing bibliography styles keep their capitalisation.
@InProceedings{Shubodh_2024_WACV,
  author    = {Shubodh, Sai and Omama, Mohammad and Zaidi, Husain and Parihar, Udit Singh and Krishna, Madhava},
  title     = {{LIP-Loc}: {LiDAR} Image Pretraining for Cross-Modal Localization},
  booktitle = {Proceedings of the {IEEE/CVF} Winter Conference on Applications of Computer Vision ({WACV}) Workshops},
  month     = jan,
  year      = {2024},
  pages     = {948--957},
}

A Survey on Multimodal Large Language Models for Autonomous Driving
Can Cui,
Yunsheng Ma,
Xu Cao,
Wenqian Ye,
Yang Zhou,
Kaizhao Liang,
Jintai Chen,
Juanwu Lu,
Zichong Yang,
Kuei-Da Liao,
Tianren Gao,
Erlong Li,
Kun Tang,
Zhipeng Cao,
Tong Zhou,
Ao Liu,
Xinrui Yan,
Shuqi Mei,
Jianguo Cao,
Ziran Wang,
Chao Zheng
[pdf]
[bibtex]
% WACV 2024 Workshops survey paper. The 21 authors are listed a few per line
% for readability; BibTeX treats the line breaks as ordinary whitespace.
@InProceedings{Cui_2024_WACV,
  author    = {Cui, Can and Ma, Yunsheng and Cao, Xu and Ye, Wenqian and
               Zhou, Yang and Liang, Kaizhao and Chen, Jintai and Lu, Juanwu and
               Yang, Zichong and Liao, Kuei-Da and Gao, Tianren and Li, Erlong and
               Tang, Kun and Cao, Zhipeng and Zhou, Tong and Liu, Ao and
               Yan, Xinrui and Mei, Shuqi and Cao, Jianguo and Wang, Ziran and
               Zheng, Chao},
  title     = {A Survey on Multimodal Large Language Models for Autonomous Driving},
  booktitle = {Proceedings of the {IEEE/CVF} Winter Conference on Applications of Computer Vision ({WACV}) Workshops},
  month     = jan,
  year      = {2024},
  pages     = {958--979},
}

VLAAD: Vision and Language Assistant for Autonomous Driving
SungYeon Park,
MinJae Lee,
JiHyuk Kang,
Hahyeon Choi,
Yoonah Park,
Juhwan Cho,
Adam Lee,
DongKyu Kim
[pdf]
[bibtex]
% WACV 2024 Workshops paper. The acronym "VLAAD" is braced so that
% sentence-casing bibliography styles keep its capitalisation.
@InProceedings{Park_2024_WACV,
  author    = {Park, SungYeon and Lee, MinJae and Kang, JiHyuk and Choi, Hahyeon and Park, Yoonah and Cho, Juhwan and Lee, Adam and Kim, DongKyu},
  title     = {{VLAAD}: Vision and Language Assistant for Autonomous Driving},
  booktitle = {Proceedings of the {IEEE/CVF} Winter Conference on Applications of Computer Vision ({WACV}) Workshops},
  month     = jan,
  year      = {2024},
  pages     = {980--987},
}

Drive As You Speak: Enabling Human-Like Interaction With Large Language Models in Autonomous Vehicles
Can Cui,
Yunsheng Ma,
Xu Cao,
Wenqian Ye,
Ziran Wang
[pdf]
[bibtex]
% WACV 2024 Workshops paper. The key carries a "_b" suffix because the plain
% key Cui_2024_WACV is already taken by the multimodal-LLM survey entry in
% this file; BibTeX rejects a repeated key, which made this entry unciteable.
@InProceedings{Cui_2024_WACV_b,
  author    = {Cui, Can and Ma, Yunsheng and Cao, Xu and Ye, Wenqian and Wang, Ziran},
  title     = {Drive As You Speak: Enabling Human-Like Interaction With Large Language Models in Autonomous Vehicles},
  booktitle = {Proceedings of the {IEEE/CVF} Winter Conference on Applications of Computer Vision ({WACV}) Workshops},
  month     = jan,
  year      = {2024},
  pages     = {902--909},
}

NuScenes-MQA: Integrated Evaluation of Captions and QA for Autonomous Driving Datasets Using Markup Annotations
Yuichi Inoue,
Yuki Yada,
Kotaro Tanahashi,
Yu Yamaguchi
[pdf]
[bibtex]
% WACV 2024 Workshops paper. The dataset name and "QA" are braced so that
% sentence-casing bibliography styles keep their capitalisation.
@InProceedings{Inoue_2024_WACV,
  author    = {Inoue, Yuichi and Yada, Yuki and Tanahashi, Kotaro and Yamaguchi, Yu},
  title     = {{NuScenes-MQA}: Integrated Evaluation of Captions and {QA} for Autonomous Driving Datasets Using Markup Annotations},
  booktitle = {Proceedings of the {IEEE/CVF} Winter Conference on Applications of Computer Vision ({WACV}) Workshops},
  month     = jan,
  year      = {2024},
  pages     = {930--938},
}

Latency Driven Spatially Sparse Optimization for Multi-Branch CNNs for Semantic Segmentation
Georgios Zampokas,
Christos-Savvas Bouganis,
Dimitrios Tzovaras
[pdf]
[bibtex]
% WACV 2024 Workshops paper. The acronym "CNNs" is braced so that
% sentence-casing bibliography styles keep its capitalisation.
@InProceedings{Zampokas_2024_WACV,
  author    = {Zampokas, Georgios and Bouganis, Christos-Savvas and Tzovaras, Dimitrios},
  title     = {Latency Driven Spatially Sparse Optimization for Multi-Branch {CNNs} for Semantic Segmentation},
  booktitle = {Proceedings of the {IEEE/CVF} Winter Conference on Applications of Computer Vision ({WACV}) Workshops},
  month     = jan,
  year      = {2024},
  pages     = {939--947},
}

A Safer Vision-Based Autonomous Planning System for Quadrotor UAVs With Dynamic Obstacle Trajectory Prediction and Its Application With LLMs
Jiageng Zhong,
Ming Li,
Yinliang Chen,
Zihang Wei,
Fan Yang,
Haoran Shen
[pdf]
[bibtex]
% WACV 2024 Workshops paper. The acronyms "UAVs" and "LLMs" are braced so
% that sentence-casing bibliography styles keep their capitalisation.
@InProceedings{Zhong_2024_WACV,
  author    = {Zhong, Jiageng and Li, Ming and Chen, Yinliang and Wei, Zihang and Yang, Fan and Shen, Haoran},
  title     = {A Safer Vision-Based Autonomous Planning System for Quadrotor {UAVs} With Dynamic Obstacle Trajectory Prediction and Its Application With {LLMs}},
  booktitle = {Proceedings of the {IEEE/CVF} Winter Conference on Applications of Computer Vision ({WACV}) Workshops},
  month     = jan,
  year      = {2024},
  pages     = {920--929},
}