Foundation Models for V2X-Based Cooperative Autonomous Driving


Can Vision-Language Models Understand and Interpret Dynamic Gestures from Pedestrians? Pilot Datasets and Exploration Towards Instructive Nonverbal Commands for Cooperative Autonomous Vehicles
Tonko E. W. Bossen,
Andreas Møgelmose,
Ross Greer
[pdf]
[bibtex]
@InProceedings{Bossen_2025_CVPR,
  author    = {Bossen, Tonko E. W. and M{\o}gelmose, Andreas and Greer, Ross},
  title     = {Can Vision-Language Models Understand and Interpret Dynamic Gestures from Pedestrians? {Pilot} Datasets and Exploration Towards Instructive Nonverbal Commands for Cooperative Autonomous Vehicles},
  booktitle = {Proceedings of the Computer Vision and Pattern Recognition Conference ({CVPR}) Workshops},
  month     = jun,
  year      = {2025},
  pages     = {4779--4788},
}

Exploring Modality Guidance to Enhance VFM-based Feature Fusion for UDA in 3D Semantic Segmentation
Johannes Spoecklberger,
Wei Lin,
Pedro Hermosilla,
Sivan Doveh,
Horst Possegger,
M. Jehanzeb Mirza
[pdf] [arXiv]
[bibtex]
@InProceedings{Spoecklberger_2025_CVPR,
  author    = {Spoecklberger, Johannes and Lin, Wei and Hermosilla, Pedro and Doveh, Sivan and Possegger, Horst and Mirza, M. Jehanzeb},
  title     = {Exploring Modality Guidance to Enhance {VFM}-based Feature Fusion for {UDA} in {3D} Semantic Segmentation},
  booktitle = {Proceedings of the Computer Vision and Pattern Recognition Conference ({CVPR}) Workshops},
  month     = jun,
  year      = {2025},
  pages     = {4789--4798},
}

V3LMA: Visual 3D-enhanced Language Model for Autonomous Driving
Jannik Lübberstedt,
Esteban Rivera Guerrero,
Nico Uhlemann,
Markus Lienkamp
[pdf] [supp]
[bibtex]
@InProceedings{Lubberstedt_2025_CVPR,
  author    = {L{\"u}bberstedt, Jannik and Guerrero, Esteban Rivera and Uhlemann, Nico and Lienkamp, Markus},
  title     = {{V3LMA}: Visual {3D}-enhanced Language Model for Autonomous Driving},
  booktitle = {Proceedings of the Computer Vision and Pattern Recognition Conference ({CVPR}) Workshops},
  month     = jun,
  year      = {2025},
  pages     = {4769--4778},
}