1st Workshop on Open-Vocabulary 3D Scene Understanding


Dynamic Texts From UAV Perspective Natural Images
Hidetomo Sakaino
[pdf]
[bibtex]
% Workshop paper in the ICCV 2023 Workshops proceedings.
% The acronym in the title is braced so sentence-casing styles keep its capitals;
% month uses the predefined macro and the page range uses an en-dash (--).
@InProceedings{Sakaino_2023_ICCV,
  author    = {Sakaino, Hidetomo},
  title     = {Dynamic Texts From {UAV} Perspective Natural Images},
  booktitle = {Proceedings of the {IEEE/CVF} International Conference on Computer Vision ({ICCV}) Workshops},
  month     = oct,
  year      = {2023},
  pages     = {2070--2081},
}

CLIP-FO3D: Learning Free Open-World 3D Scene Representations from 2D Dense CLIP
Junbo Zhang,
Runpei Dong,
Kaisheng Ma
[pdf]
[bibtex]
% Workshop paper in the ICCV 2023 Workshops proceedings.
% Method name and acronyms in the title are braced so sentence-casing styles
% keep their capitals; month uses the predefined macro and the page range uses --.
@InProceedings{Zhang_2023_ICCV,
  author    = {Zhang, Junbo and Dong, Runpei and Ma, Kaisheng},
  title     = {{CLIP-FO3D}: Learning Free Open-World {3D} Scene Representations from {2D} Dense {CLIP}},
  booktitle = {Proceedings of the {IEEE/CVF} International Conference on Computer Vision ({ICCV}) Workshops},
  month     = oct,
  year      = {2023},
  pages     = {2048--2059},
}

The Change You Want to See (Now in 3D)
Ragav Sachdeva,
Andrew Zisserman
[pdf] [supp] [arXiv]
[bibtex]
% Workshop paper in the ICCV 2023 Workshops proceedings.
% "3D" in the title is braced so sentence-casing styles do not render it as "3d";
% month uses the predefined macro and the page range uses an en-dash (--).
@InProceedings{Sachdeva_2023_ICCV,
  author    = {Sachdeva, Ragav and Zisserman, Andrew},
  title     = {The Change You Want to See (Now in {3D})},
  booktitle = {Proceedings of the {IEEE/CVF} International Conference on Computer Vision ({ICCV}) Workshops},
  month     = oct,
  year      = {2023},
  pages     = {2060--2069},
}

Learning to Prompt CLIP for Monocular Depth Estimation: Exploring the Limits of Human Language
Dylan Auty,
Krystian Mikolajczyk
[pdf] [supp]
[bibtex]
% Workshop paper in the ICCV 2023 Workshops proceedings.
% "CLIP" in the title is braced so sentence-casing styles keep it upper-case;
% month uses the predefined macro and the page range uses an en-dash (--).
@InProceedings{Auty_2023_ICCV,
  author    = {Auty, Dylan and Mikolajczyk, Krystian},
  title     = {Learning to Prompt {CLIP} for Monocular Depth Estimation: Exploring the Limits of Human Language},
  booktitle = {Proceedings of the {IEEE/CVF} International Conference on Computer Vision ({ICCV}) Workshops},
  month     = oct,
  year      = {2023},
  pages     = {2039--2047},
}

CLIP Goes 3D: Leveraging Prompt Tuning for Language Grounded 3D Recognition
Deepti Hegde,
Jeya Maria Jose Valanarasu,
Vishal Patel
[pdf] [arXiv]
[bibtex]
% Workshop paper in the ICCV 2023 Workshops proceedings.
% "CLIP" and "3D" in the title are braced so sentence-casing styles keep their
% capitals; month uses the predefined macro and the page range uses --.
@InProceedings{Hegde_2023_ICCV,
  author    = {Hegde, Deepti and Valanarasu, Jeya Maria Jose and Patel, Vishal},
  title     = {{CLIP} Goes {3D}: Leveraging Prompt Tuning for Language Grounded {3D} Recognition},
  booktitle = {Proceedings of the {IEEE/CVF} International Conference on Computer Vision ({ICCV}) Workshops},
  month     = oct,
  year      = {2023},
  pages     = {2028--2038},
}