WACV 2023 Open Access Repository

Pretraining Large Vision and Multimodal Models

Benefits of Synthetically Pre-Trained Depth-Prediction Networks for Indoor/Outdoor Image Classification: Kelly X. Lin,

Irene Cho,

Amey Walimbe,

Bryan A. Zamora,

Alex Rich,

Sirius Z. Zhang,

Tobias Höllerer; [pdf]
[bibtex]
@InProceedings{Lin_2023_WACV,
  author    = {Lin, Kelly X. and Cho, Irene and Walimbe, Amey and Zamora, Bryan A. and Rich, Alex and Zhang, Sirius Z. and H{\"o}llerer, Tobias},
  title     = {Benefits of Synthetically Pre-Trained Depth-Prediction Networks for Indoor/Outdoor Image Classification},
  booktitle = {Proceedings of the {IEEE/CVF} Winter Conference on Applications of Computer Vision ({WACV}) Workshops},
  month     = jan,
  year      = {2023},
  pages     = {360--369},
}
Scalable and Accurate Self-Supervised Multimodal Representation Learning Without Aligned Video and Text Data: Vladislav Lialin,

Stephen Rawls,

David Chan,

Shalini Ghosh,

Anna Rumshisky,

Wael Hamza; [pdf]
[bibtex]
@InProceedings{Lialin_2023_WACV,
  author    = {Lialin, Vladislav and Rawls, Stephen and Chan, David and Ghosh, Shalini and Rumshisky, Anna and Hamza, Wael},
  title     = {Scalable and Accurate Self-Supervised Multimodal Representation Learning Without Aligned Video and Text Data},
  booktitle = {Proceedings of the {IEEE/CVF} Winter Conference on Applications of Computer Vision ({WACV}) Workshops},
  month     = jan,
  year      = {2023},
  pages     = {390--400},
}
Masked Autoencoder for Self-Supervised Pre-Training on Lidar Point Clouds: Georg Hess,

Johan Jaxing,

Elias Svensson,

David Hagerman,

Christoffer Petersson,

Lennart Svensson; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Hess_2023_WACV,
  author    = {Hess, Georg and Jaxing, Johan and Svensson, Elias and Hagerman, David and Petersson, Christoffer and Svensson, Lennart},
  title     = {Masked Autoencoder for Self-Supervised Pre-Training on Lidar Point Clouds},
  booktitle = {Proceedings of the {IEEE/CVF} Winter Conference on Applications of Computer Vision ({WACV}) Workshops},
  month     = jan,
  year      = {2023},
  pages     = {350--359},
}
MixGen: A New Multi-Modal Data Augmentation: Xiaoshuai Hao,

Yi Zhu,

Srikar Appalaraju,

Aston Zhang,

Wanqian Zhang,

Bo Li,

Mu Li; [pdf] [arXiv]
[bibtex]
@InProceedings{Hao_2023_WACV,
  author    = {Hao, Xiaoshuai and Zhu, Yi and Appalaraju, Srikar and Zhang, Aston and Zhang, Wanqian and Li, Bo and Li, Mu},
  title     = {{MixGen}: A New Multi-Modal Data Augmentation},
  booktitle = {Proceedings of the {IEEE/CVF} Winter Conference on Applications of Computer Vision ({WACV}) Workshops},
  month     = jan,
  year      = {2023},
  pages     = {379--389},
}
RarePlanes Soar Higher: Self-Supervised Pretraining for Resource Constrained and Synthetic Datasets: Justin Downes,

Will Gleave,

Dan Nakada; [pdf]
[bibtex]
@InProceedings{Downes_2023_WACV,
  author    = {Downes, Justin and Gleave, Will and Nakada, Dan},
  title     = {{RarePlanes} Soar Higher: Self-Supervised Pretraining for Resource Constrained and Synthetic Datasets},
  booktitle = {Proceedings of the {IEEE/CVF} Winter Conference on Applications of Computer Vision ({WACV}) Workshops},
  month     = jan,
  year      = {2023},
  pages     = {370--378},
}