Pretraining Large Vision and Multimodal Models


Benefits of Synthetically Pre-Trained Depth-Prediction Networks for Indoor/Outdoor Image Classification
Kelly X. Lin,
Irene Cho,
Amey Walimbe,
Bryan A. Zamora,
Alex Rich,
Sirius Z. Zhang,
Tobias Höllerer
[pdf]
[bibtex]
% Workshop paper in the WACV 2023 Workshops proceedings.
@InProceedings{Lin_2023_WACV,
  author    = {Lin, Kelly X. and Cho, Irene and Walimbe, Amey and Zamora, Bryan A. and Rich, Alex and Zhang, Sirius Z. and H{\"o}llerer, Tobias},
  title     = {Benefits of Synthetically Pre-Trained Depth-Prediction Networks for Indoor/Outdoor Image Classification},
  booktitle = {Proceedings of the {IEEE/CVF} Winter Conference on Applications of Computer Vision ({WACV}) Workshops},
  month     = jan,
  year      = {2023},
  pages     = {360--369},
}

Scalable and Accurate Self-Supervised Multimodal Representation Learning Without Aligned Video and Text Data
Vladislav Lialin,
Stephen Rawls,
David Chan,
Shalini Ghosh,
Anna Rumshisky,
Wael Hamza
[pdf]
[bibtex]
% Workshop paper in the WACV 2023 Workshops proceedings.
@InProceedings{Lialin_2023_WACV,
  author    = {Lialin, Vladislav and Rawls, Stephen and Chan, David and Ghosh, Shalini and Rumshisky, Anna and Hamza, Wael},
  title     = {Scalable and Accurate Self-Supervised Multimodal Representation Learning Without Aligned Video and Text Data},
  booktitle = {Proceedings of the {IEEE/CVF} Winter Conference on Applications of Computer Vision ({WACV}) Workshops},
  month     = jan,
  year      = {2023},
  pages     = {390--400},
}

Masked Autoencoder for Self-Supervised Pre-Training on Lidar Point Clouds
Georg Hess,
Johan Jaxing,
Elias Svensson,
David Hagerman,
Christoffer Petersson,
Lennart Svensson
[pdf] [supp] [arXiv]
[bibtex]
% Workshop paper in the WACV 2023 Workshops proceedings.
@InProceedings{Hess_2023_WACV,
  author    = {Hess, Georg and Jaxing, Johan and Svensson, Elias and Hagerman, David and Petersson, Christoffer and Svensson, Lennart},
  title     = {Masked Autoencoder for Self-Supervised Pre-Training on Lidar Point Clouds},
  booktitle = {Proceedings of the {IEEE/CVF} Winter Conference on Applications of Computer Vision ({WACV}) Workshops},
  month     = jan,
  year      = {2023},
  pages     = {350--359},
}

MixGen: A New Multi-Modal Data Augmentation
Xiaoshuai Hao,
Yi Zhu,
Srikar Appalaraju,
Aston Zhang,
Wanqian Zhang,
Bo Li,
Mu Li
[pdf] [arXiv]
[bibtex]
% Workshop paper in the WACV 2023 Workshops proceedings.
@InProceedings{Hao_2023_WACV,
  author    = {Hao, Xiaoshuai and Zhu, Yi and Appalaraju, Srikar and Zhang, Aston and Zhang, Wanqian and Li, Bo and Li, Mu},
  title     = {{MixGen}: A New Multi-Modal Data Augmentation},
  booktitle = {Proceedings of the {IEEE/CVF} Winter Conference on Applications of Computer Vision ({WACV}) Workshops},
  month     = jan,
  year      = {2023},
  pages     = {379--389},
}

RarePlanes Soar Higher: Self-Supervised Pretraining for Resource Constrained and Synthetic Datasets
Justin Downes,
Will Gleave,
Dan Nakada
[pdf]
[bibtex]
% Workshop paper in the WACV 2023 Workshops proceedings.
@InProceedings{Downes_2023_WACV,
  author    = {Downes, Justin and Gleave, Will and Nakada, Dan},
  title     = {{RarePlanes} Soar Higher: Self-Supervised Pretraining for Resource Constrained and Synthetic Datasets},
  booktitle = {Proceedings of the {IEEE/CVF} Winter Conference on Applications of Computer Vision ({WACV}) Workshops},
  month     = jan,
  year      = {2023},
  pages     = {370--378},
}