Pretraining


COMEDIAN: Self-Supervised Learning and Knowledge Distillation for Action Spotting Using Transformers
Julien Denize,
Mykola Liashuha,
Jaonary Rabarisoa,
Astrid Orcesi,
Romain Hérault
[pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Denize_2024_WACV,
  author    = {Denize, Julien and Liashuha, Mykola and Rabarisoa, Jaonary and Orcesi, Astrid and H{\'e}rault, Romain},
  title     = {{COMEDIAN}: Self-Supervised Learning and Knowledge Distillation for Action Spotting Using Transformers},
  booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV) Workshops},
  month     = jan,
  year      = {2024},
  pages     = {530--540},
}

Self-Supervised Pre-Training for Semantic Segmentation in an Indoor Scene
Sulabh Shrestha,
Yimeng Li,
Jana Košecká
[pdf] [supp]
[bibtex]
@InProceedings{Shrestha_2024_WACV,
  author    = {Shrestha, Sulabh and Li, Yimeng and Ko{\v{s}}eck{\'a}, Jana},
  title     = {Self-Supervised Pre-Training for Semantic Segmentation in an Indoor Scene},
  booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV) Workshops},
  month     = jan,
  year      = {2024},
  pages     = {625--635},
}

E-ViLM: Efficient Video-Language Model via Masked Video Modeling With Semantic Vector-Quantized Tokenizer
Zhiyuan Fang,
Skyler Zheng,
Vasu Sharma,
Robinson Piramuthu
[pdf]
[bibtex]
@InProceedings{Fang_2024_WACV,
  author    = {Fang, Zhiyuan and Zheng, Skyler and Sharma, Vasu and Piramuthu, Robinson},
  title     = {{E-ViLM}: Efficient Video-Language Model via Masked Video Modeling With Semantic Vector-Quantized Tokenizer},
  booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV) Workshops},
  month     = jan,
  year      = {2024},
  pages     = {518--529},
}

Metric Learning for 3D Point Clouds Using Optimal Transport
Siddharth Katageri,
Srinjay Sarkar,
Charu Sharma
[pdf] [supp]
[bibtex]
@InProceedings{Katageri_2024_WACV,
  author    = {Katageri, Siddharth and Sarkar, Srinjay and Sharma, Charu},
  title     = {Metric Learning for {3D} Point Clouds Using Optimal Transport},
  booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV) Workshops},
  month     = jan,
  year      = {2024},
  pages     = {561--569},
}

Does the Fairness of Your Pre-Training Hold Up? Examining the Influence of Pre-Training Techniques on Skin Tone Bias in Skin Lesion Classification
Pratinav Seth,
Abhilash K. Pai
[pdf]
[bibtex]
@InProceedings{Seth_2024_WACV,
  author    = {Seth, Pratinav and Pai, Abhilash K.},
  title     = {Does the Fairness of Your Pre-Training Hold Up? {Examining} the Influence of Pre-Training Techniques on Skin Tone Bias in Skin Lesion Classification},
  booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV) Workshops},
  month     = jan,
  year      = {2024},
  pages     = {570--577},
}

Semi-Supervised Cross-Spectral Face Recognition With Small Datasets
Anirudh Nanduri,
Rama Chellappa
[pdf]
[bibtex]
@InProceedings{Nanduri_2024_WACV,
  author    = {Nanduri, Anirudh and Chellappa, Rama},
  title     = {Semi-Supervised Cross-Spectral Face Recognition With Small Datasets},
  booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV) Workshops},
  month     = jan,
  year      = {2024},
  pages     = {588--596},
}

Labeling Indoor Scenes With Fusion of Out-of-the-Box Perception Models
Yimeng Li,
Navid Rajabi,
Sulabh Shrestha,
Reza Alimoor,
Jana Košecká
[pdf] [supp]
[bibtex]
@InProceedings{Li_2024_WACV,
  author    = {Li, Yimeng and Rajabi, Navid and Shrestha, Sulabh and Alimoor, Reza and Ko{\v{s}}eck{\'a}, Jana},
  title     = {Labeling Indoor Scenes With Fusion of Out-of-the-Box Perception Models},
  booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV) Workshops},
  month     = jan,
  year      = {2024},
  pages     = {578--587},
}

RDIR: Capturing Temporally-Invariant Representations of Multiple Objects in Videos
Piotr Zieliński,
Tomasz Kajdanowicz
[pdf] [supp]
[bibtex]
@InProceedings{Zielinski_2024_WACV,
  author    = {Zieli{\'n}ski, Piotr and Kajdanowicz, Tomasz},
  title     = {{RDIR}: Capturing Temporally-Invariant Representations of Multiple Objects in Videos},
  booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV) Workshops},
  month     = jan,
  year      = {2024},
  pages     = {597--606},
}

SLVP: Self-Supervised Language-Video Pre-Training for Referring Video Object Segmentation
Jie Mei,
AJ Piergiovanni,
Jenq-Neng Hwang,
Wei Li
[pdf]
[bibtex]
@InProceedings{Mei_2024_WACV,
  author    = {Mei, Jie and Piergiovanni, AJ and Hwang, Jenq-Neng and Li, Wei},
  title     = {{SLVP}: Self-Supervised Language-Video Pre-Training for Referring Video Object Segmentation},
  booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV) Workshops},
  month     = jan,
  year      = {2024},
  pages     = {507--517},
}

How Does Contrastive Learning Organize Images?
Yunzhe Zhang,
Yao Lu,
Qi Xuan
[pdf] [supp]
[bibtex]
@InProceedings{Zhang_2024_WACV,
  author    = {Zhang, Yunzhe and Lu, Yao and Xuan, Qi},
  title     = {How Does Contrastive Learning Organize Images?},
  booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV) Workshops},
  month     = jan,
  year      = {2024},
  pages     = {497--506},
}

Zero-Shot Edge Detection With SCESAME: Spectral Clustering-Based Ensemble for Segment Anything Model Estimation
Hiroaki Yamagiwa,
Yusuke Takase,
Hiroyuki Kambe,
Ryosuke Nakamoto
[pdf]
[bibtex]
@InProceedings{Yamagiwa_2024_WACV,
  author    = {Yamagiwa, Hiroaki and Takase, Yusuke and Kambe, Hiroyuki and Nakamoto, Ryosuke},
  title     = {Zero-Shot Edge Detection With {SCESAME}: Spectral Clustering-Based Ensemble for {Segment Anything Model} Estimation},
  booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV) Workshops},
  month     = jan,
  year      = {2024},
  pages     = {541--551},
}

Source-Free Domain Adaptation for RGB-D Semantic Segmentation With Vision Transformers
Giulia Rizzoli,
Donald Shenaj,
Pietro Zanuttigh
[pdf] [supp]
[bibtex]
@InProceedings{Rizzoli_2024_WACV,
  author    = {Rizzoli, Giulia and Shenaj, Donald and Zanuttigh, Pietro},
  title     = {Source-Free Domain Adaptation for {RGB-D} Semantic Segmentation With Vision Transformers},
  booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV) Workshops},
  month     = jan,
  year      = {2024},
  pages     = {615--624},
}

Cross-Modal Contrastive Learning With Asymmetric Co-Attention Network for Video Moment Retrieval
Love Panta,
Prashant Shrestha,
Brabeem Sapkota,
Amrita Bhattarai,
Suresh Manandhar,
Anand Kumar Sah
[pdf]
[bibtex]
@InProceedings{Panta_2024_WACV,
  author    = {Panta, Love and Shrestha, Prashant and Sapkota, Brabeem and Bhattarai, Amrita and Manandhar, Suresh and Sah, Anand Kumar},
  title     = {Cross-Modal Contrastive Learning With Asymmetric Co-Attention Network for Video Moment Retrieval},
  booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV) Workshops},
  month     = jan,
  year      = {2024},
  pages     = {607--614},
}

Evaluating Pretrained Models for Deployable Lifelong Learning
Kiran Lekkala,
Eshan Bhargava,
Laurent Itti
[pdf]
[bibtex]
@InProceedings{Lekkala_2024_WACV,
  author    = {Lekkala, Kiran and Bhargava, Eshan and Itti, Laurent},
  title     = {Evaluating Pretrained Models for Deployable Lifelong Learning},
  booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV) Workshops},
  month     = jan,
  year      = {2024},
  pages     = {552--560},
}

A Unified Framework for Cropland Field Boundary Detection and Segmentation
Rodrigo Fill Rangel,
Vítor Nascimento Lourenço,
Lucas Volochen Oldoni,
Ana Flavia Carrara Bonamigo,
Wallas Santos,
Bruno Silva Oliveira,
Mateus Neves Barreto
[pdf]
[bibtex]
@InProceedings{Rangel_2024_WACV,
  author    = {Rangel, Rodrigo Fill and Louren{\c{c}}o, V{\'\i}tor Nascimento and Oldoni, Lucas Volochen and Bonamigo, Ana Flavia Carrara and Santos, Wallas and Oliveira, Bruno Silva and Barreto, Mateus Neves},
  title     = {A Unified Framework for Cropland Field Boundary Detection and Segmentation},
  booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision (WACV) Workshops},
  month     = jan,
  year      = {2024},
  pages     = {636--644},
}