CVPR 2024 Open Access Repository

L3D-IVU: 3rd Workshop on Learning with Limited Labelled Data for Image and Video Understanding

Open-world Instance Segmentation: Top-down Learning with Bottom-up Supervision: Tarun Kalluri,

Weiyao Wang,

Heng Wang,

Manmohan Chandraker,

Lorenzo Torresani,

Du Tran; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Kalluri_2024_CVPR,
  author    = {Kalluri, Tarun and Wang, Weiyao and Wang, Heng and Chandraker, Manmohan and Torresani, Lorenzo and Tran, Du},
  title     = {Open-world Instance Segmentation: Top-down Learning with Bottom-up Supervision},
  booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR) Workshops},
  month     = jun,
  year      = {2024},
  pages     = {2693--2703},
}
Human-in-the-Loop Segmentation of Multi-species Coral Imagery: Scarlett Raine,

Ross Marchant,

Brano Kusy,

Frederic Maire,

Niko Sunderhauf,

Tobias Fischer; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Raine_2024_CVPR,
  author    = {Raine, Scarlett and Marchant, Ross and Kusy, Brano and Maire, Frederic and Sunderhauf, Niko and Fischer, Tobias},
  title     = {Human-in-the-Loop Segmentation of Multi-species Coral Imagery},
  booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR) Workshops},
  month     = jun,
  year      = {2024},
  pages     = {2723--2732},
}
Learnable Prompt for Few-Shot Semantic Segmentation in Remote Sensing Domain: Steve Andreas Immanuel,

Hagai Raja Sinulingga; [pdf] [arXiv]
[bibtex]
@InProceedings{Immanuel_2024_CVPR,
  author    = {Immanuel, Steve Andreas and Sinulingga, Hagai Raja},
  title     = {Learnable Prompt for Few-Shot Semantic Segmentation in Remote Sensing Domain},
  booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR) Workshops},
  month     = jun,
  year      = {2024},
  pages     = {2755--2761},
}
Zero-Shot Monocular Motion Segmentation in the Wild by Combining Deep Learning with Geometric Motion Model Fusion: Yuxiang Huang,

Yuhao Chen,

John Zelek; [pdf] [arXiv]
[bibtex]
@InProceedings{Huang_2024_CVPR,
  author    = {Huang, Yuxiang and Chen, Yuhao and Zelek, John},
  title     = {Zero-Shot Monocular Motion Segmentation in the Wild by Combining Deep Learning with Geometric Motion Model Fusion},
  booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR) Workshops},
  month     = jun,
  year      = {2024},
  pages     = {2733--2743},
}
Weakly-Supervised Temporal Action Localization with Multi-Modal Plateau Transformers: Xin Hu,

Kai Li,

Deep Patel,

Erik Kruus,

Martin Renqiang Min,

Zhengming Ding; [pdf] [supp]
[bibtex]
@InProceedings{Hu_2024_CVPR,
  author    = {Hu, Xin and Li, Kai and Patel, Deep and Kruus, Erik and Min, Martin Renqiang and Ding, Zhengming},
  title     = {Weakly-Supervised Temporal Action Localization with Multi-Modal Plateau Transformers},
  booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR) Workshops},
  month     = jun,
  year      = {2024},
  pages     = {2704--2713},
}
UVIS: Unsupervised Video Instance Segmentation: Shuaiyi Huang,

Saksham Suri,

Kamal Gupta,

Sai Saketh Rambhatla,

Ser-Nam Lim,

Abhinav Shrivastava; [pdf] [supp] [arXiv]
[bibtex]
% Key disambiguated with a title suffix: the key Huang_2024_CVPR is already
% taken by an earlier entry in this file, and BibTeX rejects repeated keys.
@InProceedings{Huang_2024_CVPR_UVIS,
  author    = {Huang, Shuaiyi and Suri, Saksham and Gupta, Kamal and Rambhatla, Sai Saketh and Lim, Ser-Nam and Shrivastava, Abhinav},
  title     = {{UVIS}: Unsupervised Video Instance Segmentation},
  booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR) Workshops},
  month     = jun,
  year      = {2024},
  pages     = {2682--2692},
}
Active Transferability Estimation: Tarun Ram Menta,

Surgan Jandial,

Akash Patil,

Saketh Bachu,

Vimal K.B,

Balaji Krishnamurthy,

Vineeth N. Balasubramanian,

Mausoom Sarkar,

Chirag Agarwal; [pdf] [supp]
[bibtex]
@InProceedings{Menta_2024_CVPR,
  author    = {Menta, Tarun Ram and Jandial, Surgan and Patil, Akash and Bachu, Saketh and K.B, Vimal and Krishnamurthy, Balaji and Balasubramanian, Vineeth N. and Sarkar, Mausoom and Agarwal, Chirag},
  title     = {Active Transferability Estimation},
  booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR) Workshops},
  month     = jun,
  year      = {2024},
  pages     = {2659--2670},
}
SemiGPC: Distribution-Aware Label Refinement for Imbalanced Semi-Supervised Learning Using Gaussian Processes: Abdelhak Lemkhenter,

Manchen Wang,

Luca Zancato,

Gurumurthy Swaminathan,

Paolo Favaro,

Davide Modolo; [pdf] [arXiv]
[bibtex]
@InProceedings{Lemkhenter_2024_CVPR,
  author    = {Lemkhenter, Abdelhak and Wang, Manchen and Zancato, Luca and Swaminathan, Gurumurthy and Favaro, Paolo and Modolo, Davide},
  title     = {{SemiGPC}: Distribution-Aware Label Refinement for Imbalanced Semi-Supervised Learning Using {Gaussian} Processes},
  booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR) Workshops},
  month     = jun,
  year      = {2024},
  pages     = {2576--2585},
}
Enrich Distill and Fuse: Generalized Few-Shot Semantic Segmentation in Remote Sensing Leveraging Foundation Model's Assistance: Tianyi Gao,

Wei Ao,

Xing-Ao Wang,

Yuanhao Zhao,

Ping Ma,

Mengjie Xie,

Hang Fu,

Jinchang Ren,

Zhi Gao; [pdf]
[bibtex]
@InProceedings{Gao_2024_CVPR,
  author    = {Gao, Tianyi and Ao, Wei and Wang, Xing-Ao and Zhao, Yuanhao and Ma, Ping and Xie, Mengjie and Fu, Hang and Ren, Jinchang and Gao, Zhi},
  title     = {Enrich Distill and Fuse: Generalized Few-Shot Semantic Segmentation in Remote Sensing Leveraging Foundation Model's Assistance},
  booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR) Workshops},
  month     = jun,
  year      = {2024},
  pages     = {2771--2780},
}
Dynamic Knowledge Adapter with Probabilistic Calibration for Generalized Few-Shot Semantic Segmentation: Jintao Tong,

Haichen Zhou,

Yicong Liu,

Yiman Hu,

Yixiong Zou; [pdf]
[bibtex]
@InProceedings{Tong_2024_CVPR,
  author    = {Tong, Jintao and Zhou, Haichen and Liu, Yicong and Hu, Yiman and Zou, Yixiong},
  title     = {Dynamic Knowledge Adapter with Probabilistic Calibration for Generalized Few-Shot Semantic Segmentation},
  booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR) Workshops},
  month     = jun,
  year      = {2024},
  pages     = {2781--2790},
}
Uncertainty-based Forgetting Mitigation for Generalized Few-Shot Object Detection: Karim Guirguis,

George Eskandar,

Mingyang Wang,

Matthias Kayser,

Eduardo Monari,

Bin Yang,

Jürgen Beyerer; [pdf]
[bibtex]
@InProceedings{Guirguis_2024_CVPR,
  author    = {Guirguis, Karim and Eskandar, George and Wang, Mingyang and Kayser, Matthias and Monari, Eduardo and Yang, Bin and Beyerer, J{\"u}rgen},
  title     = {Uncertainty-based Forgetting Mitigation for Generalized Few-Shot Object Detection},
  booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR) Workshops},
  month     = jun,
  year      = {2024},
  pages     = {2586--2595},
}
Image-caption Difficulty for Efficient Weakly-supervised Object Detection from In-the-wild Data: Giacomo Nebbia,

Adriana Kovashka; [pdf]
[bibtex]
@InProceedings{Nebbia_2024_CVPR,
  author    = {Nebbia, Giacomo and Kovashka, Adriana},
  title     = {Image-caption Difficulty for Efficient Weakly-supervised Object Detection from In-the-wild Data},
  booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR) Workshops},
  month     = jun,
  year      = {2024},
  pages     = {2596--2605},
}
MoDA: Leveraging Motion Priors from Videos for Advancing Unsupervised Domain Adaptation in Semantic Segmentation: Fei Pan,

Xu Yin,

Seokju Lee,

Axi Niu,

Sungeui Yoon,

In So Kweon; [pdf] [arXiv]
[bibtex]
@InProceedings{Pan_2024_CVPR,
  author    = {Pan, Fei and Yin, Xu and Lee, Seokju and Niu, Axi and Yoon, Sungeui and Kweon, In So},
  title     = {{MoDA}: Leveraging Motion Priors from Videos for Advancing Unsupervised Domain Adaptation in Semantic Segmentation},
  booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR) Workshops},
  month     = jun,
  year      = {2024},
  pages     = {2649--2658},
}
Generalized Few-Shot Meets Remote Sensing: Discovering Novel Classes in Land Cover Mapping via Hybrid Semantic Segmentation Framework: Zhuohong Li,

Fangxiao Lu,

Jiaqi Zou,

Lei Hu,

Hongyan Zhang; [pdf] [arXiv]
[bibtex]
@InProceedings{Li_2024_CVPR,
  author    = {Li, Zhuohong and Lu, Fangxiao and Zou, Jiaqi and Hu, Lei and Zhang, Hongyan},
  title     = {Generalized Few-Shot Meets Remote Sensing: Discovering Novel Classes in Land Cover Mapping via Hybrid Semantic Segmentation Framework},
  booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR) Workshops},
  month     = jun,
  year      = {2024},
  pages     = {2744--2754},
}
CDAD-Net: Bridging Domain Gaps in Generalized Category Discovery: Sai Bhargav Rongali,

Sarthak Mehrotra,

Ankit Jha,

Mohamad Hassan N C,

Shirsha Bose,

Tanisha Gupta,

Mainak Singha,

Biplab Banerjee; [pdf] [supp]
[bibtex]
@InProceedings{Rongali_2024_CVPR,
  author    = {Rongali, Sai Bhargav and Mehrotra, Sarthak and Jha, Ankit and C, Mohamad Hassan N and Bose, Shirsha and Gupta, Tanisha and Singha, Mainak and Banerjee, Biplab},
  title     = {{CDAD-Net}: Bridging Domain Gaps in Generalized Category Discovery},
  booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR) Workshops},
  month     = jun,
  year      = {2024},
  pages     = {2616--2626},
}
Latent-based Diffusion Model for Long-tailed Recognition: Pengxiao Han,

Changkun Ye,

Jieming Zhou,

Jing Zhang,

Jie Hong,

Xuesong Li; [pdf] [arXiv]
[bibtex]
@InProceedings{Han_2024_CVPR,
  author    = {Han, Pengxiao and Ye, Changkun and Zhou, Jieming and Zhang, Jing and Hong, Jie and Li, Xuesong},
  title     = {Latent-based Diffusion Model for Long-tailed Recognition},
  booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR) Workshops},
  month     = jun,
  year      = {2024},
  pages     = {2639--2648},
}
On Accuracy and Speed of Geodesic Regression: Do Geometric Priors Improve Learning on Small Datasets?: Adele Myers,

Nina Miolane; [pdf] [supp]
[bibtex]
@InProceedings{Myers_2024_CVPR,
  author    = {Myers, Adele and Miolane, Nina},
  title     = {On Accuracy and Speed of Geodesic Regression: Do Geometric Priors Improve Learning on Small Datasets?},
  booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR) Workshops},
  month     = jun,
  year      = {2024},
  pages     = {2714--2722},
}
What is Point Supervision Worth in Video Instance Segmentation?: Shuaiyi Huang,

De-An Huang,

Zhiding Yu,

Shiyi Lan,

Subhashree Radhakrishnan,

Jose M. Alvarez,

Abhinav Shrivastava,

Anima Anandkumar; [pdf] [supp] [arXiv]
[bibtex]
% Key disambiguated with a title suffix: the key Huang_2024_CVPR is already
% taken by an earlier entry in this file, and BibTeX rejects repeated keys.
@InProceedings{Huang_2024_CVPR_PointVIS,
  author    = {Huang, Shuaiyi and Huang, De-An and Yu, Zhiding and Lan, Shiyi and Radhakrishnan, Subhashree and Alvarez, Jose M. and Shrivastava, Abhinav and Anandkumar, Anima},
  title     = {What is Point Supervision Worth in Video Instance Segmentation?},
  booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR) Workshops},
  month     = jun,
  year      = {2024},
  pages     = {2671--2681},
}
Audio-Visual Generalized Zero-Shot Learning using Pre-Trained Large Multi-Modal Models: David Kurzendörfer,

Otniel-Bogdan Mercea,

A. Sophia Koepke,

Zeynep Akata; [pdf] [supp]
[bibtex]
@InProceedings{Kurzendorfer_2024_CVPR,
  author    = {Kurzend{\"o}rfer, David and Mercea, Otniel-Bogdan and Koepke, A. Sophia and Akata, Zeynep},
  title     = {Audio-Visual Generalized Zero-Shot Learning using Pre-Trained Large Multi-Modal Models},
  booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR) Workshops},
  month     = jun,
  year      = {2024},
  pages     = {2627--2638},
}
Learning Tracking Representations from Single Point Annotations: Qiangqiang Wu,

Antoni B. Chan; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Wu_2024_CVPR,
  author    = {Wu, Qiangqiang and Chan, Antoni B.},
  title     = {Learning Tracking Representations from Single Point Annotations},
  booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR) Workshops},
  month     = jun,
  year      = {2024},
  pages     = {2606--2615},
}