CVPR 2024 Open Access Repository

2nd Workshop on Generative Models for Computer Vision

iEdit: Localised Text-guided Image Editing with Weak Supervision: Rumeysa Bodur,

Erhan Gundogdu,

Binod Bhattarai,

Tae-Kyun Kim,

Michael Donoser,

Loris Bazzani; [pdf] [supp] [arXiv]
[bibtex]
% CVPR 2024 Workshops paper. The braced title word keeps its capitalisation
% under sentence-casing styles; month uses the standard macro and pages an
% en-dash range so the bibliography style controls their presentation.
@InProceedings{Bodur_2024_CVPR,
  author    = {Bodur, Rumeysa and Gundogdu, Erhan and Bhattarai, Binod and Kim, Tae-Kyun and Donoser, Michael and Bazzani, Loris},
  title     = {{iEdit}: Localised Text-guided Image Editing with Weak Supervision},
  booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR) Workshops},
  month     = jun,
  year      = {2024},
  pages     = {7426--7435},
}
Efficient Exploration of Image Classifier Failures with Bayesian Optimization and Text-to-Image Models: Adrien Le Coz,

Houssem Ouertatani,

Stéphane Herbin,

Faouzi Adjed; [pdf] [arXiv]
[bibtex]
% CVPR 2024 Workshops paper. The accent is written as a brace-wrapped special
% character so BibTeX treats it as a single letter when sorting and labelling;
% the braced title word keeps its capitalisation under sentence-casing styles.
@InProceedings{Le_Coz_2024_CVPR,
  author    = {Le Coz, Adrien and Ouertatani, Houssem and Herbin, St{\'e}phane and Adjed, Faouzi},
  title     = {Efficient Exploration of Image Classifier Failures with {Bayesian} Optimization and Text-to-Image Models},
  booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR) Workshops},
  month     = jun,
  year      = {2024},
  pages     = {7569--7578},
}
GenVideo: One-shot Target-image and Shape Aware Video Editing using T2I Diffusion Models: Sai Sree Harsha,

Ambareesh Revanur,

Dhwanit Agarwal,

Shradha Agrawal; [pdf] [supp] [arXiv]
[bibtex]
% CVPR 2024 Workshops paper. Braced title words (method name, acronym) keep
% their capitalisation under sentence-casing styles; month uses the standard
% macro and pages an en-dash range.
@InProceedings{Harsha_2024_CVPR,
  author    = {Harsha, Sai Sree and Revanur, Ambareesh and Agarwal, Dhwanit and Agrawal, Shradha},
  title     = {{GenVideo}: One-shot Target-image and Shape Aware Video Editing using {T2I} Diffusion Models},
  booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR) Workshops},
  month     = jun,
  year      = {2024},
  pages     = {7559--7568},
}
Robust Disaster Assessment from Aerial Imagery Using Text-to-Image Synthetic Data: Tarun Kalluri,

Jihyeon Lee,

Kihyuk Sohn,

Sahil Singla,

Manmohan Chandraker,

Joseph Xu,

Jeremiah Liu; [pdf] [arXiv]
[bibtex]
% CVPR 2024 Workshops paper. Month uses the standard macro and pages an
% en-dash range so the bibliography style controls their presentation.
@InProceedings{Kalluri_2024_CVPR,
  author    = {Kalluri, Tarun and Lee, Jihyeon and Sohn, Kihyuk and Singla, Sahil and Chandraker, Manmohan and Xu, Joseph and Liu, Jeremiah},
  title     = {Robust Disaster Assessment from Aerial Imagery Using Text-to-Image Synthetic Data},
  booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR) Workshops},
  month     = jun,
  year      = {2024},
  pages     = {7449--7459},
}
Style Transfer for 2D Talking Head Generation: Trong Thang Pham,

Tuong Do,

Nhat Le,

Ngan Le,

Hung Nguyen,

Erman Tjiputra,

Quang Tran,

Anh Nguyen; [pdf] [supp]
[bibtex]
% CVPR 2024 Workshops paper. "2D" is braced so sentence-casing styles do not
% lowercase it; month uses the standard macro and pages an en-dash range.
@InProceedings{Pham_2024_CVPR,
  author    = {Pham, Trong Thang and Do, Tuong and Le, Nhat and Le, Ngan and Nguyen, Hung and Tjiputra, Erman and Tran, Quang and Nguyen, Anh},
  title     = {Style Transfer for {2D} Talking Head Generation},
  booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR) Workshops},
  month     = jun,
  year      = {2024},
  pages     = {7500--7509},
}
ART-V: Auto-Regressive Text-to-Video Generation with Diffusion Models: Wenming Weng,

Ruoyu Feng,

Yanhui Wang,

Qi Dai,

Chunyu Wang,

Dacheng Yin,

Zhiyuan Zhao,

Kai Qiu,

Jianmin Bao,

Yuhui Yuan,

Chong Luo,

Yueyi Zhang,

Zhiwei Xiong; [pdf] [supp]
[bibtex]
% CVPR 2024 Workshops paper. The braced method name keeps its capitalisation
% under sentence-casing styles; month uses the standard macro and pages an
% en-dash range.
@InProceedings{Weng_2024_CVPR,
  author    = {Weng, Wenming and Feng, Ruoyu and Wang, Yanhui and Dai, Qi and Wang, Chunyu and Yin, Dacheng and Zhao, Zhiyuan and Qiu, Kai and Bao, Jianmin and Yuan, Yuhui and Luo, Chong and Zhang, Yueyi and Xiong, Zhiwei},
  title     = {{ART-V}: Auto-Regressive Text-to-Video Generation with Diffusion Models},
  booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR) Workshops},
  month     = jun,
  year      = {2024},
  pages     = {7395--7405},
}
LATENTMAN: Generating Consistent Animated Characters using Image Diffusion Models: Abdelrahman Eldesokey,

Peter Wonka; [pdf] [arXiv]
[bibtex]
% CVPR 2024 Workshops paper. The braced method name keeps its all-caps form
% under sentence-casing styles; month uses the standard macro and pages an
% en-dash range.
@InProceedings{Eldesokey_2024_CVPR,
  author    = {Eldesokey, Abdelrahman and Wonka, Peter},
  title     = {{LATENTMAN}: Generating Consistent Animated Characters using Image Diffusion Models},
  booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR) Workshops},
  month     = jun,
  year      = {2024},
  pages     = {7510--7519},
}
MixSyn: Compositional Image Synthesis with Fuzzy Masks and Style Fusion: Ilke Demir,

Umur Aybars Ciftci; [pdf] [supp]
[bibtex]
% CVPR 2024 Workshops paper. The braced method name keeps its capitalisation
% under sentence-casing styles; month uses the standard macro and pages an
% en-dash range.
@InProceedings{Demir_2024_CVPR,
  author    = {Demir, Ilke and Ciftci, Umur Aybars},
  title     = {{MixSyn}: Compositional Image Synthesis with Fuzzy Masks and Style Fusion},
  booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR) Workshops},
  month     = jun,
  year      = {2024},
  pages     = {7460--7469},
}
Gaussian Splatting Decoder for 3D-aware Generative Adversarial Networks: Florian Barthel,

Arian Beckmann,

Wieland Morgenstern,

Anna Hilsmann,

Peter Eisert; [pdf] [supp] [arXiv]
[bibtex]
% CVPR 2024 Workshops paper. "Gaussian" and "3D" are braced so sentence-casing
% styles do not lowercase them; month uses the standard macro and pages an
% en-dash range.
@InProceedings{Barthel_2024_CVPR,
  author    = {Barthel, Florian and Beckmann, Arian and Morgenstern, Wieland and Hilsmann, Anna and Eisert, Peter},
  title     = {{Gaussian} Splatting Decoder for {3D}-aware Generative Adversarial Networks},
  booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR) Workshops},
  month     = jun,
  year      = {2024},
  pages     = {7963--7972},
}
Contrastive Clothing and Pose Generation for Cloth-Changing Person Re-Identification: Vuong D. Nguyen,

Pranav Mantini,

Shishir K. Shah; [pdf]
[bibtex]
% CVPR 2024 Workshops paper. Month uses the standard macro and pages an
% en-dash range so the bibliography style controls their presentation.
@InProceedings{Nguyen_2024_CVPR,
  author    = {Nguyen, Vuong D. and Mantini, Pranav and Shah, Shishir K.},
  title     = {Contrastive Clothing and Pose Generation for Cloth-Changing Person Re-Identification},
  booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR) Workshops},
  month     = jun,
  year      = {2024},
  pages     = {7541--7549},
}
PQ-VAE: Learning Hierarchical Discrete Representations with Progressive Quantization: Lun Huang,

Qiang Qiu,

Guillermo Sapiro; [pdf]
[bibtex]
% CVPR 2024 Workshops paper. The braced method name keeps its capitalisation
% under sentence-casing styles; month uses the standard macro and pages an
% en-dash range.
@InProceedings{Huang_2024_CVPR,
  author    = {Huang, Lun and Qiu, Qiang and Sapiro, Guillermo},
  title     = {{PQ-VAE}: Learning Hierarchical Discrete Representations with Progressive Quantization},
  booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR) Workshops},
  month     = jun,
  year      = {2024},
  pages     = {7550--7558},
}
OmniControlNet: Dual-stage Integration for Conditional Image Generation: Yilin Wang,

Haiyang Xu,

Xiang Zhang,

Zeyuan Chen,

Zhizhou Sha,

Zirui Wang,

Zhuowen Tu; [pdf] [arXiv]
[bibtex]
% CVPR 2024 Workshops paper. The braced method name keeps its capitalisation
% under sentence-casing styles; month uses the standard macro and pages an
% en-dash range.
@InProceedings{Wang_2024_CVPR,
  author    = {Wang, Yilin and Xu, Haiyang and Zhang, Xiang and Chen, Zeyuan and Sha, Zhizhou and Wang, Zirui and Tu, Zhuowen},
  title     = {{OmniControlNet}: Dual-stage Integration for Conditional Image Generation},
  booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR) Workshops},
  month     = jun,
  year      = {2024},
  pages     = {7436--7448},
}
StereoDiffusion: Training-Free Stereo Image Generation Using Latent Diffusion Models: Lezhong Wang,

Jeppe Revall Frisvad,

Mark Bo Jensen,

Siavash Arjomand Bigdeli; [pdf] [supp] [arXiv]
[bibtex]
% CVPR 2024 Workshops paper. The key carries a title suffix because the plain
% key Wang_2024_CVPR is already used by the OmniControlNet entry in this file;
% a repeated key is an error in BibTeX and makes this entry uncitable.
% The braced method name keeps its capitalisation under sentence-casing styles;
% month uses the standard macro and pages an en-dash range.
@InProceedings{Wang_2024_CVPR_StereoDiffusion,
  author    = {Wang, Lezhong and Frisvad, Jeppe Revall and Jensen, Mark Bo and Bigdeli, Siavash Arjomand},
  title     = {{StereoDiffusion}: Training-Free Stereo Image Generation Using Latent Diffusion Models},
  booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR) Workshops},
  month     = jun,
  year      = {2024},
  pages     = {7416--7425},
}
Segmentation-Free Guidance for Text-to-Image Diffusion Models: Kambiz Azarian,

Debasmit Das,

Qiqi Hou,

Fatih Porikli; [pdf] [arXiv]
[bibtex]
% CVPR 2024 Workshops paper. Month uses the standard macro and pages an
% en-dash range so the bibliography style controls their presentation.
@InProceedings{Azarian_2024_CVPR,
  author    = {Azarian, Kambiz and Das, Debasmit and Hou, Qiqi and Porikli, Fatih},
  title     = {Segmentation-Free Guidance for Text-to-Image Diffusion Models},
  booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR) Workshops},
  month     = jun,
  year      = {2024},
  pages     = {7520--7529},
}
Salient Object-Aware Background Generation using Text-Guided Diffusion Models: Amir Erfan Eshratifar,

Joao V.B. Soares,

Kapil Thadani,

Shaunak Mishra,

Mikhail Kuznetsov,

Yueh-Ning Ku,

Paloma De Juan; [pdf] [arXiv]
[bibtex]
% CVPR 2024 Workshops paper. The second author's initials are separated by a
% space so BibTeX parses them as two given-name tokens; month uses the standard
% macro and pages an en-dash range.
@InProceedings{Eshratifar_2024_CVPR,
  author    = {Eshratifar, Amir Erfan and Soares, Joao V. B. and Thadani, Kapil and Mishra, Shaunak and Kuznetsov, Mikhail and Ku, Yueh-Ning and De Juan, Paloma},
  title     = {Salient Object-Aware Background Generation using Text-Guided Diffusion Models},
  booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR) Workshops},
  month     = jun,
  year      = {2024},
  pages     = {7489--7499},
}
MVDiff: Scalable and Flexible Multi-view Diffusion for 3D Object Reconstruction from Single-View: Emmanuelle Bourigault,

Pauline Bourigault; [pdf] [arXiv]
[bibtex]
% CVPR 2024 Workshops paper. The method name and "3D" are braced so
% sentence-casing styles do not lowercase them; month uses the standard macro
% and pages an en-dash range.
@InProceedings{Bourigault_2024_CVPR,
  author    = {Bourigault, Emmanuelle and Bourigault, Pauline},
  title     = {{MVDiff}: Scalable and Flexible Multi-view Diffusion for {3D} Object Reconstruction from Single-View},
  booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR) Workshops},
  month     = jun,
  year      = {2024},
  pages     = {7579--7586},
}
An Empty Room is All We Want: Automatic Defurnishing of Indoor Panoramas: Mira Slavcheva,

Dave Gausebeck,

Kevin Chen,

David Buchhofer,

Azwad Sabik,

Chen Ma,

Sachal Dhillon,

Olaf Brandt,

Alan Dolhasz; [pdf] [supp] [arXiv]
[bibtex]
% CVPR 2024 Workshops paper. Month uses the standard macro and pages an
% en-dash range so the bibliography style controls their presentation.
@InProceedings{Slavcheva_2024_CVPR,
  author    = {Slavcheva, Mira and Gausebeck, Dave and Chen, Kevin and Buchhofer, David and Sabik, Azwad and Ma, Chen and Dhillon, Sachal and Brandt, Olaf and Dolhasz, Alan},
  title     = {An Empty Room is All We Want: Automatic Defurnishing of Indoor Panoramas},
  booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR) Workshops},
  month     = jun,
  year      = {2024},
  pages     = {7384--7394},
}
Can Synthetic Plant Images From Generative Models Facilitate Rare Species Identification and Classification?: Debajyoti Dasgupta,

Arijit Mondal,

Partha P. Chakrabarti; [pdf] [supp]
[bibtex]
% CVPR 2024 Workshops paper. Month uses the standard macro and pages an
% en-dash range so the bibliography style controls their presentation.
@InProceedings{Dasgupta_2024_CVPR,
  author    = {Dasgupta, Debajyoti and Mondal, Arijit and Chakrabarti, Partha P.},
  title     = {Can Synthetic Plant Images From Generative Models Facilitate Rare Species Identification and Classification?},
  booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR) Workshops},
  month     = jun,
  year      = {2024},
  pages     = {7530--7540},
}
Investigating the Effectiveness of Cross-Attention to Unlock Zero-Shot Editing of Text-to-Video Diffusion Models: Saman Motamed,

Wouter Van Gansbeke,

Luc Van Gool; [pdf] [arXiv]
[bibtex]
% CVPR 2024 Workshops paper. Month uses the standard macro and pages an
% en-dash range so the bibliography style controls their presentation.
@InProceedings{Motamed_2024_CVPR,
  author    = {Motamed, Saman and Van Gansbeke, Wouter and Van Gool, Luc},
  title     = {Investigating the Effectiveness of Cross-Attention to Unlock Zero-Shot Editing of Text-to-Video Diffusion Models},
  booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR) Workshops},
  month     = jun,
  year      = {2024},
  pages     = {7406--7415},
}
AI Art Neural Constellation: Revealing the Collective and Contrastive State of AI-Generated and Human Art: Faizan Farooq Khan,

Diana Kim,

Divyansh Jha,

Youssef Mohamed,

Hanna H Chang,

Ahmed Elgammal,

Luba Elliott,

Mohamed Elhoseiny; [pdf] [supp] [arXiv]
[bibtex]
% CVPR 2024 Workshops paper. Both occurrences of "AI" are braced so
% sentence-casing styles do not lowercase the acronym; month uses the standard
% macro and pages an en-dash range.
@InProceedings{Khan_2024_CVPR,
  author    = {Khan, Faizan Farooq and Kim, Diana and Jha, Divyansh and Mohamed, Youssef and Chang, Hanna H and Elgammal, Ahmed and Elliott, Luba and Elhoseiny, Mohamed},
  title     = {{AI} Art Neural Constellation: Revealing the Collective and Contrastive State of {AI}-Generated and Human Art},
  booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR) Workshops},
  month     = jun,
  year      = {2024},
  pages     = {7470--7478},
}
GeoGen: Geometry-Aware Generative Modeling via Signed Distance Functions: Salvatore Esposito,

Qingshan Xu,

Kacper Kania,

Charlie Hewitt,

Octave Mariotti,

Lohit Petikam,

Julien Valentin,

Arno Onken,

Oisin Mac Aodha; [pdf] [supp] [arXiv]
[bibtex]
% CVPR 2024 Workshops paper. The braced method name keeps its capitalisation
% under sentence-casing styles; month uses the standard macro and pages an
% en-dash range.
@InProceedings{Esposito_2024_CVPR,
  author    = {Esposito, Salvatore and Xu, Qingshan and Kania, Kacper and Hewitt, Charlie and Mariotti, Octave and Petikam, Lohit and Valentin, Julien and Onken, Arno and Mac Aodha, Oisin},
  title     = {{GeoGen}: Geometry-Aware Generative Modeling via Signed Distance Functions},
  booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR) Workshops},
  month     = jun,
  year      = {2024},
  pages     = {7479--7488},
}