2nd Workshop on Generative Models for Computer Vision
iEdit: Localised Text-guided Image Editing with Weak Supervision
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Bodur_2024_CVPR,
  author    = {Bodur, Rumeysa and Gundogdu, Erhan and Bhattarai, Binod and Kim, Tae-Kyun and Donoser, Michael and Bazzani, Loris},
  title     = {{iEdit}: Localised Text-guided Image Editing with Weak Supervision},
  booktitle = {Proceedings of the {IEEE/CVF} Conference on Computer Vision and Pattern Recognition ({CVPR}) Workshops},
  month     = jun,
  year      = {2024},
  pages     = {7426--7435},
}
Efficient Exploration of Image Classifier Failures with Bayesian Optimization and Text-to-Image Models
[pdf]
[arXiv]
[bibtex]@InProceedings{Le_Coz_2024_CVPR,
  author    = {Le Coz, Adrien and Ouertatani, Houssem and Herbin, St{\'e}phane and Adjed, Faouzi},
  title     = {Efficient Exploration of Image Classifier Failures with {Bayesian} Optimization and Text-to-Image Models},
  booktitle = {Proceedings of the {IEEE/CVF} Conference on Computer Vision and Pattern Recognition ({CVPR}) Workshops},
  month     = jun,
  year      = {2024},
  pages     = {7569--7578},
}
GenVideo: One-shot Target-image and Shape Aware Video Editing using T2I Diffusion Models
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Harsha_2024_CVPR,
  author    = {Harsha, Sai Sree and Revanur, Ambareesh and Agarwal, Dhwanit and Agrawal, Shradha},
  title     = {{GenVideo}: One-shot Target-image and Shape Aware Video Editing using {T2I} Diffusion Models},
  booktitle = {Proceedings of the {IEEE/CVF} Conference on Computer Vision and Pattern Recognition ({CVPR}) Workshops},
  month     = jun,
  year      = {2024},
  pages     = {7559--7568},
}
Robust Disaster Assessment from Aerial Imagery Using Text-to-Image Synthetic Data
[pdf]
[arXiv]
[bibtex]@InProceedings{Kalluri_2024_CVPR,
  author    = {Kalluri, Tarun and Lee, Jihyeon and Sohn, Kihyuk and Singla, Sahil and Chandraker, Manmohan and Xu, Joseph and Liu, Jeremiah},
  title     = {Robust Disaster Assessment from Aerial Imagery Using Text-to-Image Synthetic Data},
  booktitle = {Proceedings of the {IEEE/CVF} Conference on Computer Vision and Pattern Recognition ({CVPR}) Workshops},
  month     = jun,
  year      = {2024},
  pages     = {7449--7459},
}
Style Transfer for 2D Talking Head Generation
[pdf]
[supp]
[bibtex]@InProceedings{Pham_2024_CVPR,
  author    = {Pham, Trong Thang and Do, Tuong and Le, Nhat and Le, Ngan and Nguyen, Hung and Tjiputra, Erman and Tran, Quang and Nguyen, Anh},
  title     = {Style Transfer for {2D} Talking Head Generation},
  booktitle = {Proceedings of the {IEEE/CVF} Conference on Computer Vision and Pattern Recognition ({CVPR}) Workshops},
  month     = jun,
  year      = {2024},
  pages     = {7500--7509},
}
ART-V: Auto-Regressive Text-to-Video Generation with Diffusion Models
[pdf]
[supp]
[bibtex]@InProceedings{Weng_2024_CVPR,
  author    = {Weng, Wenming and Feng, Ruoyu and Wang, Yanhui and Dai, Qi and Wang, Chunyu and Yin, Dacheng and Zhao, Zhiyuan and Qiu, Kai and Bao, Jianmin and Yuan, Yuhui and Luo, Chong and Zhang, Yueyi and Xiong, Zhiwei},
  title     = {{ART-V}: Auto-Regressive Text-to-Video Generation with Diffusion Models},
  booktitle = {Proceedings of the {IEEE/CVF} Conference on Computer Vision and Pattern Recognition ({CVPR}) Workshops},
  month     = jun,
  year      = {2024},
  pages     = {7395--7405},
}
LATENTMAN: Generating Consistent Animated Characters using Image Diffusion Models
[pdf]
[arXiv]
[bibtex]@InProceedings{Eldesokey_2024_CVPR,
  author    = {Eldesokey, Abdelrahman and Wonka, Peter},
  title     = {{LATENTMAN}: Generating Consistent Animated Characters using Image Diffusion Models},
  booktitle = {Proceedings of the {IEEE/CVF} Conference on Computer Vision and Pattern Recognition ({CVPR}) Workshops},
  month     = jun,
  year      = {2024},
  pages     = {7510--7519},
}
MixSyn: Compositional Image Synthesis with Fuzzy Masks and Style Fusion
[pdf]
[supp]
[bibtex]@InProceedings{Demir_2024_CVPR,
  author    = {Demir, Ilke and Ciftci, Umur Aybars},
  title     = {{MixSyn}: Compositional Image Synthesis with Fuzzy Masks and Style Fusion},
  booktitle = {Proceedings of the {IEEE/CVF} Conference on Computer Vision and Pattern Recognition ({CVPR}) Workshops},
  month     = jun,
  year      = {2024},
  pages     = {7460--7469},
}
Gaussian Splatting Decoder for 3D-aware Generative Adversarial Networks
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Barthel_2024_CVPR,
  author    = {Barthel, Florian and Beckmann, Arian and Morgenstern, Wieland and Hilsmann, Anna and Eisert, Peter},
  title     = {{Gaussian} Splatting Decoder for {3D}-aware Generative Adversarial Networks},
  booktitle = {Proceedings of the {IEEE/CVF} Conference on Computer Vision and Pattern Recognition ({CVPR}) Workshops},
  month     = jun,
  year      = {2024},
  pages     = {7963--7972},
}
Contrastive Clothing and Pose Generation for Cloth-Changing Person Re-Identification
[pdf]
[bibtex]@InProceedings{Nguyen_2024_CVPR,
  author    = {Nguyen, Vuong D. and Mantini, Pranav and Shah, Shishir K.},
  title     = {Contrastive Clothing and Pose Generation for Cloth-Changing Person Re-Identification},
  booktitle = {Proceedings of the {IEEE/CVF} Conference on Computer Vision and Pattern Recognition ({CVPR}) Workshops},
  month     = jun,
  year      = {2024},
  pages     = {7541--7549},
}
PQ-VAE: Learning Hierarchical Discrete Representations with Progressive Quantization
[pdf]
[bibtex]@InProceedings{Huang_2024_CVPR,
  author    = {Huang, Lun and Qiu, Qiang and Sapiro, Guillermo},
  title     = {{PQ-VAE}: Learning Hierarchical Discrete Representations with Progressive Quantization},
  booktitle = {Proceedings of the {IEEE/CVF} Conference on Computer Vision and Pattern Recognition ({CVPR}) Workshops},
  month     = jun,
  year      = {2024},
  pages     = {7550--7558},
}
OmniControlNet: Dual-stage Integration for Conditional Image Generation
[pdf]
[arXiv]
[bibtex]@InProceedings{Wang_2024_CVPR,
  author    = {Wang, Yilin and Xu, Haiyang and Zhang, Xiang and Chen, Zeyuan and Sha, Zhizhou and Wang, Zirui and Tu, Zhuowen},
  title     = {{OmniControlNet}: Dual-stage Integration for Conditional Image Generation},
  booktitle = {Proceedings of the {IEEE/CVF} Conference on Computer Vision and Pattern Recognition ({CVPR}) Workshops},
  month     = jun,
  year      = {2024},
  pages     = {7436--7448},
}
StereoDiffusion: Training-Free Stereo Image Generation Using Latent Diffusion Models
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Wang_2024_CVPR_StereoDiffusion,
  author    = {Wang, Lezhong and Frisvad, Jeppe Revall and Jensen, Mark Bo and Bigdeli, Siavash Arjomand},
  title     = {{StereoDiffusion}: Training-Free Stereo Image Generation Using Latent Diffusion Models},
  booktitle = {Proceedings of the {IEEE/CVF} Conference on Computer Vision and Pattern Recognition ({CVPR}) Workshops},
  month     = jun,
  year      = {2024},
  pages     = {7416--7425},
}
Segmentation-Free Guidance for Text-to-Image Diffusion Models
[pdf]
[arXiv]
[bibtex]@InProceedings{Azarian_2024_CVPR,
  author    = {Azarian, Kambiz and Das, Debasmit and Hou, Qiqi and Porikli, Fatih},
  title     = {Segmentation-Free Guidance for Text-to-Image Diffusion Models},
  booktitle = {Proceedings of the {IEEE/CVF} Conference on Computer Vision and Pattern Recognition ({CVPR}) Workshops},
  month     = jun,
  year      = {2024},
  pages     = {7520--7529},
}
Salient Object-Aware Background Generation using Text-Guided Diffusion Models
[pdf]
[arXiv]
[bibtex]@InProceedings{Eshratifar_2024_CVPR,
  author    = {Eshratifar, Amir Erfan and Soares, Joao V. B. and Thadani, Kapil and Mishra, Shaunak and Kuznetsov, Mikhail and Ku, Yueh-Ning and De Juan, Paloma},
  title     = {Salient Object-Aware Background Generation using Text-Guided Diffusion Models},
  booktitle = {Proceedings of the {IEEE/CVF} Conference on Computer Vision and Pattern Recognition ({CVPR}) Workshops},
  month     = jun,
  year      = {2024},
  pages     = {7489--7499},
}
MVDiff: Scalable and Flexible Multi-view Diffusion for 3D Object Reconstruction from Single-View
[pdf]
[arXiv]
[bibtex]@InProceedings{Bourigault_2024_CVPR,
  author    = {Bourigault, Emmanuelle and Bourigault, Pauline},
  title     = {{MVDiff}: Scalable and Flexible Multi-view Diffusion for {3D} Object Reconstruction from Single-View},
  booktitle = {Proceedings of the {IEEE/CVF} Conference on Computer Vision and Pattern Recognition ({CVPR}) Workshops},
  month     = jun,
  year      = {2024},
  pages     = {7579--7586},
}
An Empty Room is All We Want: Automatic Defurnishing of Indoor Panoramas
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Slavcheva_2024_CVPR,
  author    = {Slavcheva, Mira and Gausebeck, Dave and Chen, Kevin and Buchhofer, David and Sabik, Azwad and Ma, Chen and Dhillon, Sachal and Brandt, Olaf and Dolhasz, Alan},
  title     = {An Empty Room is All We Want: Automatic Defurnishing of Indoor Panoramas},
  booktitle = {Proceedings of the {IEEE/CVF} Conference on Computer Vision and Pattern Recognition ({CVPR}) Workshops},
  month     = jun,
  year      = {2024},
  pages     = {7384--7394},
}
Can Synthetic Plant Images From Generative Models Facilitate Rare Species Identification and Classification?
[pdf]
[supp]
[bibtex]@InProceedings{Dasgupta_2024_CVPR,
  author    = {Dasgupta, Debajyoti and Mondal, Arijit and Chakrabarti, Partha P.},
  title     = {Can Synthetic Plant Images From Generative Models Facilitate Rare Species Identification and Classification?},
  booktitle = {Proceedings of the {IEEE/CVF} Conference on Computer Vision and Pattern Recognition ({CVPR}) Workshops},
  month     = jun,
  year      = {2024},
  pages     = {7530--7540},
}
Investigating the Effectiveness of Cross-Attention to Unlock Zero-Shot Editing of Text-to-Video Diffusion Models
[pdf]
[arXiv]
[bibtex]@InProceedings{Motamed_2024_CVPR,
  author    = {Motamed, Saman and Van Gansbeke, Wouter and Van Gool, Luc},
  title     = {Investigating the Effectiveness of Cross-Attention to Unlock Zero-Shot Editing of Text-to-Video Diffusion Models},
  booktitle = {Proceedings of the {IEEE/CVF} Conference on Computer Vision and Pattern Recognition ({CVPR}) Workshops},
  month     = jun,
  year      = {2024},
  pages     = {7406--7415},
}
AI Art Neural Constellation: Revealing the Collective and Contrastive State of AI-Generated and Human Art
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Khan_2024_CVPR,
  author    = {Khan, Faizan Farooq and Kim, Diana and Jha, Divyansh and Mohamed, Youssef and Chang, Hanna H and Elgammal, Ahmed and Elliott, Luba and Elhoseiny, Mohamed},
  title     = {{AI} Art Neural Constellation: Revealing the Collective and Contrastive State of {AI}-Generated and Human Art},
  booktitle = {Proceedings of the {IEEE/CVF} Conference on Computer Vision and Pattern Recognition ({CVPR}) Workshops},
  month     = jun,
  year      = {2024},
  pages     = {7470--7478},
}
GeoGen: Geometry-Aware Generative Modeling via Signed Distance Functions
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Esposito_2024_CVPR,
  author    = {Esposito, Salvatore and Xu, Qingshan and Kania, Kacper and Hewitt, Charlie and Mariotti, Octave and Petikam, Lohit and Valentin, Julien and Onken, Arno and Mac Aodha, Oisin},
  title     = {{GeoGen}: Geometry-Aware Generative Modeling via Signed Distance Functions},
  booktitle = {Proceedings of the {IEEE/CVF} Conference on Computer Vision and Pattern Recognition ({CVPR}) Workshops},
  month     = jun,
  year      = {2024},
  pages     = {7479--7488},
}