CVPR 2026 Open Access Repository

AI for Creative Visual Content Generation, Editing and Understanding

ProFashion: Prototype-guided Fashion Video Generation with Multiple Reference Images: Xianghao Kong,

Qiaosong Qi,

Yuanbin Wang,

Biaolong Chen,

Aixi Zhang,

Anyi Rao; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Kong_2026_CVPR,
  author    = {Kong, Xianghao and Qi, Qiaosong and Wang, Yuanbin and Chen, Biaolong and Zhang, Aixi and Rao, Anyi},
  title     = {{ProFashion}: Prototype-guided Fashion Video Generation with Multiple Reference Images},
  booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR) Workshops},
  month     = jun,
  year      = {2026},
  pages     = {6001--6011},
}
FOCUS: Optimal Control for Multi-Entity World Modeling in Text-to-Image Generation: Eric Tillmann Bill,

Enis Simsar,

Thomas Hofmann; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Bill_2026_CVPR,
  author    = {Bill, Eric Tillmann and Simsar, Enis and Hofmann, Thomas},
  title     = {{FOCUS}: Optimal Control for Multi-Entity World Modeling in Text-to-Image Generation},
  booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR) Workshops},
  month     = jun,
  year      = {2026},
  pages     = {5915--5924},
}
DRA-MTransfer: Physically Realistic Video Motion Transfer with Dual-Grained Re-Adaptation: Guoli Jia,

Zhiyuan Ma,

Junyao Hu,

Xinwei Long,

Kai Tian,

Kaikai Zhao,

Zhaoxiang Liu,

Kai Wang,

Shiguang Lian,

Bowen Zhou; [pdf]
[bibtex]
@InProceedings{Jia_2026_CVPR,
  author    = {Jia, Guoli and Ma, Zhiyuan and Hu, Junyao and Long, Xinwei and Tian, Kai and Zhao, Kaikai and Liu, Zhaoxiang and Wang, Kai and Lian, Shiguang and Zhou, Bowen},
  title     = {{DRA-MTransfer}: Physically Realistic Video Motion Transfer with Dual-Grained Re-Adaptation},
  booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR) Workshops},
  month     = jun,
  year      = {2026},
  pages     = {5979--5990},
}
PLATO++: Pose-Conditioned Part-Aware Object Generation via Residual Structure Learning: Varghese P Kuruvilla,

Harishwar Rao J.,

Ravi Kiran Sarvadevabhatla; [pdf] [supp]
[bibtex]
@InProceedings{Kuruvilla_2026_CVPR,
  author    = {Kuruvilla, Varghese P and J., Harishwar Rao and Sarvadevabhatla, Ravi Kiran},
  title     = {{PLATO++}: Pose-Conditioned Part-Aware Object Generation via Residual Structure Learning},
  booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR) Workshops},
  month     = jun,
  year      = {2026},
  pages     = {6012--6021},
}
Pseudo-Unification: Entropy Probing Reveals Divergent Information Patterns in Unified Multimodal Models: Songlin Yang,

Xianghao Kong,

Anyi Rao; [pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Yang_2026_CVPR,
  author    = {Yang, Songlin and Kong, Xianghao and Rao, Anyi},
  title     = {Pseudo-Unification: Entropy Probing Reveals Divergent Information Patterns in Unified Multimodal Models},
  booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR) Workshops},
  month     = jun,
  year      = {2026},
  pages     = {6062--6072},
}
Mem-UniVST: Recurrent Gram Memory for Training-Free Temporally Consistent Video Stylization: Nimay Ballal,

Shylaja S S; [pdf]
[bibtex]
@InProceedings{Ballal_2026_CVPR,
  author    = {Ballal, Nimay and S, Shylaja S},
  title     = {{Mem-UniVST}: Recurrent {Gram} Memory for Training-Free Temporally Consistent Video Stylization},
  booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR) Workshops},
  month     = jun,
  year      = {2026},
  pages     = {5907--5914},
}
Faces in the Wild: GAN-Driven Normalization for Robust Facial Recognition: Mohit Mohit,

Atul Kumar,

Akshay Agarwal; [pdf]
[bibtex]
@InProceedings{Mohit_2026_CVPR,
  author    = {Mohit, Mohit and Kumar, Atul and Agarwal, Akshay},
  title     = {Faces in the Wild: {GAN}-Driven Normalization for Robust Facial Recognition},
  booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR) Workshops},
  month     = jun,
  year      = {2026},
  pages     = {6052--6061},
}
Towards Design Compositing: Abhinav Mahajan,

Abhikhya Tripathy,

Sudeeksha Reddy Pala,

Vaibhav Methi,

K J Joseph,

Balaji Vasan Srinivasan; [pdf] [arXiv]
[bibtex]
@InProceedings{Mahajan_2026_CVPR,
  author    = {Mahajan, Abhinav and Tripathy, Abhikhya and Pala, Sudeeksha Reddy and Methi, Vaibhav and Joseph, K J and Srinivasan, Balaji Vasan},
  title     = {Towards Design Compositing},
  booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR) Workshops},
  month     = jun,
  year      = {2026},
  pages     = {6041--6051},
}
Hi-Light: A Path to High-fidelity, High-resolution Video Relighting With A Refined Evaluation Paradigm: Xiangrui Liu,

Haoxiang Li,

Yezhou Yang; [pdf] [supp]
[bibtex]
@InProceedings{Liu_2026_CVPR,
  author    = {Liu, Xiangrui and Li, Haoxiang and Yang, Yezhou},
  title     = {{Hi-Light}: A Path to High-fidelity, High-resolution Video Relighting With A Refined Evaluation Paradigm},
  booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR) Workshops},
  month     = jun,
  year      = {2026},
  pages     = {6022--6030},
}
Visual Composition Generation of Multi-Source Heterogeneous Concepts--A Practical Study Based on the AIGC Short Film: The Meeting: Shiqin Hou,

Jiayan Chen,

Tony Zhang,

Baoyang Chen,

Anyi Rao; [pdf] [supp]
[bibtex]
@InProceedings{Hou_2026_CVPR,
  author    = {Hou, Shiqin and Chen, Jiayan and Zhang, Tony and Chen, Baoyang and Rao, Anyi},
  title     = {Visual Composition Generation of Multi-Source Heterogeneous Concepts--A Practical Study Based on the {AIGC} Short Film: {The Meeting}},
  booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR) Workshops},
  month     = jun,
  year      = {2026},
  pages     = {5968--5978},
}
LaDe: Unified Multi-Layered Graphic Media Generation and Decomposition: Vlad-Constantin Lungu-Stan,

Ionuț Mironică,

Mariana-Iuliana Georgescu; [pdf] [supp]
[bibtex]
@InProceedings{Lungu-Stan_2026_CVPR,
  author    = {Lungu-Stan, Vlad-Constantin and Mironic{\u{a}}, Ionu{\textcommabelow{t}} and Georgescu, Mariana-Iuliana},
  title     = {{LaDe}: Unified Multi-Layered Graphic Media Generation and Decomposition},
  booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR) Workshops},
  month     = jun,
  year      = {2026},
  pages     = {6031--6040},
}
Learning Temporal Relations for Evaluating Instruction-Guided Image Editing in Vision-Language Models: Pia Donabauer,

Alexander Tack,

Udo Kruschwitz; [pdf]
[bibtex]
@InProceedings{Donabauer_2026_CVPR,
  author    = {Donabauer, Pia and Tack, Alexander and Kruschwitz, Udo},
  title     = {Learning Temporal Relations for Evaluating Instruction-Guided Image Editing in Vision-Language Models},
  booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR) Workshops},
  month     = jun,
  year      = {2026},
  pages     = {5948--5958},
}
Temporal Environment-Aware Image Generation via Latent Diffusion: Nasrin Kalanat,

Yiqun Xie,

Yanhua Li,

Xiaowei Jia; [pdf] [supp]
[bibtex]
@InProceedings{Kalanat_2026_CVPR,
  author    = {Kalanat, Nasrin and Xie, Yiqun and Li, Yanhua and Jia, Xiaowei},
  title     = {Temporal Environment-Aware Image Generation via Latent Diffusion},
  booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR) Workshops},
  month     = jun,
  year      = {2026},
  pages     = {5991--6000},
}
Generating Fit Check Videos with a Handheld Camera: Bowei Chen,

Brian Curless,

Ira Kemelmacher-Shlizerman,

Steven M. Seitz; [pdf] [supp]
[bibtex]
@InProceedings{Chen_2026_CVPR,
  author    = {Chen, Bowei and Curless, Brian and Kemelmacher-Shlizerman, Ira and Seitz, Steven M.},
  title     = {Generating Fit Check Videos with a Handheld Camera},
  booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR) Workshops},
  month     = jun,
  year      = {2026},
  pages     = {5935--5947},
}
Diamonds in the Sky: Pareidolic Animals in Clouds: Miriam Horovicz,

Yacov Hel-Or,

Yael Moses; [pdf]
[bibtex]
@InProceedings{Horovicz_2026_CVPR,
  author    = {Horovicz, Miriam and Hel-Or, Yacov and Moses, Yael},
  title     = {Diamonds in the Sky: Pareidolic Animals in Clouds},
  booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR) Workshops},
  month     = jun,
  year      = {2026},
  pages     = {5959--5967},
}
LumiCtrl: Learning Illuminant Prompts for Lighting Control in Personalized Text-to-Image Models: Muhammad Atif Butt,

Kai Wang,

Javier Vazquez-Corral,

Joost Van De Weijer; [pdf] [supp]
[bibtex]
@InProceedings{Butt_2026_CVPR,
  author    = {Butt, Muhammad Atif and Wang, Kai and Vazquez-Corral, Javier and Van De Weijer, Joost},
  title     = {{LumiCtrl}: Learning Illuminant Prompts for Lighting Control in Personalized Text-to-Image Models},
  booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR) Workshops},
  month     = jun,
  year      = {2026},
  pages     = {5925--5934},
}
X-Aligner: Composed Visual Retrieval without the Bells and Whistles: Yuqian Zheng,

Mariana-Iuliana Georgescu; [pdf] [arXiv]
[bibtex]
@InProceedings{Zheng_2026_CVPR,
  author    = {Zheng, Yuqian and Georgescu, Mariana-Iuliana},
  title     = {{X-Aligner}: Composed Visual Retrieval without the Bells and Whistles},
  booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR) Workshops},
  month     = jun,
  year      = {2026},
  pages     = {6073--6082},
}