AI for Creative Visual Content Generation, Editing and Understanding


ProFashion: Prototype-guided Fashion Video Generation with Multiple Reference Images
Xianghao Kong,
Qiaosong Qi,
Yuanbin Wang,
Biaolong Chen,
Aixi Zhang,
Anyi Rao
[pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Kong_2026_CVPR,
  author    = {Kong, Xianghao and Qi, Qiaosong and Wang, Yuanbin and Chen, Biaolong and Zhang, Aixi and Rao, Anyi},
  title     = {{ProFashion}: Prototype-guided Fashion Video Generation with Multiple Reference Images},
  booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR) Workshops},
  month     = jun,
  year      = {2026},
  pages     = {6001--6011},
}

FOCUS: Optimal Control for Multi-Entity World Modeling in Text-to-Image Generation
Eric Tillmann Bill,
Enis Simsar,
Thomas Hofmann
[pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Bill_2026_CVPR,
  author    = {Bill, Eric Tillmann and Simsar, Enis and Hofmann, Thomas},
  title     = {{FOCUS}: Optimal Control for Multi-Entity World Modeling in Text-to-Image Generation},
  booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR) Workshops},
  month     = jun,
  year      = {2026},
  pages     = {5915--5924},
}

DRA-MTransfer: Physically Realistic Video Motion Transfer with Dual-Grained Re-Adaptation
Guoli Jia,
Zhiyuan Ma,
Junyao Hu,
Xinwei Long,
Kai Tian,
Kaikai Zhao,
Zhaoxiang Liu,
Kai Wang,
Shiguang Lian,
Bowen Zhou
[pdf]
[bibtex]
@InProceedings{Jia_2026_CVPR,
  author    = {Jia, Guoli and Ma, Zhiyuan and Hu, Junyao and Long, Xinwei and Tian, Kai and Zhao, Kaikai and Liu, Zhaoxiang and Wang, Kai and Lian, Shiguang and Zhou, Bowen},
  title     = {{DRA-MTransfer}: Physically Realistic Video Motion Transfer with Dual-Grained Re-Adaptation},
  booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR) Workshops},
  month     = jun,
  year      = {2026},
  pages     = {5979--5990},
}

PLATO++: Pose-Conditioned Part-Aware Object Generation via Residual Structure Learning
Varghese P Kuruvilla,
Harishwar Rao J.,
Ravi Kiran Sarvadevabhatla
[pdf] [supp]
[bibtex]
@InProceedings{Kuruvilla_2026_CVPR,
  author    = {Kuruvilla, Varghese P and J., Harishwar Rao and Sarvadevabhatla, Ravi Kiran},
  title     = {{PLATO++}: Pose-Conditioned Part-Aware Object Generation via Residual Structure Learning},
  booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR) Workshops},
  month     = jun,
  year      = {2026},
  pages     = {6012--6021},
}

Pseudo-Unification: Entropy Probing Reveals Divergent Information Patterns in Unified Multimodal Models
Songlin Yang,
Xianghao Kong,
Anyi Rao
[pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Yang_2026_CVPR,
  author    = {Yang, Songlin and Kong, Xianghao and Rao, Anyi},
  title     = {Pseudo-Unification: Entropy Probing Reveals Divergent Information Patterns in Unified Multimodal Models},
  booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR) Workshops},
  month     = jun,
  year      = {2026},
  pages     = {6062--6072},
}

Mem-UniVST: Recurrent Gram Memory for Training-Free Temporally Consistent Video Stylization
Nimay Ballal,
Shylaja S S
[pdf]
[bibtex]
@InProceedings{Ballal_2026_CVPR,
  author    = {Ballal, Nimay and S, Shylaja S},
  title     = {{Mem-UniVST}: Recurrent {Gram} Memory for Training-Free Temporally Consistent Video Stylization},
  booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR) Workshops},
  month     = jun,
  year      = {2026},
  pages     = {5907--5914},
}

Faces in the Wild: GAN-Driven Normalization for Robust Facial Recognition
Mohit Mohit,
Atul Kumar,
Akshay Agarwal
[pdf]
[bibtex]
@InProceedings{Mohit_2026_CVPR,
  author    = {Mohit, Mohit and Kumar, Atul and Agarwal, Akshay},
  title     = {Faces in the Wild: {GAN}-Driven Normalization for Robust Facial Recognition},
  booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR) Workshops},
  month     = jun,
  year      = {2026},
  pages     = {6052--6061},
}

Towards Design Compositing
Abhinav Mahajan,
Abhikhya Tripathy,
Sudeeksha Reddy Pala,
Vaibhav Methi,
K J Joseph,
Balaji Vasan Srinivasan
[pdf] [arXiv]
[bibtex]
@InProceedings{Mahajan_2026_CVPR,
  author    = {Mahajan, Abhinav and Tripathy, Abhikhya and Pala, Sudeeksha Reddy and Methi, Vaibhav and Joseph, K J and Srinivasan, Balaji Vasan},
  title     = {Towards Design Compositing},
  booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR) Workshops},
  month     = jun,
  year      = {2026},
  pages     = {6041--6051},
}

Hi-Light: A Path to High-fidelity, High-resolution Video Relighting With A Refined Evaluation Paradigm
Xiangrui Liu,
Haoxiang Li,
Yezhou Yang
[pdf] [supp]
[bibtex]
@InProceedings{Liu_2026_CVPR,
  author    = {Liu, Xiangrui and Li, Haoxiang and Yang, Yezhou},
  title     = {{Hi-Light}: A Path to High-fidelity, High-resolution Video Relighting With A Refined Evaluation Paradigm},
  booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR) Workshops},
  month     = jun,
  year      = {2026},
  pages     = {6022--6030},
}

Visual Composition Generation of Multi-Source Heterogeneous Concepts--A Practical Study Based on the AIGC Short Film: The Meeting
Shiqin Hou,
Jiayan Chen,
Tony Zhang,
Baoyang Chen,
Anyi Rao
[pdf] [supp]
[bibtex]
% "The Meeting" is braced as a unit because it reads as the film's title and must keep its capitals under sentence-casing styles.
@InProceedings{Hou_2026_CVPR,
  author    = {Hou, Shiqin and Chen, Jiayan and Zhang, Tony and Chen, Baoyang and Rao, Anyi},
  title     = {Visual Composition Generation of Multi-Source Heterogeneous Concepts--A Practical Study Based on the {AIGC} Short Film: {The Meeting}},
  booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR) Workshops},
  month     = jun,
  year      = {2026},
  pages     = {5968--5978},
}

LaDe: Unified Multi-Layered Graphic Media Generation and Decomposition
Vlad-Constantin Lungu-Stan,
Ionuț Mironică,
Mariana-Iuliana Georgescu
[pdf] [supp]
[bibtex]
% Diacritics in the author field are written as braced LaTeX escapes (a-breve, t-comma-below) so the entry stays pure ASCII and sorts correctly under classic BibTeX.
@InProceedings{Lungu-Stan_2026_CVPR,
  author    = {Lungu-Stan, Vlad-Constantin and Mironic{\u{a}}, Ionu{\textcommabelow{t}} and Georgescu, Mariana-Iuliana},
  title     = {{LaDe}: Unified Multi-Layered Graphic Media Generation and Decomposition},
  booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR) Workshops},
  month     = jun,
  year      = {2026},
  pages     = {6031--6040},
}

Learning Temporal Relations for Evaluating Instruction-Guided Image Editing in Vision-Language Models
Pia Donabauer,
Alexander Tack,
Udo Kruschwitz
[pdf]
[bibtex]
@InProceedings{Donabauer_2026_CVPR,
  author    = {Donabauer, Pia and Tack, Alexander and Kruschwitz, Udo},
  title     = {Learning Temporal Relations for Evaluating Instruction-Guided Image Editing in Vision-Language Models},
  booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR) Workshops},
  month     = jun,
  year      = {2026},
  pages     = {5948--5958},
}

Temporal Environment-Aware Image Generation via Latent Diffusion
Nasrin Kalanat,
Yiqun Xie,
Yanhua Li,
Xiaowei Jia
[pdf] [supp]
[bibtex]
@InProceedings{Kalanat_2026_CVPR,
  author    = {Kalanat, Nasrin and Xie, Yiqun and Li, Yanhua and Jia, Xiaowei},
  title     = {Temporal Environment-Aware Image Generation via Latent Diffusion},
  booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR) Workshops},
  month     = jun,
  year      = {2026},
  pages     = {5991--6000},
}

Generating Fit Check Videos with a Handheld Camera
Bowei Chen,
Brian Curless,
Ira Kemelmacher-Shlizerman,
Steven M. Seitz
[pdf] [supp]
[bibtex]
@InProceedings{Chen_2026_CVPR,
  author    = {Chen, Bowei and Curless, Brian and Kemelmacher-Shlizerman, Ira and Seitz, Steven M.},
  title     = {Generating Fit Check Videos with a Handheld Camera},
  booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR) Workshops},
  month     = jun,
  year      = {2026},
  pages     = {5935--5947},
}

Diamonds in the Sky: Pareidolic Animals in Clouds
Miriam Horovicz,
Yacov Hel-Or,
Yael Moses
[pdf]
[bibtex]
@InProceedings{Horovicz_2026_CVPR,
  author    = {Horovicz, Miriam and Hel-Or, Yacov and Moses, Yael},
  title     = {Diamonds in the Sky: Pareidolic Animals in Clouds},
  booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR) Workshops},
  month     = jun,
  year      = {2026},
  pages     = {5959--5967},
}

LumiCtrl: Learning Illuminant Prompts for Lighting Control in Personalized Text-to-Image Models
Muhammad Atif Butt,
Kai Wang,
Javier Vazquez-Corral,
Joost Van De Weijer
[pdf] [supp]
[bibtex]
@InProceedings{Butt_2026_CVPR,
  author    = {Butt, Muhammad Atif and Wang, Kai and Vazquez-Corral, Javier and Van De Weijer, Joost},
  title     = {{LumiCtrl}: Learning Illuminant Prompts for Lighting Control in Personalized Text-to-Image Models},
  booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR) Workshops},
  month     = jun,
  year      = {2026},
  pages     = {5925--5934},
}

X-Aligner: Composed Visual Retrieval without the Bells and Whistles
Yuqian Zheng,
Mariana-Iuliana Georgescu
[pdf] [arXiv]
[bibtex]
@InProceedings{Zheng_2026_CVPR,
  author    = {Zheng, Yuqian and Georgescu, Mariana-Iuliana},
  title     = {{X-Aligner}: Composed Visual Retrieval without the Bells and Whistles},
  booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR) Workshops},
  month     = jun,
  year      = {2026},
  pages     = {6073--6082},
}