AI for Creative Visual Content Generation, Editing and Understanding
ProFashion: Prototype-guided Fashion Video Generation with Multiple Reference Images-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Kong_2026_CVPR,
  author    = {Kong, Xianghao and Qi, Qiaosong and Wang, Yuanbin and Chen, Biaolong and Zhang, Aixi and Rao, Anyi},
  title     = {{ProFashion}: Prototype-guided Fashion Video Generation with Multiple Reference Images},
  booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR) Workshops},
  month     = jun,
  year      = {2026},
  pages     = {6001--6011},
}
FOCUS: Optimal Control for Multi-Entity World Modeling in Text-to-Image Generation-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Bill_2026_CVPR,
  author    = {Bill, Eric Tillmann and Simsar, Enis and Hofmann, Thomas},
  title     = {{FOCUS}: Optimal Control for Multi-Entity World Modeling in Text-to-Image Generation},
  booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR) Workshops},
  month     = jun,
  year      = {2026},
  pages     = {5915--5924},
}
DRA-MTransfer: Physically Realistic Video Motion Transfer with Dual-Grained Re-Adaptation-
[pdf]
[bibtex]@InProceedings{Jia_2026_CVPR,
  author    = {Jia, Guoli and Ma, Zhiyuan and Hu, Junyao and Long, Xinwei and Tian, Kai and Zhao, Kaikai and Liu, Zhaoxiang and Wang, Kai and Lian, Shiguang and Zhou, Bowen},
  title     = {{DRA-MTransfer}: Physically Realistic Video Motion Transfer with Dual-Grained Re-Adaptation},
  booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR) Workshops},
  month     = jun,
  year      = {2026},
  pages     = {5979--5990},
}
PLATO++: Pose-Conditioned Part-Aware Object Generation via Residual Structure Learning-
[pdf]
[supp]
[bibtex]@InProceedings{Kuruvilla_2026_CVPR,
  author    = {Kuruvilla, Varghese P and J., Harishwar Rao and Sarvadevabhatla, Ravi Kiran},
  title     = {{PLATO++}: Pose-Conditioned Part-Aware Object Generation via Residual Structure Learning},
  booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR) Workshops},
  month     = jun,
  year      = {2026},
  pages     = {6012--6021},
}
Pseudo-Unification: Entropy Probing Reveals Divergent Information Patterns in Unified Multimodal Models-
[pdf]
[supp]
[arXiv]
[bibtex]@InProceedings{Yang_2026_CVPR,
  author    = {Yang, Songlin and Kong, Xianghao and Rao, Anyi},
  title     = {Pseudo-Unification: Entropy Probing Reveals Divergent Information Patterns in Unified Multimodal Models},
  booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR) Workshops},
  month     = jun,
  year      = {2026},
  pages     = {6062--6072},
}
Mem-UniVST: Recurrent Gram Memory for Training-Free Temporally Consistent Video Stylization-
[pdf]
[bibtex]@InProceedings{Ballal_2026_CVPR,
  author    = {Ballal, Nimay and S, Shylaja S},
  title     = {{Mem-UniVST}: Recurrent {Gram} Memory for Training-Free Temporally Consistent Video Stylization},
  booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR) Workshops},
  month     = jun,
  year      = {2026},
  pages     = {5907--5914},
}
Faces in the Wild: GAN-Driven Normalization for Robust Facial Recognition-
[pdf]
[bibtex]@InProceedings{Mohit_2026_CVPR,
  author    = {Mohit, Mohit and Kumar, Atul and Agarwal, Akshay},
  title     = {Faces in the Wild: {GAN}-Driven Normalization for Robust Facial Recognition},
  booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR) Workshops},
  month     = jun,
  year      = {2026},
  pages     = {6052--6061},
}
Towards Design Compositing-
[pdf]
[arXiv]
[bibtex]@InProceedings{Mahajan_2026_CVPR,
  author    = {Mahajan, Abhinav and Tripathy, Abhikhya and Pala, Sudeeksha Reddy and Methi, Vaibhav and Joseph, K J and Srinivasan, Balaji Vasan},
  title     = {Towards Design Compositing},
  booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR) Workshops},
  month     = jun,
  year      = {2026},
  pages     = {6041--6051},
}
Hi-Light: A Path to High-fidelity, High-resolution Video Relighting With A Refined Evaluation Paradigm-
[pdf]
[supp]
[bibtex]@InProceedings{Liu_2026_CVPR,
  author    = {Liu, Xiangrui and Li, Haoxiang and Yang, Yezhou},
  title     = {{Hi-Light}: A Path to High-fidelity, High-resolution Video Relighting With A Refined Evaluation Paradigm},
  booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR) Workshops},
  month     = jun,
  year      = {2026},
  pages     = {6022--6030},
}
Visual Composition Generation of Multi-Source Heterogeneous Concepts--A Practical Study Based on the AIGC Short Film: The Meeting-
[pdf]
[supp]
[bibtex]@InProceedings{Hou_2026_CVPR,
  author    = {Hou, Shiqin and Chen, Jiayan and Zhang, Tony and Chen, Baoyang and Rao, Anyi},
  title     = {Visual Composition Generation of Multi-Source Heterogeneous Concepts--A Practical Study Based on the {AIGC} Short Film: {The Meeting}},
  booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR) Workshops},
  month     = jun,
  year      = {2026},
  pages     = {5968--5978},
}
LaDe: Unified Multi-Layered Graphic Media Generation and Decomposition-
[pdf]
[supp]
[bibtex]@InProceedings{Lungu-Stan_2026_CVPR,
  author    = {Lungu-Stan, Vlad-Constantin and Mironic{\u{a}}, Ionu{\textcommabelow{t}} and Georgescu, Mariana-Iuliana},
  title     = {{LaDe}: Unified Multi-Layered Graphic Media Generation and Decomposition},
  booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR) Workshops},
  month     = jun,
  year      = {2026},
  pages     = {6031--6040},
}
Learning Temporal Relations for Evaluating Instruction-Guided Image Editing in Vision-Language Models-
[pdf]
[bibtex]@InProceedings{Donabauer_2026_CVPR,
  author    = {Donabauer, Pia and Tack, Alexander and Kruschwitz, Udo},
  title     = {Learning Temporal Relations for Evaluating Instruction-Guided Image Editing in Vision-Language Models},
  booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR) Workshops},
  month     = jun,
  year      = {2026},
  pages     = {5948--5958},
}
Temporal Environment-Aware Image Generation via Latent Diffusion-
[pdf]
[supp]
[bibtex]@InProceedings{Kalanat_2026_CVPR,
  author    = {Kalanat, Nasrin and Xie, Yiqun and Li, Yanhua and Jia, Xiaowei},
  title     = {Temporal Environment-Aware Image Generation via Latent Diffusion},
  booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR) Workshops},
  month     = jun,
  year      = {2026},
  pages     = {5991--6000},
}
Generating Fit Check Videos with a Handheld Camera-
[pdf]
[supp]
[bibtex]@InProceedings{Chen_2026_CVPR,
  author    = {Chen, Bowei and Curless, Brian and Kemelmacher-Shlizerman, Ira and Seitz, Steven M.},
  title     = {Generating Fit Check Videos with a Handheld Camera},
  booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR) Workshops},
  month     = jun,
  year      = {2026},
  pages     = {5935--5947},
}
Diamonds in the Sky: Pareidolic Animals in Clouds-
[pdf]
[bibtex]@InProceedings{Horovicz_2026_CVPR,
  author    = {Horovicz, Miriam and Hel-Or, Yacov and Moses, Yael},
  title     = {Diamonds in the Sky: Pareidolic Animals in Clouds},
  booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR) Workshops},
  month     = jun,
  year      = {2026},
  pages     = {5959--5967},
}
LumiCtrl: Learning Illuminant Prompts for Lighting Control in Personalized Text-to-Image Models-
[pdf]
[supp]
[bibtex]@InProceedings{Butt_2026_CVPR,
  author    = {Butt, Muhammad Atif and Wang, Kai and Vazquez-Corral, Javier and van de Weijer, Joost},
  title     = {{LumiCtrl}: Learning Illuminant Prompts for Lighting Control in Personalized Text-to-Image Models},
  booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR) Workshops},
  month     = jun,
  year      = {2026},
  pages     = {5925--5934},
}
X-Aligner: Composed Visual Retrieval without the Bells and Whistles-
[pdf]
[arXiv]
[bibtex]@InProceedings{Zheng_2026_CVPR,
  author    = {Zheng, Yuqian and Georgescu, Mariana-Iuliana},
  title     = {{X-Aligner}: Composed Visual Retrieval without the Bells and Whistles},
  booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR) Workshops},
  month     = jun,
  year      = {2026},
  pages     = {6073--6082},
}

