1st Workshop on Long Multi-Scene Video Foundations


A Survey on Long-Video Storytelling Generation: Architectures, Consistency, and Cinematic Quality
Mohamed Elmoghany,
Ryan Rossi,
Seunghyun Yoon,
Subhojyoti Mukherjee,
Eslam Mohamed Bakr,
Puneet Mathur,
Gang Wu,
Viet Dac Lai,
Nedim Lipka,
Ruiyi Zhang,
Varun Manjunatha,
Chien Van Nguyen,
Daksh Dangi,
Abel Salinas,
Hongjie Chen,
Xiaolei Huang,
Joe Barrow,
Nesreen Ahmed,
Hoda Eldardiry,
Namyong Park,
Yu Wang,
Zhengzhong Tu,
Thien Huu Nguyen,
Dinesh Manocha,
Mohamed Elhoseiny,
Franck Dernoncourt
[pdf] [supp] [arXiv]
[bibtex]
@inproceedings{Elmoghany_2025_ICCV,
  author    = {Elmoghany, Mohamed and
               Rossi, Ryan and
               Yoon, Seunghyun and
               Mukherjee, Subhojyoti and
               Bakr, Eslam Mohamed and
               Mathur, Puneet and
               Wu, Gang and
               Lai, Viet Dac and
               Lipka, Nedim and
               Zhang, Ruiyi and
               Manjunatha, Varun and
               Nguyen, Chien Van and
               Dangi, Daksh and
               Salinas, Abel and
               Chen, Hongjie and
               Huang, Xiaolei and
               Barrow, Joe and
               Ahmed, Nesreen and
               Eldardiry, Hoda and
               Park, Namyong and
               Wang, Yu and
               Tu, Zhengzhong and
               Nguyen, Thien Huu and
               Manocha, Dinesh and
               Elhoseiny, Mohamed and
               Dernoncourt, Franck},
  title     = {A Survey on Long-Video Storytelling Generation: Architectures, Consistency, and Cinematic Quality},
  booktitle = {Proceedings of the {IEEE/CVF} International Conference on Computer Vision ({ICCV}) Workshops},
  month     = oct,
  year      = {2025},
  pages     = {7023--7035},
}

Reinforcement Learning meets Masked Video Modeling : Trajectory-Guided Adaptive Token Selection
Ayush K. Rai,
Kyle Min,
Tarun Krishna,
Feiyan Hu,
Alan F. Smeaton,
Noel O'Connor
[pdf] [supp] [arXiv]
[bibtex]
@inproceedings{Rai_2025_ICCV,
  author    = {Rai, Ayush K. and
               Min, Kyle and
               Krishna, Tarun and
               Hu, Feiyan and
               Smeaton, Alan F. and
               O'Connor, Noel},
  title     = {Reinforcement Learning meets Masked Video Modeling : Trajectory-Guided Adaptive Token Selection},
  booktitle = {Proceedings of the {IEEE/CVF} International Conference on Computer Vision ({ICCV}) Workshops},
  month     = oct,
  year      = {2025},
  pages     = {7012--7022},
}