AI for Creative Video Editing and Understanding
Benchmarking Data Efficiency and Computational Efficiency of Temporal Action Localization Models
[pdf]
[arXiv]
[bibtex]
@InProceedings{Warchocki_2023_ICCV,
  author    = {Warchocki, Jan and Oprescu, Teodor and Wang, Yunhan and D{\u{a}}m{\u{a}}cu{\c{s}}, Alexandru and Misterka, Paul and Bruintjes, Robert-Jan and Lengyel, Attila and Strafforello, Ombretta and van Gemert, Jan},
  title     = {Benchmarking Data Efficiency and Computational Efficiency of Temporal Action Localization Models},
  booktitle = {Proceedings of the {IEEE/CVF} International Conference on Computer Vision ({ICCV}) Workshops},
  month     = oct,
  year      = {2023},
  pages     = {3008--3016},
}
Is There Progress in Activity Progress Prediction?
[pdf]
[arXiv]
[bibtex]
@InProceedings{de_Boer_2023_ICCV,
  author    = {de Boer, Frans and van Gemert, Jan C. and Dijkstra, Jouke and Pintea, Silvia L.},
  title     = {Is There Progress in Activity Progress Prediction?},
  booktitle = {Proceedings of the {IEEE/CVF} International Conference on Computer Vision ({ICCV}) Workshops},
  month     = oct,
  year      = {2023},
  pages     = {2958--2966},
}
InFusion: Inject and Attention Fusion for Multi Concept Zero-Shot Text-Based Video Editing
[pdf]
[arXiv]
[bibtex]
@InProceedings{Khandelwal_2023_ICCV,
  author    = {Khandelwal, Anant},
  title     = {{InFusion}: Inject and Attention Fusion for Multi Concept Zero-Shot Text-Based Video Editing},
  booktitle = {Proceedings of the {IEEE/CVF} International Conference on Computer Vision ({ICCV}) Workshops},
  month     = oct,
  year      = {2023},
  pages     = {3017--3026},
}
PAT: Position-Aware Transformer for Dense Multi-Label Action Detection
[pdf]
[arXiv]
[bibtex]
@InProceedings{Sardari_2023_ICCV,
  author    = {Sardari, Faegheh and Mustafa, Armin and Jackson, Philip J. B. and Hilton, Adrian},
  title     = {{PAT}: Position-Aware Transformer for Dense Multi-Label Action Detection},
  booktitle = {Proceedings of the {IEEE/CVF} International Conference on Computer Vision ({ICCV}) Workshops},
  month     = oct,
  year      = {2023},
  pages     = {2988--2997},
}
Expressive Talking Head Video Encoding in StyleGAN2 Latent Space
[pdf]
[supp]
[arXiv]
[bibtex]
@InProceedings{Oorloff_2023_ICCV,
  author    = {Oorloff, Trevine and Yacoob, Yaser},
  title     = {Expressive Talking Head Video Encoding in {StyleGAN2} Latent Space},
  booktitle = {Proceedings of the {IEEE/CVF} International Conference on Computer Vision ({ICCV}) Workshops},
  month     = oct,
  year      = {2023},
  pages     = {2998--3007},
}
Are Current Long-Term Video Understanding Datasets Long-Term?
[pdf]
[arXiv]
[bibtex]
@InProceedings{Strafforello_2023_ICCV,
  author    = {Strafforello, Ombretta and Schutte, Klamer and van Gemert, Jan},
  title     = {Are Current Long-Term Video Understanding Datasets Long-Term?},
  booktitle = {Proceedings of the {IEEE/CVF} International Conference on Computer Vision ({ICCV}) Workshops},
  month     = oct,
  year      = {2023},
  pages     = {2967--2976},
}
VAST: Vivify Your Talking Avatar via Zero-Shot Expressive Facial Style Transfer
[pdf]
[supp]
[arXiv]
[bibtex]
@InProceedings{Chen_2023_ICCV,
  author    = {Chen, Liyang and Wu, Zhiyong and Li, Runnan and Bao, Weihong and Ling, Jun and Tan, Xu and Zhao, Sheng},
  title     = {{VAST}: Vivify Your Talking Avatar via Zero-Shot Expressive Facial Style Transfer},
  booktitle = {Proceedings of the {IEEE/CVF} International Conference on Computer Vision ({ICCV}) Workshops},
  month     = oct,
  year      = {2023},
  pages     = {2977--2987},
}
LEMMS: Label Estimation of Multi-Feature Movie Segments
[pdf]
[bibtex]
@InProceedings{Vacchetti_2023_ICCV,
  author    = {Vacchetti, Bartolomeo and Mureja, Dawit and Cerquitelli, Tania},
  title     = {{LEMMS}: Label Estimation of Multi-Feature Movie Segments},
  booktitle = {Proceedings of the {IEEE/CVF} International Conference on Computer Vision ({ICCV}) Workshops},
  month     = oct,
  year      = {2023},
  pages     = {3027--3035},
}