CVPR 2024 Open Access Repository

Workshop on Human Motion Generation

Fake It to Make It: Using Synthetic Data to Remedy the Data Shortage in Joint Multimodal Speech-and-Gesture Synthesis: Shivam Mehta,

Anna Deichler,

Jim O'Regan,

Birger Moëll,

Jonas Beskow,

Gustav Eje Henter,

Simon Alexanderson; [pdf] [supp] [arXiv]
[bibtex]
@comment{CVPR 2024 Workshops paper (Workshop on Human Motion Generation).}
@inproceedings{Mehta_2024_CVPR,
  author    = {Mehta, Shivam and Deichler, Anna and O'Regan, Jim and Mo{\"e}ll, Birger and Beskow, Jonas and Henter, Gustav Eje and Alexanderson, Simon},
  title     = {Fake It to Make It: Using Synthetic Data to Remedy the Data Shortage in Joint Multimodal Speech-and-Gesture Synthesis},
  booktitle = {Proceedings of the {IEEE/CVF} Conference on Computer Vision and Pattern Recognition ({CVPR}) Workshops},
  month     = jun,
  year      = {2024},
  pages     = {1952--1964},
}
A Cross-Dataset Study for Text-based 3D Human Motion Retrieval: Léore Bensabath,

Mathis Petrovich,

Gul Varol; [pdf] [arXiv]
[bibtex]
@comment{CVPR 2024 Workshops paper (Workshop on Human Motion Generation).}
@inproceedings{Bensabath_2024_CVPR,
  author    = {Bensabath, L{\'e}ore and Petrovich, Mathis and Varol, Gul},
  title     = {A Cross-Dataset Study for Text-based {3D} Human Motion Retrieval},
  booktitle = {Proceedings of the {IEEE/CVF} Conference on Computer Vision and Pattern Recognition ({CVPR}) Workshops},
  month     = jun,
  year      = {2024},
  pages     = {1932--1940},
}
Exploring Text-to-Motion Generation with Human Preference: Jenny Sheng,

Matthieu Lin,

Andrew Zhao,

Kevin Pruvost,

Yu-Hui Wen,

Yangguang Li,

Gao Huang,

Yong-Jin Liu; [pdf] [supp] [arXiv]
[bibtex]
@comment{CVPR 2024 Workshops paper (Workshop on Human Motion Generation).}
@inproceedings{Sheng_2024_CVPR,
  author    = {Sheng, Jenny and Lin, Matthieu and Zhao, Andrew and Pruvost, Kevin and Wen, Yu-Hui and Li, Yangguang and Huang, Gao and Liu, Yong-Jin},
  title     = {Exploring Text-to-Motion Generation with Human Preference},
  booktitle = {Proceedings of the {IEEE/CVF} Conference on Computer Vision and Pattern Recognition ({CVPR}) Workshops},
  month     = jun,
  year      = {2024},
  pages     = {1888--1899},
}
Speech2UnifiedExpressions: Synchronous Synthesis of Co-Speech Affective Face and Body Expressions from Affordable Inputs: Uttaran Bhattacharya,

Aniket Bera,

Dinesh Manocha; [pdf] [supp] [arXiv]
[bibtex]
@comment{CVPR 2024 Workshops paper (Workshop on Human Motion Generation).}
@inproceedings{Bhattacharya_2024_CVPR,
  author    = {Bhattacharya, Uttaran and Bera, Aniket and Manocha, Dinesh},
  title     = {{Speech2UnifiedExpressions}: Synchronous Synthesis of Co-Speech Affective Face and Body Expressions from Affordable Inputs},
  booktitle = {Proceedings of the {IEEE/CVF} Conference on Computer Vision and Pattern Recognition ({CVPR}) Workshops},
  month     = jun,
  year      = {2024},
  pages     = {1877--1887},
}
in2IN: Leveraging Individual Information to Generate Human INteractions: Pablo Ruiz-Ponce,

German Barquero,

Cristina Palmero,

Sergio Escalera,

José García-Rodríguez; [pdf] [supp]
[bibtex]
@comment{CVPR 2024 Workshops paper (Workshop on Human Motion Generation).}
@inproceedings{Ruiz-Ponce_2024_CVPR,
  author    = {Ruiz-Ponce, Pablo and Barquero, German and Palmero, Cristina and Escalera, Sergio and Garc{\'\i}a-Rodr{\'\i}guez, Jos{\'e}},
  title     = {{in2IN}: Leveraging Individual Information to Generate Human {INteractions}},
  booktitle = {Proceedings of the {IEEE/CVF} Conference on Computer Vision and Pattern Recognition ({CVPR}) Workshops},
  month     = jun,
  year      = {2024},
  pages     = {1941--1951},
}
Multi-Track Timeline Control for Text-Driven 3D Human Motion Generation: Mathis Petrovich,

Or Litany,

Umar Iqbal,

Michael J. Black,

Gul Varol,

Xue Bin Peng,

Davis Rempe; [pdf] [supp] [arXiv]
[bibtex]
@comment{CVPR 2024 Workshops paper (Workshop on Human Motion Generation).}
@inproceedings{Petrovich_2024_CVPR,
  author    = {Petrovich, Mathis and Litany, Or and Iqbal, Umar and Black, Michael J. and Varol, Gul and Peng, Xue Bin and Rempe, Davis},
  title     = {Multi-Track Timeline Control for Text-Driven {3D} Human Motion Generation},
  booktitle = {Proceedings of the {IEEE/CVF} Conference on Computer Vision and Pattern Recognition ({CVPR}) Workshops},
  month     = jun,
  year      = {2024},
  pages     = {1911--1921},
}
Two-Person Interaction Augmentation with Skeleton Priors: Baiyi Li,

Edmond S. L. Ho,

Hubert P. H. Shum,

He Wang; [pdf] [supp] [arXiv]
[bibtex]
@comment{CVPR 2024 Workshops paper (Workshop on Human Motion Generation).}
@inproceedings{Li_2024_CVPR,
  author    = {Li, Baiyi and Ho, Edmond S. L. and Shum, Hubert P. H. and Wang, He},
  title     = {Two-Person Interaction Augmentation with Skeleton Priors},
  booktitle = {Proceedings of the {IEEE/CVF} Conference on Computer Vision and Pattern Recognition ({CVPR}) Workshops},
  month     = jun,
  year      = {2024},
  pages     = {1900--1910},
}
T2LM: Long-Term 3D Human Motion Generation from Multiple Sentences: Taeryung Lee,

Fabien Baradel,

Thomas Lucas,

Kyoung Mu Lee,

Grégory Rogez; [pdf] [arXiv]
[bibtex]
@comment{CVPR 2024 Workshops paper (Workshop on Human Motion Generation).}
@inproceedings{Lee_2024_CVPR,
  author    = {Lee, Taeryung and Baradel, Fabien and Lucas, Thomas and Lee, Kyoung Mu and Rogez, Gr{\'e}gory},
  title     = {{T2LM}: Long-Term {3D} Human Motion Generation from Multiple Sentences},
  booktitle = {Proceedings of the {IEEE/CVF} Conference on Computer Vision and Pattern Recognition ({CVPR}) Workshops},
  month     = jun,
  year      = {2024},
  pages     = {1867--1876},
}
DiffTED: One-shot Audio-driven TED Talk Video Generation with Diffusion-based Co-speech Gestures: Steven Hogue,

Chenxu Zhang,

Hamza Daruger,

Yapeng Tian,

Xiaohu Guo; [pdf] [supp]
[bibtex]
@comment{CVPR 2024 Workshops paper (Workshop on Human Motion Generation).}
@inproceedings{Hogue_2024_CVPR,
  author    = {Hogue, Steven and Zhang, Chenxu and Daruger, Hamza and Tian, Yapeng and Guo, Xiaohu},
  title     = {{DiffTED}: One-shot Audio-driven {TED} Talk Video Generation with Diffusion-based Co-speech Gestures},
  booktitle = {Proceedings of the {IEEE/CVF} Conference on Computer Vision and Pattern Recognition ({CVPR}) Workshops},
  month     = jun,
  year      = {2024},
  pages     = {1922--1931},
}