Workshop on Human Motion Generation


Fake It to Make It: Using Synthetic Data to Remedy the Data Shortage in Joint Multimodal Speech-and-Gesture Synthesis
Shivam Mehta,
Anna Deichler,
Jim O'regan,
Birger Moëll,
Jonas Beskow,
Gustav Eje Henter,
Simon Alexanderson
[pdf] [supp] [arXiv]
[bibtex]
% CVPR 2024 Workshops paper. Accented letters are written as brace-wrapped
% special characters, month uses the standard macro, and pages use "--".
@InProceedings{Mehta_2024_CVPR,
  author    = {Mehta, Shivam and Deichler, Anna and O'regan, Jim and Mo{\"e}ll, Birger and Beskow, Jonas and Henter, Gustav Eje and Alexanderson, Simon},
  title     = {Fake It to Make It: Using Synthetic Data to Remedy the Data Shortage in Joint Multimodal Speech-and-Gesture Synthesis},
  booktitle = {Proceedings of the {IEEE/CVF} Conference on Computer Vision and Pattern Recognition ({CVPR}) Workshops},
  month     = jun,
  year      = {2024},
  pages     = {1952--1964}
}

A Cross-Dataset Study for Text-based 3D Human Motion Retrieval
Léore Bensabath,
Mathis Petrovich,
Gul Varol
[pdf] [arXiv]
[bibtex]
% CVPR 2024 Workshops paper. "3D" is brace-protected against style recasing;
% the accent is a brace-wrapped special character; pages use "--".
@InProceedings{Bensabath_2024_CVPR,
  author    = {Bensabath, L{\'e}ore and Petrovich, Mathis and Varol, Gul},
  title     = {A Cross-Dataset Study for Text-based {3D} Human Motion Retrieval},
  booktitle = {Proceedings of the {IEEE/CVF} Conference on Computer Vision and Pattern Recognition ({CVPR}) Workshops},
  month     = jun,
  year      = {2024},
  pages     = {1932--1940}
}

Exploring Text-to-Motion Generation with Human Preference
Jenny Sheng,
Matthieu Lin,
Andrew Zhao,
Kevin Pruvost,
Yu-Hui Wen,
Yangguang Li,
Gao Huang,
Yong-Jin Liu
[pdf] [supp] [arXiv]
[bibtex]
% CVPR 2024 Workshops paper. Month uses the standard macro and the page
% range uses "--" so styles typeset it as an en dash.
@InProceedings{Sheng_2024_CVPR,
  author    = {Sheng, Jenny and Lin, Matthieu and Zhao, Andrew and Pruvost, Kevin and Wen, Yu-Hui and Li, Yangguang and Huang, Gao and Liu, Yong-Jin},
  title     = {Exploring Text-to-Motion Generation with Human Preference},
  booktitle = {Proceedings of the {IEEE/CVF} Conference on Computer Vision and Pattern Recognition ({CVPR}) Workshops},
  month     = jun,
  year      = {2024},
  pages     = {1888--1899}
}

Speech2UnifiedExpressions: Synchronous Synthesis of Co-Speech Affective Face and Body Expressions from Affordable Inputs
Uttaran Bhattacharya,
Aniket Bera,
Dinesh Manocha
[pdf] [supp] [arXiv]
[bibtex]
% CVPR 2024 Workshops paper. The camel-case method name is brace-protected so
% sentence-casing styles keep its capitals; pages use "--".
@InProceedings{Bhattacharya_2024_CVPR,
  author    = {Bhattacharya, Uttaran and Bera, Aniket and Manocha, Dinesh},
  title     = {{Speech2UnifiedExpressions}: Synchronous Synthesis of Co-Speech Affective Face and Body Expressions from Affordable Inputs},
  booktitle = {Proceedings of the {IEEE/CVF} Conference on Computer Vision and Pattern Recognition ({CVPR}) Workshops},
  month     = jun,
  year      = {2024},
  pages     = {1877--1887}
}

in2IN: Leveraging Individual Information to Generate Human INteractions
Pablo Ruiz-Ponce,
German Barquero,
Cristina Palmero,
Sergio Escalera,
José García-Rodríguez
[pdf] [supp]
[bibtex]
% CVPR 2024 Workshops paper. "in2IN" and "INteractions" carry deliberate
% mixed case and are brace-protected; all accents are brace-wrapped special
% characters; pages use "--".
@InProceedings{Ruiz-Ponce_2024_CVPR,
  author    = {Ruiz-Ponce, Pablo and Barquero, German and Palmero, Cristina and Escalera, Sergio and Garc{\'\i}a-Rodr{\'\i}guez, Jos{\'e}},
  title     = {{in2IN}: Leveraging Individual Information to Generate Human {INteractions}},
  booktitle = {Proceedings of the {IEEE/CVF} Conference on Computer Vision and Pattern Recognition ({CVPR}) Workshops},
  month     = jun,
  year      = {2024},
  pages     = {1941--1951}
}

Multi-Track Timeline Control for Text-Driven 3D Human Motion Generation
Mathis Petrovich,
Or Litany,
Umar Iqbal,
Michael J. Black,
Gul Varol,
Xue Bin Peng,
Davis Rempe
[pdf] [supp] [arXiv]
[bibtex]
% CVPR 2024 Workshops paper. NOTE(review): the sixth author is entered as
% "Peng, Xue Bin" (surname Peng), not "Bin Peng, Xue" -- confirm against the
% paper. "3D" is brace-protected; pages use "--".
@InProceedings{Petrovich_2024_CVPR,
  author    = {Petrovich, Mathis and Litany, Or and Iqbal, Umar and Black, Michael J. and Varol, Gul and Peng, Xue Bin and Rempe, Davis},
  title     = {Multi-Track Timeline Control for Text-Driven {3D} Human Motion Generation},
  booktitle = {Proceedings of the {IEEE/CVF} Conference on Computer Vision and Pattern Recognition ({CVPR}) Workshops},
  month     = jun,
  year      = {2024},
  pages     = {1911--1921}
}

Two-Person Interaction Augmentation with Skeleton Priors
Baiyi Li,
Edmond S. L. Ho,
Hubert P. H. Shum,
He Wang
[pdf] [supp] [arXiv]
[bibtex]
% CVPR 2024 Workshops paper. Month uses the standard macro and the page
% range uses "--" so styles typeset it as an en dash.
@InProceedings{Li_2024_CVPR,
  author    = {Li, Baiyi and Ho, Edmond S. L. and Shum, Hubert P. H. and Wang, He},
  title     = {Two-Person Interaction Augmentation with Skeleton Priors},
  booktitle = {Proceedings of the {IEEE/CVF} Conference on Computer Vision and Pattern Recognition ({CVPR}) Workshops},
  month     = jun,
  year      = {2024},
  pages     = {1900--1910}
}

T2LM: Long-Term 3D Human Motion Generation from Multiple Sentences
Taeryung Lee,
Fabien Baradel,
Thomas Lucas,
Kyoung Mu Lee,
Grègory Rogez
[pdf] [arXiv]
[bibtex]
% CVPR 2024 Workshops paper. "T2LM" and "3D" are brace-protected against
% style recasing; the accent is a brace-wrapped special character; pages
% use "--".
@InProceedings{Lee_2024_CVPR,
  author    = {Lee, Taeryung and Baradel, Fabien and Lucas, Thomas and Lee, Kyoung Mu and Rogez, Gr{\`e}gory},
  title     = {{T2LM}: Long-Term {3D} Human Motion Generation from Multiple Sentences},
  booktitle = {Proceedings of the {IEEE/CVF} Conference on Computer Vision and Pattern Recognition ({CVPR}) Workshops},
  month     = jun,
  year      = {2024},
  pages     = {1867--1876}
}

DiffTED: One-shot Audio-driven TED Talk Video Generation with Diffusion-based Co-speech Gestures
Steven Hogue,
Chenxu Zhang,
Hamza Daruger,
Yapeng Tian,
Xiaohu Guo
[pdf] [supp]
[bibtex]
% CVPR 2024 Workshops paper. "DiffTED" and "TED" are brace-protected so
% sentence-casing styles keep their capitals; pages use "--".
@InProceedings{Hogue_2024_CVPR,
  author    = {Hogue, Steven and Zhang, Chenxu and Daruger, Hamza and Tian, Yapeng and Guo, Xiaohu},
  title     = {{DiffTED}: One-shot Audio-driven {TED} Talk Video Generation with Diffusion-based Co-speech Gestures},
  booktitle = {Proceedings of the {IEEE/CVF} Conference on Computer Vision and Pattern Recognition ({CVPR}) Workshops},
  month     = jun,
  year      = {2024},
  pages     = {1922--1931}
}