Workshop on Human Motion Generation
Fake It to Make It: Using Synthetic Data to Remedy the Data Shortage in Joint Multimodal Speech-and-Gesture Synthesis-
[pdf]
[supp]
[arXiv]
[bibtex]
% Workshop paper in the CVPR 2024 Workshops proceedings (key unchanged).
% Accents use BibTeX special-character form so sorting and labels work.
% NOTE(review): surname capitalised as O'Regan (was O'regan) -- confirm against the paper.
@InProceedings{Mehta_2024_CVPR,
  author    = {Mehta, Shivam and Deichler, Anna and O'Regan, Jim and Mo{\"e}ll, Birger and Beskow, Jonas and Henter, Gustav Eje and Alexanderson, Simon},
  title     = {Fake It to Make It: Using Synthetic Data to Remedy the Data Shortage in Joint Multimodal Speech-and-Gesture Synthesis},
  booktitle = {Proceedings of the {IEEE/CVF} Conference on Computer Vision and Pattern Recognition ({CVPR}) Workshops},
  month     = jun,
  year      = {2024},
  pages     = {1952--1964},
}
A Cross-Dataset Study for Text-based 3D Human Motion Retrieval-
[pdf]
[arXiv]
[bibtex]
% Workshop paper in the CVPR 2024 Workshops proceedings (key unchanged).
% Braced words in the title keep their case under sentence-casing styles.
@InProceedings{Bensabath_2024_CVPR,
  author    = {Bensabath, L{\'e}ore and Petrovich, Mathis and Varol, Gul},
  title     = {A Cross-Dataset Study for Text-based {3D} Human Motion Retrieval},
  booktitle = {Proceedings of the {IEEE/CVF} Conference on Computer Vision and Pattern Recognition ({CVPR}) Workshops},
  month     = jun,
  year      = {2024},
  pages     = {1932--1940},
}
Exploring Text-to-Motion Generation with Human Preference-
[pdf]
[supp]
[arXiv]
[bibtex]
% Workshop paper in the CVPR 2024 Workshops proceedings (key unchanged).
% Page range uses an en-dash (--); month uses the predefined jun macro.
@InProceedings{Sheng_2024_CVPR,
  author    = {Sheng, Jenny and Lin, Matthieu and Zhao, Andrew and Pruvost, Kevin and Wen, Yu-Hui and Li, Yangguang and Huang, Gao and Liu, Yong-Jin},
  title     = {Exploring Text-to-Motion Generation with Human Preference},
  booktitle = {Proceedings of the {IEEE/CVF} Conference on Computer Vision and Pattern Recognition ({CVPR}) Workshops},
  month     = jun,
  year      = {2024},
  pages     = {1888--1899},
}
Speech2UnifiedExpressions: Synchronous Synthesis of Co-Speech Affective Face and Body Expressions from Affordable Inputs-
[pdf]
[supp]
[arXiv]
[bibtex]
% Workshop paper in the CVPR 2024 Workshops proceedings (key unchanged).
% The camelCase method name is braced so sentence-casing styles do not lowercase it.
@InProceedings{Bhattacharya_2024_CVPR,
  author    = {Bhattacharya, Uttaran and Bera, Aniket and Manocha, Dinesh},
  title     = {{Speech2UnifiedExpressions}: Synchronous Synthesis of Co-Speech Affective Face and Body Expressions from Affordable Inputs},
  booktitle = {Proceedings of the {IEEE/CVF} Conference on Computer Vision and Pattern Recognition ({CVPR}) Workshops},
  month     = jun,
  year      = {2024},
  pages     = {1877--1887},
}
in2IN: Leveraging Individual Information to Generate Human INteractions-
[pdf]
[supp]
[bibtex]
% Workshop paper in the CVPR 2024 Workshops proceedings (key unchanged).
% Mixed-case words in the title are braced to survive sentence-casing styles;
% all accents use BibTeX special-character form.
@InProceedings{Ruiz-Ponce_2024_CVPR,
  author    = {Ruiz-Ponce, Pablo and Barquero, German and Palmero, Cristina and Escalera, Sergio and Garc{\'\i}a-Rodr{\'\i}guez, Jos{\'e}},
  title     = {{in2IN}: Leveraging Individual Information to Generate Human {INteractions}},
  booktitle = {Proceedings of the {IEEE/CVF} Conference on Computer Vision and Pattern Recognition ({CVPR}) Workshops},
  month     = jun,
  year      = {2024},
  pages     = {1941--1951},
}
Multi-Track Timeline Control for Text-Driven 3D Human Motion Generation-
[pdf]
[supp]
[arXiv]
[bibtex]
% Workshop paper in the CVPR 2024 Workshops proceedings (key unchanged).
% NOTE(review): author re-split as "Peng, Xue Bin" (was "Bin Peng, Xue", which
% BibTeX parses with surname "Bin Peng") -- confirm against the paper.
@InProceedings{Petrovich_2024_CVPR,
  author    = {Petrovich, Mathis and Litany, Or and Iqbal, Umar and Black, Michael J. and Varol, Gul and Peng, Xue Bin and Rempe, Davis},
  title     = {Multi-Track Timeline Control for Text-Driven {3D} Human Motion Generation},
  booktitle = {Proceedings of the {IEEE/CVF} Conference on Computer Vision and Pattern Recognition ({CVPR}) Workshops},
  month     = jun,
  year      = {2024},
  pages     = {1911--1921},
}
Two-Person Interaction Augmentation with Skeleton Priors-
[pdf]
[supp]
[arXiv]
[bibtex]
% Workshop paper in the CVPR 2024 Workshops proceedings (key unchanged).
% Page range uses an en-dash (--); month uses the predefined jun macro.
@InProceedings{Li_2024_CVPR,
  author    = {Li, Baiyi and Ho, Edmond S. L. and Shum, Hubert P. H. and Wang, He},
  title     = {Two-Person Interaction Augmentation with Skeleton Priors},
  booktitle = {Proceedings of the {IEEE/CVF} Conference on Computer Vision and Pattern Recognition ({CVPR}) Workshops},
  month     = jun,
  year      = {2024},
  pages     = {1900--1910},
}
T2LM: Long-Term 3D Human Motion Generation from Multiple Sentences-
[pdf]
[arXiv]
[bibtex]
% Workshop paper in the CVPR 2024 Workshops proceedings (key unchanged).
% NOTE(review): given name written with an acute accent (was a grave accent) --
% confirm against the paper.
@InProceedings{Lee_2024_CVPR,
  author    = {Lee, Taeryung and Baradel, Fabien and Lucas, Thomas and Lee, Kyoung Mu and Rogez, Gr{\'e}gory},
  title     = {{T2LM}: Long-Term {3D} Human Motion Generation from Multiple Sentences},
  booktitle = {Proceedings of the {IEEE/CVF} Conference on Computer Vision and Pattern Recognition ({CVPR}) Workshops},
  month     = jun,
  year      = {2024},
  pages     = {1867--1876},
}
DiffTED: One-shot Audio-driven TED Talk Video Generation with Diffusion-based Co-speech Gestures-
[pdf]
[supp]
[bibtex]
% Workshop paper in the CVPR 2024 Workshops proceedings (key unchanged).
% The method name and the TED acronym are braced to survive sentence-casing styles.
@InProceedings{Hogue_2024_CVPR,
  author    = {Hogue, Steven and Zhang, Chenxu and Daruger, Hamza and Tian, Yapeng and Guo, Xiaohu},
  title     = {{DiffTED}: One-shot Audio-driven {TED} Talk Video Generation with Diffusion-based Co-speech Gestures},
  booktitle = {Proceedings of the {IEEE/CVF} Conference on Computer Vision and Pattern Recognition ({CVPR}) Workshops},
  month     = jun,
  year      = {2024},
  pages     = {1922--1931},
}