The First Workshop on the Evaluation of Generative Foundation Models


T2VBench: Benchmarking Temporal Dynamics for Text-to-Video Generation
Pengliang Ji,
Chuyang Xiao,
Huilin Tai,
Mingxiao Huo
[pdf]
[bibtex]
@InProceedings{Ji_2024_CVPR,
  author    = {Ji, Pengliang and Xiao, Chuyang and Tai, Huilin and Huo, Mingxiao},
  title     = {{T2VBench}: Benchmarking Temporal Dynamics for Text-to-Video Generation},
  booktitle = {Proceedings of the {IEEE/CVF} Conference on Computer Vision and Pattern Recognition ({CVPR}) Workshops},
  month     = jun,
  year      = {2024},
  pages     = {5325--5335},
}

Diagnostic Benchmark and Iterative Inpainting for Layout-Guided Image Generation
Jaemin Cho,
Linjie Li,
Zhengyuan Yang,
Zhe Gan,
Lijuan Wang,
Mohit Bansal
[pdf] [supp] [arXiv]
[bibtex]
@InProceedings{Cho_2024_CVPR,
  author    = {Cho, Jaemin and Li, Linjie and Yang, Zhengyuan and Gan, Zhe and Wang, Lijuan and Bansal, Mohit},
  title     = {Diagnostic Benchmark and Iterative Inpainting for Layout-Guided Image Generation},
  booktitle = {Proceedings of the {IEEE/CVF} Conference on Computer Vision and Pattern Recognition ({CVPR}) Workshops},
  month     = jun,
  year      = {2024},
  pages     = {5280--5289},
}

TlTScore: Towards Long-Tail Effects in Text-to-Visual Evaluation with Generative Foundation Models
Pengliang Ji,
Junchen Liu
[pdf]
[bibtex]
@InProceedings{Ji_2024_CVPR_TlTScore,
  author    = {Ji, Pengliang and Liu, Junchen},
  title     = {{TlTScore}: Towards Long-Tail Effects in Text-to-Visual Evaluation with Generative Foundation Models},
  booktitle = {Proceedings of the {IEEE/CVF} Conference on Computer Vision and Pattern Recognition ({CVPR}) Workshops},
  month     = jun,
  year      = {2024},
  pages     = {5302--5313},
}

Evaluating and Improving Compositional Text-to-Visual Generation
Baiqi Li,
Zhiqiu Lin,
Deepak Pathak,
Jiayao Li,
Yixin Fei,
Kewen Wu,
Xide Xia,
Pengchuan Zhang,
Graham Neubig,
Deva Ramanan
[pdf] [supp]
[bibtex]
@InProceedings{Li_2024_CVPR,
  author    = {Li, Baiqi and Lin, Zhiqiu and Pathak, Deepak and Li, Jiayao and Fei, Yixin and Wu, Kewen and Xia, Xide and Zhang, Pengchuan and Neubig, Graham and Ramanan, Deva},
  title     = {Evaluating and Improving Compositional Text-to-Visual Generation},
  booktitle = {Proceedings of the {IEEE/CVF} Conference on Computer Vision and Pattern Recognition ({CVPR}) Workshops},
  month     = jun,
  year      = {2024},
  pages     = {5290--5301},
}

Evaluating Multimodal Large Language Models Across Distribution Shifts and Augmentations
Aayush Atul Verma,
Amir Saeidi,
Shamanthak Hegde,
Ajay Therala,
Fenil Denish Bardoliya,
Nagaraju Machavarapu,
Shri Ajay Kumar Ravindhiran,
Srija Malyala,
Agneet Chatterjee,
Yezhou Yang,
Chitta Baral
[pdf]
[bibtex]
@InProceedings{Verma_2024_CVPR,
  author    = {Verma, Aayush Atul and Saeidi, Amir and Hegde, Shamanthak and Therala, Ajay and Bardoliya, Fenil Denish and Machavarapu, Nagaraju and Ravindhiran, Shri Ajay Kumar and Malyala, Srija and Chatterjee, Agneet and Yang, Yezhou and Baral, Chitta},
  title     = {Evaluating Multimodal Large Language Models Across Distribution Shifts and Augmentations},
  booktitle = {Proceedings of the {IEEE/CVF} Conference on Computer Vision and Pattern Recognition ({CVPR}) Workshops},
  month     = jun,
  year      = {2024},
  pages     = {5314--5324},
}