Multi-Modal Learning from Videos


Grounded Video Description
Luowei Zhou,
Yannis Kalantidis,
Xinlei Chen,
Jason Corso,
Marcus Rohrbach
[pdf]
[bibtex]
@InProceedings{Zhou_2019_CVPR_Workshops,
  author    = {Zhou, Luowei and Kalantidis, Yannis and Chen, Xinlei and Corso, Jason and Rohrbach, Marcus},
  title     = {Grounded Video Description},
  booktitle = {The {IEEE} Conference on Computer Vision and Pattern Recognition ({CVPR}) Workshops},
  month     = jun,
  year      = {2019},
}

The Emotionally Intelligent Robot: Improving Socially-aware Human Prediction in Crowded Environments
Aniket Bera,
Tanmay Randhavane,
Dinesh Manocha
[pdf]
[bibtex]
@InProceedings{Bera_2019_CVPR_Workshops,
  author    = {Bera, Aniket and Randhavane, Tanmay and Manocha, Dinesh},
  title     = {The Emotionally Intelligent Robot: Improving Socially-aware Human Prediction in Crowded Environments},
  booktitle = {The {IEEE} Conference on Computer Vision and Pattern Recognition ({CVPR}) Workshops},
  month     = jun,
  year      = {2019},
}

Self-Supervised Segmentation and Source Separation on Videos
Andrew Rouditchenko,
Hang Zhao,
Chuang Gan,
Josh McDermott,
Antonio Torralba
[pdf]
[bibtex]
@InProceedings{Rouditchenko_2019_CVPR_Workshops,
  author    = {Rouditchenko, Andrew and Zhao, Hang and Gan, Chuang and McDermott, Josh and Torralba, Antonio},
  title     = {Self-Supervised Segmentation and Source Separation on Videos},
  booktitle = {The {IEEE} Conference on Computer Vision and Pattern Recognition ({CVPR}) Workshops},
  month     = jun,
  year      = {2019},
}

Adversarial Inference for Multi-Sentence Video Description
Jae Sung Park,
Marcus Rohrbach,
Trevor Darrell,
Anna Rohrbach
[pdf]
[bibtex]
% First author's surname is Park (given names: Jae Sung), matching the citation key.
@InProceedings{Park_2019_CVPR_Workshops,
  author    = {Park, Jae Sung and Rohrbach, Marcus and Darrell, Trevor and Rohrbach, Anna},
  title     = {Adversarial Inference for Multi-Sentence Video Description},
  booktitle = {The {IEEE} Conference on Computer Vision and Pattern Recognition ({CVPR}) Workshops},
  month     = jun,
  year      = {2019},
}

2.5D Visual Sound
Ruohan Gao,
Kristen Grauman
[pdf]
[bibtex]
@InProceedings{Gao_2019_CVPR_Workshops,
  author    = {Gao, Ruohan and Grauman, Kristen},
  title     = {{2.5D} Visual Sound},
  booktitle = {The {IEEE} Conference on Computer Vision and Pattern Recognition ({CVPR}) Workshops},
  month     = jun,
  year      = {2019},
}