@inproceedings{gella-etal-2018-dataset,
title = "A Dataset for Telling the Stories of Social Media Videos",
author = "Gella, Spandana and
Lewis, Mike and
Rohrbach, Marcus",
editor = "Riloff, Ellen and
Chiang, David and
Hockenmaier, Julia and
Tsujii, Jun{'}ichi",
booktitle = "Proceedings of the 2018 Conference on Empirical Methods in Natural Language Processing",
month = oct # "-" # nov,
year = "2018",
address = "Brussels, Belgium",
publisher = "Association for Computational Linguistics",
url = "https://preview.aclanthology.org/jlcl-multiple-ingestion/D18-1117/",
doi = "10.18653/v1/D18-1117",
pages = "968--974",
abstract = "Video content on social media platforms constitutes a major part of the communication between people, as it allows everyone to share their stories. However, if someone is unable to consume video, either due to a disability or network bandwidth, this severely limits their participation and communication. Automatically telling the stories using multi-sentence descriptions of videos would allow bridging this gap. To learn and evaluate such models, we introduce VideoStory a new large-scale dataset for video description as a new challenge for multi-sentence video description. Our VideoStory captions dataset is complementary to prior work and contains 20k videos posted publicly on a social media platform amounting to 396 hours of video with 123k sentences, temporally aligned to the video."
}
Markdown (Informal)
[A Dataset for Telling the Stories of Social Media Videos](https://preview.aclanthology.org/jlcl-multiple-ingestion/D18-1117/) (Gella et al., EMNLP 2018)
ACL
- Spandana Gella, Mike Lewis, and Marcus Rohrbach. 2018. A Dataset for Telling the Stories of Social Media Videos. In Proceedings of the 2018 Conference on Empirical Methods in Natural Language Processing, pages 968–974, Brussels, Belgium. Association for Computational Linguistics.