% Yu, Bansal and Berg (EMNLP 2017): hierarchically-attentive RNN for album
% summarization and storytelling.
% The url field uses the canonical ACL Anthology address rather than a
% preview/staging build; the doi field is the stable identifier.
@inproceedings{yu-etal-2017-hierarchically,
  title     = {Hierarchically-Attentive {RNN} for Album Summarization and Storytelling},
  author    = {Yu, Licheng and
               Bansal, Mohit and
               Berg, Tamara},
  editor    = {Palmer, Martha and
               Hwa, Rebecca and
               Riedel, Sebastian},
  booktitle = {Proceedings of the 2017 Conference on Empirical Methods in Natural Language Processing},
  month     = sep,
  year      = {2017},
  address   = {Copenhagen, Denmark},
  publisher = {Association for Computational Linguistics},
  url       = {https://aclanthology.org/D17-1101/},
  doi       = {10.18653/v1/D17-1101},
  pages     = {966--971},
  abstract  = {We address the problem of end-to-end visual storytelling. Given a photo album, our model first selects the most representative (summary) photos, and then composes a natural language story for the album. For this task, we make use of the Visual Storytelling dataset and a model composed of three hierarchically-attentive Recurrent Neural Nets (RNNs) to: encode the album photos, select representative (summary) photos, and compose the story. Automatic and human evaluations show our model achieves better performance on selection, generation, and retrieval than baselines.},
}
Markdown (Informal)
[Hierarchically-Attentive RNN for Album Summarization and Storytelling](https://aclanthology.org/D17-1101/) (Yu et al., EMNLP 2017)
ACL