@inproceedings{gholipour-ghalandari-2017-revisiting,
title = "Revisiting the Centroid-based Method: A Strong Baseline for Multi-Document Summarization",
author = "Gholipour Ghalandari, Demian",
editor = "Wang, Lu and
Cheung, Jackie Chi Kit and
Carenini, Giuseppe and
Liu, Fei",
booktitle = "Proceedings of the Workshop on New Frontiers in Summarization",
month = sep,
year = "2017",
address = "Copenhagen, Denmark",
publisher = "Association for Computational Linguistics",
url = "https://preview.aclanthology.org/jlcl-multiple-ingestion/W17-4511/",
doi = "10.18653/v1/W17-4511",
pages = "85--90",
abstract = "The centroid-based model for extractive document summarization is a simple and fast baseline that ranks sentences based on their similarity to a centroid vector. In this paper, we apply this ranking to possible summaries instead of sentences and use a simple greedy algorithm to find the best summary. Furthermore, we show possibilities to scale up to larger input document collections by selecting a small number of sentences from each document prior to constructing the summary. Experiments were done on the DUC2004 dataset for multi-document summarization. We observe a higher performance over the original model, on par with more complex state-of-the-art methods."
}
Markdown (Informal)
[Revisiting the Centroid-based Method: A Strong Baseline for Multi-Document Summarization](https://preview.aclanthology.org/jlcl-multiple-ingestion/W17-4511/) (Gholipour Ghalandari, 2017)
ACL