% Workshop paper from the 4th New Frontiers in Summarization Workshop (2023).
% The url field uses the permanent ACL Anthology address (matching the DOI
% suffix) rather than a temporary preview build; {Shapley} is braced so that
% sentence-casing bibliography styles keep the proper noun capitalised.
@inproceedings{he-etal-2023-analyzing,
  title     = {Analyzing Multi-Sentence Aggregation in Abstractive Summarization via the {Shapley} Value},
  author    = {He, Jingyi and
               Cao, Meng and
               Cheung, Jackie Chi Kit},
  editor    = {Dong, Yue and
               Xiao, Wen and
               Wang, Lu and
               Liu, Fei and
               Carenini, Giuseppe},
  booktitle = {Proceedings of the 4th New Frontiers in Summarization Workshop},
  month     = dec,
  year      = {2023},
  address   = {Singapore},
  publisher = {Association for Computational Linguistics},
  url       = {https://aclanthology.org/2023.newsum-1.12/},
  doi       = {10.18653/v1/2023.newsum-1.12},
  pages     = {121--134},
  abstract  = {Abstractive summarization systems aim to write concise summaries capturing the most essential information of the input document in their own words. One of the ways to achieve this is to gather and combine multiple pieces of information from the source document, a process we call aggregation. Despite its importance, the extent to which both reference summaries in benchmark datasets and system-generated summaries require aggregation is yet unknown. In this work, we propose AggSHAP, a measure of the degree of aggregation in a summary sentence. We show that AggSHAP distinguishes multi-sentence aggregation from single-sentence extraction or paraphrasing through automatic and human evaluations. We find that few reference or model-generated summary sentences have a high degree of aggregation measured by the proposed metric. We also demonstrate negative correlations between AggSHAP and other quality scores of system summaries. These findings suggest the need to develop new tasks and datasets to encourage multi-sentence aggregation in summarization.},
}
Markdown (Informal)
[Analyzing Multi-Sentence Aggregation in Abstractive Summarization via the Shapley Value](https://aclanthology.org/2023.newsum-1.12/) (He et al., NewSum 2023)
ACL