% Conference paper from the NLP4DH 2025 proceedings (ACL Anthology ID 2025.nlp4dh-1.15).
% The url field uses the canonical Anthology address rather than a preview/staging mirror.
@inproceedings{arnold-etal-2025-advances,
  title     = {Advances and Challenges in the Automatic Identification of Indirect Quotations in Scholarly Texts and Literary Works},
  author    = {Arnold, Frederik and
               J{\"a}schke, Robert and
               Kraut, Philip},
  editor    = {H{\"a}m{\"a}l{\"a}inen, Mika and
               {\"O}hman, Emily and
               Bizzoni, Yuri and
               Miyagawa, So and
               Alnajjar, Khalid},
  booktitle = {Proceedings of the 5th International Conference on Natural Language Processing for Digital Humanities},
  month     = may,
  year      = {2025},
  address   = {Albuquerque, USA},
  publisher = {Association for Computational Linguistics},
  url       = {https://aclanthology.org/2025.nlp4dh-1.15/},
  pages     = {179--190},
  isbn      = {979-8-89176-234-3},
  abstract  = {Literary scholars commonly refer to the interpreted literary work using various types of quotations. Two main categories are direct and indirect quotations. In this work we focus on the automatic identification of two subtypes of indirect quotations: paraphrases and summaries. Our contributions are twofold. First, we present a dataset of scholarly works with annotations of text spans which summarize or paraphrase the interpreted drama and the source of the quotation. Second, we present a two-step approach to solve the task at hand. We found the process of annotating large training corpora very time consuming and therefore leverage GPT-generated summaries to generate training data for our approach.},
}
Markdown (Informal)
[Advances and Challenges in the Automatic Identification of Indirect Quotations in Scholarly Texts and Literary Works](https://aclanthology.org/2025.nlp4dh-1.15/) (Arnold et al., NLP4DH 2025)
ACL