@inproceedings{christou-tsoumakas-2025-artificial,
title = "Artificial Relationships in Fiction: A Dataset for Advancing {NLP} in Literary Domains",
author = "Christou, Despina and
Tsoumakas, Grigorios",
editor = "Kazantseva, Anna and
Szpakowicz, Stan and
Degaetano-Ortlieb, Stefania and
Bizzoni, Yuri and
Pagel, Janis",
booktitle = "Proceedings of the 9th Joint SIGHUM Workshop on Computational Linguistics for Cultural Heritage, Social Sciences, Humanities and Literature (LaTeCH-CLfL 2025)",
month = may,
year = "2025",
address = "Albuquerque, New Mexico",
publisher = "Association for Computational Linguistics",
url = "https://preview.aclanthology.org/Ingest-2025-COMPUTEL/2025.latechclfl-1.13/",
pages = "130--147",
ISBN = "979-8-89176-241-1",
abstract = "Relation extraction (RE) in fiction presents unique NLP challenges due to implicit, narrative-driven relationships. Unlike factual texts, fiction weaves complex connections, yet existing RE datasets focus on non-fiction. To address this, we introduce Artificial Relationships in Fiction (ARF), a synthetically annotated dataset for literary RE. Built from diverse Project Gutenberg fiction, ARF considers author demographics, publication periods, and themes. We curated an ontology for fiction-specific entities and relations, and using GPT-4o, generated artificial relationships to capture narrative complexity. Our analysis demonstrates its value for finetuning RE models and advancing computational literary studies. By bridging a critical RE gap, ARF enables deeper exploration of fictional relationships, enriching NLP research at the intersection of storytelling and AI-driven literary analysis."
}
Markdown (Informal)
[Artificial Relationships in Fiction: A Dataset for Advancing NLP in Literary Domains](https://preview.aclanthology.org/Ingest-2025-COMPUTEL/2025.latechclfl-1.13/) (Christou & Tsoumakas, LaTeCHCLfL 2025)
ACL