% LaTeCH-CLfL 2026 workshop paper (ACL Anthology ID 2026.latechclfl-1.30).
% The url field holds the canonical Anthology address rather than a
% preview.aclanthology.org staging link, which is tied to an ingestion branch.
@inproceedings{winkle-etal-2026-generative-information,
  title     = {Generative Information Extraction from Biographical Sources},
  author    = {Winkle, Robin and
               Stede, Manfred and
               Kreutel, J{\"o}rn},
  editor    = {Alves, Diego and
               Bizzoni, Yuri and
               Degaetano-Ortlieb, Stefania and
               Kazantseva, Anna and
               Pagel, Janis and
               Szpakowicz, Stan},
  booktitle = {Proceedings of the 10th Joint {SIGHUM} Workshop on Computational Linguistics for Cultural Heritage, Social Sciences, Humanities and Literature 2026},
  month     = mar,
  year      = {2026},
  address   = {Rabat, Morocco},
  publisher = {Association for Computational Linguistics},
  url       = {https://aclanthology.org/2026.latechclfl-1.30/},
  pages     = {311--322},
  isbn      = {979-8-89176-373-9},
  abstract  = {Biographical sources, such as literature encyclopedias, encode knowledge about historical figures in textual form. In this paper, we address the task of consolidating structured biographical information about authors from the former German Democratic Republic into a unified database. To this end, we present a generalizable Information Extraction (IE) system based on LLM prompting. Specifically, we compare two midsized open-source models, Qwen-2.5-32B and Llama-3-70B-Instruct, investigate a range of Prompt Engineering (PE) strategies, and propose a semantic similarity-based evaluation metric for open-ended IE. Our experiments on an unpublished annotated subset of biographical texts deliver moderate precision and variable recall, highlighting both the potential and current limitations of generative IE in the Digital Humanities.},
}
Markdown (Informal)
[Generative Information Extraction from Biographical Sources](https://aclanthology.org/2026.latechclfl-1.30/) (Winkle et al., LaTeCH-CLfL 2026)
ACL
- Robin Winkle, Manfred Stede, and Jörn Kreutel. 2026. Generative Information Extraction from Biographical Sources. In Proceedings of the 10th Joint SIGHUM Workshop on Computational Linguistics for Cultural Heritage, Social Sciences, Humanities and Literature 2026, pages 311–322, Rabat, Morocco. Association for Computational Linguistics.