% ACL Anthology record 2025.law-1.8 (LAW-XIX, 2025). The url field holds the permanent Anthology address, not a preview-branch link.
@inproceedings{passarotti-etal-2025-harmonizing,
    title = "Harmonizing Divergent Lemmatization and Part-of-Speech Tagging Practices for {Latin} Participles through the {LiLa} Knowledge Base",
    author = "Passarotti, Marco and
      Iurescia, Federica and
      Ruffolo, Paolo",
    editor = "Peng, Siyao and
      Rehbein, Ines",
    booktitle = "Proceedings of the 19th Linguistic Annotation Workshop (LAW-XIX-2025)",
    month = jul,
    year = "2025",
    address = "Vienna, Austria",
    publisher = "Association for Computational Linguistics",
    url = "https://aclanthology.org/2025.law-1.8/",
    pages = "103--114",
    isbn = "979-8-89176-262-6",
    abstract = "This paper addresses the challenge of divergent lemmatization and part-of-speech (PoS) tagging practices for Latin participles in annotated corpora. We propose a solution through the LiLa Knowledge Base, a Linked Open Data framework designed to unify lexical and textual data for Latin. Using lemmas as the point of connection between distributed textual and lexical resources, LiLa introduces hypolemmas {---} secondary citation forms belonging to a word{'}s inflectional paradigm {---} as a means of reconciling divergent annotations for participles. Rather than advocating a single uniform annotation scheme, LiLa preserves each resource{'}s native guidelines while ensuring that users can retrieve and analyze participial data seamlessly. Via empirical assessments of multiple Latin corpora, we show how the LiLa{'}s integration of lemmas and hypolemmas enables consistent retrieval of participle forms regardless of whether they are categorized as verbal or adjectival."
}
Markdown (Informal)
[Harmonizing Divergent Lemmatization and Part-of-Speech Tagging Practices for Latin Participles through the LiLa Knowledge Base](https://aclanthology.org/2025.law-1.8/) (Passarotti et al., LAW 2025)
ACL