@inproceedings{asadpour-etal-2025-practical,
title = "A Practical Tool to Help Automate Interlinear Glossing: a Study on Mukr{\={i}} {K}urdish",
author = "Asadpour, Hiwa and
Okabe, Shu and
Fraser, Alexander",
editor = "Le Ferrand, {\'E}ric and
Klyachko, Elena and
Postnikova, Anna and
Shavrina, Tatiana and
Serikov, Oleg and
Voloshina, Ekaterina and
Vylomova, Ekaterina",
booktitle = "Proceedings of the Fourth Workshop on NLP Applications to Field Linguistics",
month = aug,
year = "2025",
address = "Vienna, Austria",
publisher = "Association for Computational Linguistics",
url = "https://preview.aclanthology.org/transition-to-people-yaml/2025.fieldmatters-1.6/",
pages = "65--75",
ISBN = "979-8-89176-282-4",
abstract = "Interlinear gloss generation aims to predict linguistic annotations (gloss) for a sentence in a language that is usually under ongoing documentation. Such output is a first draft for the linguist to work with and should reduce the manual workload.This article studies a simple glossing pipeline based on a Conditional Random Field and applies it to a small fieldwork corpus in Mukr{\={i}} Kurdish, a variety of Central Kurdish.We mainly focus on making the tool as accessible as possible for field linguists, so it can run on standard computers without the need for GPUs. Our pipeline predicts common grammatical patterns robustly and, more generally, frequent combinations of morphemes and glosses. Although more advanced neural models do reach better results, our feature-based system still manages to be competitive and to provide interpretability.To foster further collaboration between field linguistics and NLP, we also provide some recommendations regarding documentation endeavours and release our pipeline code alongside."
}
Markdown (Informal)
[A Practical Tool to Help Automate Interlinear Glossing: a Study on Mukrī Kurdish](https://preview.aclanthology.org/transition-to-people-yaml/2025.fieldmatters-1.6/) (Asadpour et al., FieldMatters 2025)
ACL