@comment{
  ACL Anthology record 2025.iwclul-1.11 (IWCLUL 2025 workshop paper).
  The url field uses the permanent Anthology address rather than a
  staging preview build. Names use LaTeX escapes so the entry also
  works with classic 8-bit BibTeX.
}
@inproceedings{mus-etal-2025-creating,
  title     = {Creating a multi-layer Treebank for {Tundra} {Nenets}},
  author    = {Mus, Nikolett and
               Guillaume, Bruno and
               Kahane, Sylvain and
               Zeman, Daniel},
  editor    = {H{\"a}m{\"a}l{\"a}inen, Mika and
               Rie{\ss}ler, Michael and
               Morooka, Eiaki V. and
               Kharlashkin, Lev},
  booktitle = {Proceedings of the 10th International Workshop on Computational Linguistics for Uralic Languages},
  month     = dec,
  year      = {2025},
  address   = {Joensuu, Finland},
  publisher = {Association for Computational Linguistics},
  url       = {https://aclanthology.org/2025.iwclul-1.11/},
  pages     = {77--86},
  isbn      = {979-8-89176-360-9},
  abstract  = {This paper presents the development of the Tundra Nenets Universal Dependencies (UD) Treebank, the first syntactically annotated resource for the Samoyedic branch of the Uralic family. The treebank integrates spoken-language data and adopts the morphologically enhanced Surface-Syntactic UD (mSUD) framework to capture inflectional morphology and morphology-based syntactic relations. It further incorporates Information Structure annotation. The methodological workflow includes data selection, transcription conventions, sentence and lexeme segmentation, annotation of spoken-language features, lemmatization, treatment of morpheme status, part-of-speech and morphological tagging, and syntactic annotation based on the functional and distributional properties of syntactic elements. We also outline the principles guiding multi-level annotation and justify the theoretical choices underlying the integration of prosodic, morphological, and syntactic information.},
}
Markdown (Informal)
[Creating a multi-layer Treebank for Tundra Nenets](https://aclanthology.org/2025.iwclul-1.11/) (Mus et al., IWCLUL 2025)
ACL
- Nikolett Mus, Bruno Guillaume, Sylvain Kahane, and Daniel Zeman. 2025. Creating a multi-layer Treebank for Tundra Nenets. In Proceedings of the 10th International Workshop on Computational Linguistics for Uralic Languages, pages 77–86, Joensuu, Finland. Association for Computational Linguistics.