@inproceedings{zagidov-brochhagen-2026-avarlab,
title = "{A}var{L}ab: An Integrated Digital Ecosystem for {A}var, a Morphologically Rich Low-Resource Language",
author = "Zagidov, Kebed and
Brochhagen, Thomas",
editor = "Agyapong, Godfred and
Moeller, Sarah and
Arppe, Antti and
Marashian, Ali and
Rosenblum, Daisy",
booktitle = "Proceedings of the Ninth Workshop on the Use of Computational Methods in the Study of Endangered Languages ({C}omput{EL}-9)",
month = jul,
year = "2026",
address = "San Diego, California, USA",
publisher = "Association for Computational Linguistics",
url = "https://preview.aclanthology.org/ingest-acl-workshops/2026.computel-1.7/",
pages = "62--71",
ISBN = "979-8-89176-422-4",
abstract = "This paper presents a digital ecosystem designed for Avar, a morphologically rich and vulnerable Northeast Caucasian language. Addressing the common bottleneck where lexical resources, corpora, and computational tools are developed in isolation or are entirely absent, we propose the ``generate-verify'' workflow. By developing a scalable, rule-based computational architecture, our system specifically targets the challenges of low-resource settings, overcoming data sparsity to generate over one million inflected forms from a static dictionary of 14,700 entries.Furthermore, by coupling morphological generation with corpus verification, we introduce a dynamic method to rapidly analyze and expand endangered language data. This approach transforms static linguistic documentation into active language reclamation tools, supporting dictionary lookup and the creation of silver-standard annotations for downstream NLP. The platform also serves as a unified model for the collection, management, and mobilization of fragmented language data, ensuring that the resulting resources are directly accessible and beneficial to the speaker community. Ultimately, AvarLab provides a practical, adaptable pathway for building sustainable digital infrastructure by fostering interaction among documentary linguists, computer scientists, and native speakers."
}Markdown (Informal)
[AvarLab: An Integrated Digital Ecosystem for Avar, a Morphologically Rich Low-Resource Language](https://preview.aclanthology.org/ingest-acl-workshops/2026.computel-1.7/) (Zagidov & Brochhagen, ComputEL 2026)
ACL