% Workshop paper (AmericasNLP 2026): Quechua dialect classification with linguistic feature tagging.
% NOTE(review): the url field points at a preview/ingest host (preview.aclanthology.org);
%   it may not be permanent -- TODO replace with the canonical URL or a DOI once available.
% NOTE(review): editor surnames normalised to "Coto Solano" (compound surname kept together)
%   and "von der Wense" (lowercase particles) -- TODO confirm spelling/hyphenation against
%   the proceedings front matter.
@inproceedings{post-palmer-2026-linguistic,
  author    = {Post, Claire and
               Palmer, Alexis},
  title     = {Linguistic Feature Tagging for Automatic Classification of 27 Closely-Related {Quechua} Varieties},
  editor    = {Mager, Manuel and
               Ebrahimi, Abteen and
               Bui, Minh Duc and
               Pugh, Robert and
               Oncevay, Arturo and
               Chiruzzo, Luis and
               Coto Solano, Rolando and
               Rijhwani, Shruti and
               von der Wense, Katharina},
  booktitle = {Proceedings of the Sixth Workshop on {NLP} for Indigenous Languages of the {Americas} ({AmericasNLP})},
  month     = jul,
  year      = {2026},
  address   = {San Diego, California, USA},
  publisher = {Association for Computational Linguistics},
  pages     = {46--63},
  isbn      = {979-8-89176-415-6},
  url       = {https://preview.aclanthology.org/ingest-acl-workshops/2026.americasnlp-6.5/},
  abstract  = {This paper presents a multi-dialect text classifier for Quechua that augments neural models with rule-based linguistic information to address challenges in low-resource, morphologically complex settings. The approach is built on a carefully curated dataset spanning multiple genres, including annotated parallel bible corpora, and encodes manually annotated lexical variation and polypersonal verbal agreement as explicit features within a transformer-based classifier. Results show that neural models substantially outperform statistical baselines, enabling highly accurate multi-class classification across 27 Quechua dialects. The impact of linguistic augmentation is context-dependent: gains are minimal in high-resource settings but more pronounced in low-resource and cross-domain conditions. Overall, this work aims to contribute to the development of dialect-sensitive NLP methods for Quechua and other low-resource, morphologically rich languages.},
}
Markdown (Informal)
[Linguistic Feature Tagging for Automatic Classification of 27 Closely-Related Quechua Varieties](https://preview.aclanthology.org/ingest-acl-workshops/2026.americasnlp-6.5/) (Post & Palmer, AmericasNLP 2026)
ACL