% Workshop paper record exported from the ACL Anthology.
% The url field uses the canonical Anthology address rather than a
% temporary preview-branch deployment, which is not a stable link.
% Proper nouns in the title are brace-protected as whole words so that
% sentence-casing styles keep their capitals.
@inproceedings{veitsman-hartmann-2025-recent,
  title     = {Recent Advancements and Challenges of {Turkic} {Central} {Asian} Language Processing},
  author    = {Veitsman, Yana and
               Hartmann, Mareike},
  editor    = {Hettiarachchi, Hansi and
               Ranasinghe, Tharindu and
               Rayson, Paul and
               Mitkov, Ruslan and
               Gaber, Mohamed and
               Premasiri, Damith and
               Tan, Fiona Anting and
               Uyangodage, Lasitha},
  booktitle = {Proceedings of the First Workshop on Language Models for Low-Resource Languages},
  month     = jan,
  year      = {2025},
  address   = {Abu Dhabi, United Arab Emirates},
  publisher = {Association for Computational Linguistics},
  url       = {https://aclanthology.org/2025.loreslm-1.25/},
  pages     = {309--324},
  abstract  = {Research in NLP for Central Asian Turkic languages - Kazakh, Uzbek, Kyrgyz, and Turkmen - faces typical low-resource language challenges like data scarcity, limited linguistic resources and technology development. However, recent advancements have included the collection of language-specific datasets and the development of models for downstream tasks. Thus, this paper aims to summarize recent progress and identify future research directions. It provides a high-level overview of each language{'}s linguistic features, the current technology landscape, the application of transfer learning from higher-resource languages, and the availability of labeled and unlabeled data. By outlining the current state, we hope to inspire and facilitate future research.},
}
Markdown (Informal)
[Recent Advancements and Challenges of Turkic Central Asian Language Processing](https://aclanthology.org/2025.loreslm-1.25/) (Veitsman & Hartmann, LoResLM 2025)
ACL