% Conference paper, SIGUL 2024 proceedings (held at LREC-COLING 2024), pages 252--256.
% Braces inside the title protect words whose capitalisation must survive
% sentence-casing bibliography styles.
@inproceedings{cusenza-coltekin-2024-nlp,
  title     = {{NLP} for {Arb{\"e}resh}: How an Endangered Language Learns to Write in the 21st Century},
  author    = {Cusenza, Giulio and
               {\c{C}}{\"o}ltekin, {\c{C}}a{\u{g}}r{\i}},
  editor    = {Melero, Maite and
               Sakti, Sakriani and
               Soria, Claudia},
  booktitle = {Proceedings of the 3rd Annual Meeting of the Special Interest Group on Under-resourced Languages @ LREC-COLING 2024},
  month     = may,
  year      = {2024},
  address   = {Torino, Italia},
  publisher = {ELRA and ICCL},
  url       = {https://aclanthology.org/2024.sigul-1.30/},
  pages     = {252--256},
  abstract  = {Societies are becoming more and more connected, and minority languages often find themselves helpless against the advent of the digital age, with their speakers having to regularly turn to other languages for written communication. This work introduces the case of Arb{\"e}resh, a southern Italian language related to Albanian. It presents the very first machine-readable Arb{\"e}resh data, collected through a web campaign, and describes a set of tools developed to enable the Arb{\"e}resh people to learn how to write their language, including a spellchecker, a conjugator, a numeral generator, and an interactive platform to learn Arb{\"e}resh spelling. A comprehensive web application was set up to make these tools available to the public, as well as to collect further data through them. This method can be replicated to help revive other minority languages in a situation similar to Arb{\"e}resh's. The main challenges of the process were the extremely low-resource setting and the variability of Arb{\"e}resh dialects.},
}
Markdown (Informal)
[NLP for Arbëresh: How an Endangered Language Learns to Write in the 21st Century](https://aclanthology.org/2024.sigul-1.30/) (Cusenza & Çöltekin, SIGUL 2024)
ACL