@comment{COLING 2025 main-conference paper, ACL Anthology ID 2025.coling-main.481.
All names use the "Last, First" comma form so that multi-word surnames
such as "Di Eugenio" stay together when BibTeX splits name parts.}
@inproceedings{jerpelea-etal-2025-dialectal,
    title = "Dialectal and Low Resource Machine Translation for {Aromanian}",
    author = "Jerpelea, Alexandru-Iulius and
      Radoi, Alina and
      Nisioi, Sergiu",
    editor = "Rambow, Owen and
      Wanner, Leo and
      Apidianaki, Marianna and
      Al-Khalifa, Hend and
      Di Eugenio, Barbara and
      Schockaert, Steven",
    booktitle = "Proceedings of the 31st International Conference on Computational Linguistics",
    month = jan,
    year = "2025",
    address = "Abu Dhabi, UAE",
    publisher = "Association for Computational Linguistics",
    url = "https://aclanthology.org/2025.coling-main.481/",
    pages = "7209--7228",
    abstract = "We present a neural machine translation system that can translate between Romanian, English, and Aromanian (an endangered Eastern Romance language); the first of its kind. BLEU scores range from 17 to 32 depending on the direction and genre of the text. Alongside, we release the biggest known Aromanian-Romanian bilingual corpus, consisting of 80k cleaned sentence pairs. Additional tools such as an agnostic sentence embedder (used for both text mining and automatic evaluation) and a diacritics converter are also presented. Lastly, we describe the online deployment of our quantized model, considering a CPU-driven limited resource scenario."
}
Markdown (Informal)
[Dialectal and Low Resource Machine Translation for Aromanian](https://aclanthology.org/2025.coling-main.481/) (Jerpelea et al., COLING 2025)
ACL