% Vicomtech system description paper for the WMT 2024 shared task on translation
% into low-resource languages of Spain (ACL Anthology ID 2024.wmt-1.91).
@inproceedings{ponce-etal-2024-vicomtech,
  title     = {Vicomtech@{WMT} 2024: Shared Task on Translation into Low-Resource Languages of {Spain}},
  author    = {Ponce, David and
               Gete, Harritxu and
               Etchegoyhen, Thierry},
  editor    = {Haddow, Barry and
               Kocmi, Tom and
               Koehn, Philipp and
               Monz, Christof},
  booktitle = {Proceedings of the Ninth Conference on Machine Translation},
  month     = nov,
  year      = {2024},
  address   = {Miami, Florida, USA},
  publisher = {Association for Computational Linguistics},
  url       = {https://aclanthology.org/2024.wmt-1.91/},
  doi       = {10.18653/v1/2024.wmt-1.91},
  pages     = {934--942},
  abstract  = {We describe Vicomtech's participation in the WMT 2024 Shared Task on translation into low-resource languages of Spain. We addressed all three languages of the task, namely Aragonese, Aranese and Asturian, in both constrained and open settings. Our work mainly centred on exploiting different types of corpora via data filtering, selection and combination methods, along with synthetic data generated with translation models based on rules, neural sequence-to-sequence or large language models. We improved or matched the best baselines in all three language pairs and present complementary results on additional test sets.},
}
Markdown (Informal)
[Vicomtech@WMT 2024: Shared Task on Translation into Low-Resource Languages of Spain](https://aclanthology.org/2024.wmt-1.91/) (Ponce et al., WMT 2024)
ACL