@inproceedings{nieminen-etal-2025-implementing,
title = "Implementing and Evaluating Multi-source Retrieval-Augmented Translation",
author = {Nieminen, Tommi and
Tiedemann, J{\"o}rg and
Virpioja, Sami},
editor = "Haddow, Barry and
Kocmi, Tom and
Koehn, Philipp and
Monz, Christof",
booktitle = "Proceedings of the Tenth Conference on Machine Translation",
month = nov,
year = "2025",
address = "Suzhou, China",
publisher = "Association for Computational Linguistics",
url = "https://preview.aclanthology.org/ingest-emnlp/2025.wmt-1.20/",
pages = "327--339",
ISBN = "979-8-89176-341-8",
abstract = "In recent years, neural machine translation (NMT) systems have been integrated with external databases with the aim of improving machine translation (MT) quality and enforcing domain-specific terminology and other conventions in the MT output. Most of the work in incorporating external knowledge with NMT has concentrated on integrating a single source of information, usually either a terminology database or a translation memory. However, in real-life translation scenarios, all relevant knowledge sources should be used in parallel. In this article, we evaluate different methods of integrating external knowledge from multiple sources in a single NMT system. In addition to training single models trained to utilize multiple kinds of information, we also ensemble models that have been trained to utilize a single type of information. We evaluate our models against state-of-the-art LLMs using an extensive purpose-built English to Finnish test suite."
}Markdown (Informal)
[Implementing and Evaluating Multi-source Retrieval-Augmented Translation](https://preview.aclanthology.org/ingest-emnlp/2025.wmt-1.20/) (Nieminen et al., WMT 2025)
ACL