@inproceedings{kvapilikova-etal-2019-cuni,
title = "{CUNI} Systems for the Unsupervised News Translation Task in {WMT} 2019",
author = "Kvapil{\'i}kov{\'a}, Ivana and
Mach{\'a}{\v{c}}ek, Dominik and
Bojar, Ond{\v{r}}ej",
editor = "Bojar, Ond{\v{r}}ej and
Chatterjee, Rajen and
Federmann, Christian and
Fishel, Mark and
Graham, Yvette and
Haddow, Barry and
Huck, Matthias and
Yepes, Antonio Jimeno and
Koehn, Philipp and
Martins, Andr{\'e} and
Monz, Christof and
Negri, Matteo and
N{\'e}v{\'e}ol, Aur{\'e}lie and
Neves, Mariana and
Post, Matt and
Turchi, Marco and
Verspoor, Karin",
booktitle = "Proceedings of the Fourth Conference on Machine Translation (Volume 2: Shared Task Papers, Day 1)",
month = aug,
year = "2019",
address = "Florence, Italy",
publisher = "Association for Computational Linguistics",
url = "https://preview.aclanthology.org/add-emnlp-2024-awards/W19-5323/",
doi = "10.18653/v1/W19-5323",
pages = "241--248",
abstract = "In this paper we describe the CUNI translation system used for the unsupervised news shared task of the ACL 2019 Fourth Conference on Machine Translation (WMT19). We follow the strategy of Artetxe ae at. (2018b), creating a seed phrase-based system where the phrase table is initialized from cross-lingual embedding mappings trained on monolingual data, followed by a neural machine translation system trained on synthetic parallel data. The synthetic corpus was produced from a monolingual corpus by a tuned PBMT model refined through iterative back-translation. We further focus on the handling of named entities, i.e. the part of vocabulary where the cross-lingual embedding mapping suffers most. Our system reaches a BLEU score of 15.3 on the German-Czech WMT19 shared task."
}
Markdown (Informal)
[CUNI Systems for the Unsupervised News Translation Task in WMT 2019](https://preview.aclanthology.org/add-emnlp-2024-awards/W19-5323/) (Kvapilíková et al., WMT 2019)
ACL