@inproceedings{bogoychev-chen-2023-terminology,
title = "Terminology-Aware Translation with Constrained Decoding and Large Language Model Prompting",
author = "Bogoychev, Nikolay and
Chen, Pinzhen",
editor = "Koehn, Philipp and
Haddow, Barry and
Kocmi, Tom and
Monz, Christof",
booktitle = "Proceedings of the Eighth Conference on Machine Translation",
month = dec,
year = "2023",
address = "Singapore",
publisher = "Association for Computational Linguistics",
url = "https://preview.aclanthology.org/jlcl-multiple-ingestion/2023.wmt-1.80/",
doi = "10.18653/v1/2023.wmt-1.80",
pages = "890--896",
abstract = "Terminology correctness is important in the downstream application of machine translation, and a prevalent way to ensure this is to inject terminology constraints into a translation system. In our submission to the WMT 2023 terminology translation task, we adopt a translate-then-refine approach which can be domain-independent and requires minimal manual efforts. We annotate random source words with pseudo-terminology translations obtained from word alignment to first train a terminology-aware model. Further, we explore two post-processing methods. First, we use an alignment process to discover whether a terminology constraint has been violated, and if so, we re-decode with the violating word negatively constrained. Alternatively, we leverage a large language model to refine a hypothesis by providing it with terminology constraints. Results show that our terminology-aware model learns to incorporate terminologies effectively, and the large language model refinement process can further improve terminology recall."
}
Markdown (Informal)
[Terminology-Aware Translation with Constrained Decoding and Large Language Model Prompting](https://preview.aclanthology.org/jlcl-multiple-ingestion/2023.wmt-1.80/) (Bogoychev & Chen, WMT 2023)
ACL