% Koneru, Huck, Exel, and Niehues (2025): conference paper in the IWSLT 2025
% proceedings, published by the Association for Computational Linguistics.
% The url field uses the canonical aclanthology.org address rather than a
% temporary preview/ingestion build of the site, so the link stays resolvable.
@inproceedings{koneru-etal-2025-quality,
  title     = {Quality-Aware Decoding: Unifying Quality Estimation and Decoding},
  author    = {Koneru, Sai and
               Huck, Matthias and
               Exel, Miriam and
               Niehues, Jan},
  editor    = {Salesky, Elizabeth and
               Federico, Marcello and
               Anastasopoulos, Antonis},
  booktitle = {Proceedings of the 22nd International Conference on Spoken Language Translation ({IWSLT} 2025)},
  month     = jul,
  year      = {2025},
  address   = {Vienna, Austria (in-person and online)},
  publisher = {Association for Computational Linguistics},
  url       = {https://aclanthology.org/2025.iwslt-1.3/},
  pages     = {33--46},
  isbn      = {979-8-89176-272-5},
  abstract  = {Quality Estimation (QE) models for Neural Machine Translation (NMT) predict the quality of the hypothesis without having access to the reference. An emerging research direction in NMT involves the use of QE models, which have demonstrated high correlations with human judgment and can enhance translations through Quality-Aware Decoding. Although several approaches have been proposed based on sampling multiple candidate translations and picking the best candidate, none have integrated these models directly into the decoding process. In this paper, we address this by proposing a novel token-level QE model capable of reliably scoring partial translations. We build a uni-directional QE model for this, as decoder models are inherently trained and efficient on partial sequences. We then present a decoding strategy that integrates the QE model for Quality-Aware decoding and demonstrate that the translation quality improves when compared to the N-best list re-ranking with state-of-the-art QE models (up to 1.39 XCOMET-XXL). Finally, we show that our approach provides significant benefits in document translation tasks, where the quality of N-best lists is typically suboptimal. Code can be found at https://github.com/SAP-samples/quality-aware-decoding-translation.},
}
Markdown (Informal)
[Quality-Aware Decoding: Unifying Quality Estimation and Decoding](https://aclanthology.org/2025.iwslt-1.3/) (Koneru et al., IWSLT 2025)
ACL
- Sai Koneru, Matthias Huck, Miriam Exel, and Jan Niehues. 2025. Quality-Aware Decoding: Unifying Quality Estimation and Decoding. In Proceedings of the 22nd International Conference on Spoken Language Translation (IWSLT 2025), pages 33–46, Vienna, Austria (in-person and online). Association for Computational Linguistics.