% NAACL 2025 long paper; ACL Anthology ID 2025.naacl-long.145 (url below is the canonical permalink).
@inproceedings{cheng-etal-2025-bayesian,
  title     = {A {Bayesian} Optimization Approach to Machine Translation Reranking},
  author    = {Cheng, Julius and
               Z{\"u}fle, Maike and
               Zouhar, Vil{\'e}m and
               Vlachos, Andreas},
  editor    = {Chiruzzo, Luis and
               Ritter, Alan and
               Wang, Lu},
  booktitle = {Proceedings of the 2025 Conference of the Nations of the Americas Chapter of the Association for Computational Linguistics: Human Language Technologies (Volume 1: Long Papers)},
  month     = apr,
  year      = {2025},
  address   = {Albuquerque, New Mexico},
  publisher = {Association for Computational Linguistics},
  url       = {https://aclanthology.org/2025.naacl-long.145/},
  pages     = {2849--2862},
  isbn      = {979-8-89176-189-6},
  abstract  = {Reranking, or scoring a list of prediction candidates from a machine translation system with an external scoring model and returning the highest-scoring candidate, remains a simple and effective method for improving prediction quality. However, reranking with high quality scoring models can add substantial computational cost to the translation pipeline, which we address in this work by framing list reranking as a Bayesian optimization (BayesOpt) problem over the candidate list, where unknown scores are modeled with a Gaussian process. This algorithm scores candidates iteratively, choosing next candidates by balancing between exploration, choosing to score those that differ from candidates already scored, and exploitation, choosing to score those that resemble high-scoring candidates. This procedure finds high-scoring candidates while scoring only a fraction of the candidates list; given candidate lists of 200 random samples (before deduplication), our method achieves the same CometKiwi score using only 70 scoring evaluations on average compared to scoring a random subset of 180 candidates. We also propose multi-fidelity BayesOpt for list reranking, where scores obtained from a noisier but cheaper proxy scoring model are incorporated into the search process. We show that well-trained distilled proxy scorers can further improve the performance of BayesOpt.},
}
Markdown (Informal)
[A Bayesian Optimization Approach to Machine Translation Reranking](https://aclanthology.org/2025.naacl-long.145/) (Cheng et al., NAACL 2025)
ACL
- Julius Cheng, Maike Züfle, Vilém Zouhar, and Andreas Vlachos. 2025. A Bayesian Optimization Approach to Machine Translation Reranking. In Proceedings of the 2025 Conference of the Nations of the Americas Chapter of the Association for Computational Linguistics: Human Language Technologies (Volume 1: Long Papers), pages 2849–2862, Albuquerque, New Mexico. Association for Computational Linguistics.