% IWSLT 2025 paper, ACL Anthology ID 2025.iwslt-1.7. The url field points at
% the canonical Anthology page rather than a preview/staging deployment.
@inproceedings{post-hoang-2025-effects,
  title     = {Effects of automatic alignment on speech translation metrics},
  author    = {Post, Matt and
               Hoang, Hieu},
  editor    = {Salesky, Elizabeth and
               Federico, Marcello and
               Anastasopoulos, Antonis},
  booktitle = {Proceedings of the 22nd International Conference on Spoken Language Translation ({IWSLT} 2025)},
  month     = jul,
  year      = {2025},
  address   = {Vienna, Austria (in-person and online)},
  publisher = {Association for Computational Linguistics},
  url       = {https://aclanthology.org/2025.iwslt-1.7/},
  pages     = {84--92},
  isbn      = {979-8-89176-272-5},
  abstract  = {Research in speech translation (ST) often operates in a setting where human segmentations of the input audio are provided. This simplifying assumption avoids the evaluation-time difficulty of aligning the translated outputs to their references for segment-level evaluation, but it also means that the systems are not evaluated as they will be used in production settings, where automatic audio segmentation is an unavoidable component. A tool, mwerSegmenter, exists for aligning ST output to references, but its behavior is noisy and not well understood. We address this with an investigation of the effects automatic alignment on metric correlation with system-level human judgments; that is, as a metrics task. Using the eleven language tasks from the WMT24 data, we merge each system{'}s output at the domain level, align them to the references, compute metrics, and evaluate the correlation with the human system-level rankings. In addition to expanding analysis to many target languages, we also experiment with different subword models and with the generation of additional paraphrases. We find that automatic realignment has minimal effect on COMET-level system rankings, with accuracies still way above BLEU scores from manual segmentations. In the process, we also bring the community{'}s attention to the source code for the tool, which we have updated, modernized, and realized as a Python module, mweralign.},
}
Markdown (Informal)
[Effects of automatic alignment on speech translation metrics](https://aclanthology.org/2025.iwslt-1.7/) (Post & Hoang, IWSLT 2025)
ACL