% Charles University (CUNI) system description paper for the IWSLT 2025
% Simultaneous Speech Translation Task, as exported from the ACL Anthology.
% The url field uses the canonical aclanthology.org address rather than the
% preview.aclanthology.org staging address found in the original export.
% The address field follows the Anthology convention of recording the
% conference venue (not the publisher's city).
@inproceedings{machacek-polak-2025-simultaneous,
  author    = {Mach{\'a}{\v{c}}ek, Dominik and
               Pol{\'a}k, Peter},
  title     = {Simultaneous Translation with Offline Speech and {LLM} Models in {CUNI} Submission to {IWSLT} 2025},
  editor    = {Salesky, Elizabeth and
               Federico, Marcello and
               Anastasopoulos, Antonis},
  booktitle = {Proceedings of the 22nd International Conference on Spoken Language Translation ({IWSLT} 2025)},
  month     = jul,
  year      = {2025},
  address   = {Vienna, Austria (in-person and online)},
  publisher = {Association for Computational Linguistics},
  pages     = {389--398},
  isbn      = {979-8-89176-272-5},
  url       = {https://aclanthology.org/2025.iwslt-1.41/},
  abstract  = {This paper describes Charles University submission to the Simultaneous Speech Translation Task of the IWSLT 2025. We cover all four language pairs with a direct or cascade approach. The backbone of our systems is the offline Whisper speech model, which we use for both translation and transcription in simultaneous mode with the state-of-the-art simultaneous policy AlignAtt. We further improve the performance by prompting to inject in-domain terminology, and we accommodate context. Our cascaded systems further use EuroLLM for unbounded simultaneous translation. Compared to the Organizers' baseline, our systems improve by 2 BLEU points on Czech to English and 13-22 BLEU points on English to German, Chinese and Japanese on the development sets. Additionally, we also propose a new enhanced measure of speech recognition latency.},
}
Markdown (Informal)
[Simultaneous Translation with Offline Speech and LLM Models in CUNI Submission to IWSLT 2025](https://aclanthology.org/2025.iwslt-1.41/) (Macháček & Polák, IWSLT 2025)
ACL