% RoCS-MT v2 test-suite paper from the WMT 2025 proceedings (ACL Anthology ID 2025.wmt-1.58).
% The url field uses the canonical Anthology address, not the temporary ingestion-preview host.
@inproceedings{bawden-sagot-2025-rocs,
  title     = {{RoCS-MT} v2 at {WMT} 2025: Robust Challenge Set for Machine Translation},
  author    = {Bawden, Rachel and Sagot, Beno{\^i}t},
  editor    = {Haddow, Barry and Kocmi, Tom and Koehn, Philipp and Monz, Christof},
  booktitle = {Proceedings of the Tenth Conference on Machine Translation},
  month     = nov,
  year      = {2025},
  address   = {Suzhou, China},
  publisher = {Association for Computational Linguistics},
  url       = {https://aclanthology.org/2025.wmt-1.58/},
  pages     = {834--849},
  isbn      = {979-8-89176-341-8},
  abstract  = {RoCS-MT (Robust Challenge Set for Machine Translation) was initially proposed at the test suites track of WMT 2023. Designed to challenge MT systems' translation performance on user-generated content (UGC), it contains examples sourced from English Reddit, with manually normalised versions, aligned labelled annotation spans and reference translations in five languages. In this article, we describe version 2 of RoCS-MT in the context of the 2025 WMT test suites track. This new version contains several improvements on the initial version including (i) minor corrections of normalisation, (ii) corrections to reference translations and addition of alternative references to accommodate for different possible genders (e.g. of speakers) and (iii) a redesign and re-annotation of normalisation spans for further analysis of different non-standard UGC phenomena. We describe these changes and provide results and preliminary analysis of the MT submissions to the 2025 general translation task.},
}
Markdown (Informal)
[RoCS-MT v2 at WMT 2025: Robust Challenge Set for Machine Translation](https://aclanthology.org/2025.wmt-1.58/) (Bawden & Sagot, WMT 2025)
ACL