@comment{ACL 2025 short paper (ACL Anthology record 2025.acl-short.8). The url field uses the canonical Anthology address rather than the temporary ingestion-preview host, which is not a stable link target.}
@inproceedings{von-daniken-etal-2025-measure,
  title     = {A Measure of the System Dependence of Automated Metrics},
  author    = {Von D{\"a}niken, Pius and
               Deriu, Jan Milan and
               Cieliebak, Mark},
  editor    = {Che, Wanxiang and
               Nabende, Joyce and
               Shutova, Ekaterina and
               Pilehvar, Mohammad Taher},
  booktitle = {Proceedings of the 63rd Annual Meeting of the Association for Computational Linguistics (Volume 2: Short Papers)},
  month     = jul,
  year      = {2025},
  address   = {Vienna, Austria},
  publisher = {Association for Computational Linguistics},
  url       = {https://aclanthology.org/2025.acl-short.8/},
  pages     = {87--99},
  isbn      = {979-8-89176-252-7},
  abstract  = {Automated metrics for Machine Translation have made significant progress, with the goal of replacing expensive and time-consuming human evaluations. These metrics are typically assessed by their correlation with human judgments, which captures the monotonic relationship between human and metric scores. However, we argue that it is equally important to ensure that metrics treat all systems fairly and consistently. In this paper, we introduce a method to evaluate this aspect.},
}
Markdown (Informal)
[A Measure of the System Dependence of Automated Metrics](https://aclanthology.org/2025.acl-short.8/) (Von Däniken et al., ACL 2025)
ACL
- Pius Von Däniken, Jan Milan Deriu, and Mark Cieliebak. 2025. A Measure of the System Dependence of Automated Metrics. In Proceedings of the 63rd Annual Meeting of the Association for Computational Linguistics (Volume 2: Short Papers), pages 87–99, Vienna, Austria. Association for Computational Linguistics.