@inproceedings{mukherjee-shrivastava-2024-chrf,
title = "chr{F}-{S}: Semantics Is All You Need",
author = "Mukherjee, Ananya and
Shrivastava, Manish",
editor = "Haddow, Barry and
Kocmi, Tom and
Koehn, Philipp and
Monz, Christof",
booktitle = "Proceedings of the Ninth Conference on Machine Translation",
month = nov,
year = "2024",
address = "Miami, Florida, USA",
publisher = "Association for Computational Linguistics",
url = "https://preview.aclanthology.org/Author-page-Marten-During-lu/2024.wmt-1.33/",
doi = "10.18653/v1/2024.wmt-1.33",
pages = "470--474",
abstract = "Machine translation (MT) evaluation metrics like BLEU and chrF++ are widely used reference-based metrics that do not require training and are language-independent. However, these metrics primarily focus on n-gram matching and often overlook semantic depth and contextual understanding. To address this gap, we introduce chrF-S (Semantic chrF++), an enhanced metric that integrates sentence embeddings to evaluate translation quality more comprehensively. By combining traditional character and word n-gram analysis with semantic information derived from embeddings, chrF-S captures both syntactic accuracy and sentence-level semantics. This paper presents our contributions to the WMT24 shared metrics task, showcasing our participation and the development of chrF-S. We also demonstrate that, according to preliminary results on the leaderboard, our metric performs on par with other supervised and LLM-based metrics. By merging semantic insights with n-gram precision, chrF-S offers a significant enhancement in the assessment of machine-generated translations, advancing the field of MT evaluation. Our code and data will be made available at \url{https://github.com/AnanyaCoder/chrF-S}."
}
Markdown (Informal)
[chrF-S: Semantics Is All You Need](https://preview.aclanthology.org/Author-page-Marten-During-lu/2024.wmt-1.33/) (Mukherjee & Shrivastava, WMT 2024)
ACL
- Ananya Mukherjee and Manish Shrivastava. 2024. chrF-S: Semantics Is All You Need. In Proceedings of the Ninth Conference on Machine Translation, pages 470–474, Miami, Florida, USA. Association for Computational Linguistics.