@inproceedings{choshen-abend-2018-automatic,
title = "Automatic Metric Validation for Grammatical Error Correction",
author = "Choshen, Leshem and
Abend, Omri",
editor = "Gurevych, Iryna and
Miyao, Yusuke",
booktitle = "Proceedings of the 56th Annual Meeting of the Association for Computational Linguistics (Volume 1: Long Papers)",
month = jul,
year = "2018",
address = "Melbourne, Australia",
publisher = "Association for Computational Linguistics",
url = "https://preview.aclanthology.org/add-emnlp-2024-awards/P18-1127/",
doi = "10.18653/v1/P18-1127",
pages = "1372--1382",
abstract = "Metric validation in Grammatical Error Correction (GEC) is currently done by observing the correlation between human and metric-induced rankings. However, such correlation studies are costly, methodologically troublesome, and suffer from low inter-rater agreement. We propose MAEGE, an automatic methodology for GEC metric validation, that overcomes many of the difficulties in the existing methodology. Experiments with MAEGE shed a new light on metric quality, showing for example that the standard $M^2$ metric fares poorly on corpus-level ranking. Moreover, we use MAEGE to perform a detailed analysis of metric behavior, showing that some types of valid edits are consistently penalized by existing metrics."
}
Markdown (Informal)
[Automatic Metric Validation for Grammatical Error Correction](https://preview.aclanthology.org/add-emnlp-2024-awards/P18-1127/) (Choshen & Abend, ACL 2018)
ACL