% Explainable CED dataset paper, NAACL 2024 Student Research Workshop (Volume 4).
% The url field uses the canonical aclanthology.org host; preview.aclanthology.org
% branch deployments are temporary and should not be cited.
@inproceedings{jung-etal-2024-explainable,
    title     = {Explainable {CED}: A Dataset for Explainable Critical Error Detection in Machine Translation},
    author    = {Jung, Dahyun and
                 Eo, Sugyeong and
                 Park, Chanjun and
                 Lim, Heuiseok},
    editor    = {Cao, Yang (Trista) and
                 Papadimitriou, Isabel and
                 Ovalle, Anaelia and
                 Zampieri, Marcos and
                 Ferraro, Francis and
                 Swayamdipta, Swabha},
    booktitle = {Proceedings of the 2024 Conference of the North American Chapter of the Association for Computational Linguistics: Human Language Technologies (Volume 4: Student Research Workshop)},
    month     = jun,
    year      = {2024},
    address   = {Mexico City, Mexico},
    publisher = {Association for Computational Linguistics},
    url       = {https://aclanthology.org/2024.naacl-srw.4/},
    doi       = {10.18653/v1/2024.naacl-srw.4},
    pages     = {25--35},
    abstract  = {Critical error detection (CED) in machine translation is a task that aims to detect errors that significantly distort the intended meaning. However, the existing study of CED lacks explainability due to the absence of content addressing the reasons for catastrophic errors. To address this limitation, we propose Explainable CED, a dataset that introduces the attributes of error explanation and correction regarding critical errors. Considering the advantage of reducing time costs and mitigating human annotation bias, we leverage a large language model in the data construction process. To improve the quality of the dataset and mitigate hallucination, we compare responses from the model and introduce an additional data filtering method through feedback scoring. The experiment demonstrates that the dataset appropriately reflects a consistent explanation and revision for errors, validating the reliability of the dataset.},
}
Markdown (Informal)
[Explainable CED: A Dataset for Explainable Critical Error Detection in Machine Translation](https://aclanthology.org/2024.naacl-srw.4/) (Jung et al., NAACL 2024)
ACL