@inproceedings{belz-thomson-2023-2023,
  title     = {The 2023 {ReproNLP} Shared Task on Reproducibility of Evaluations in {NLP}: Overview and Results},
  author    = {Belz, Anya and
               Thomson, Craig},
  editor    = {Belz, Anya and
               Popovi{\'c}, Maja and
               Reiter, Ehud and
               Thomson, Craig and
               Sedoc, Jo{\~a}o},
  booktitle = {Proceedings of the 3rd Workshop on Human Evaluation of {NLP} Systems},
  month     = sep,
  year      = {2023},
  address   = {Varna, Bulgaria},
  publisher = {INCOMA Ltd., Shoumen, Bulgaria},
  url       = {https://preview.aclanthology.org/jlcl-multiple-ingestion/2023.humeval-1.4/},
  pages     = {35--48},
  abstract  = {This paper presents an overview of, and the results from, the 2023 Shared Task on Reproducibility of Evaluations in NLP (ReproNLP'23), following on from two previous shared tasks on reproducibility of evaluations in NLG, ReproGen'21 and ReproGen'22. This shared task series forms part of an ongoing research programme designed to develop theory and practice of reproducibility assessment in NLP and machine learning, all against a background of an interest in reproducibility that continues to grow in the two fields. This paper describes the ReproNLP'23 shared task, summarises results from the reproduction studies submitted, and provides comparative analysis of the results.},
}
Markdown (Informal)
[The 2023 ReproNLP Shared Task on Reproducibility of Evaluations in NLP: Overview and Results](https://preview.aclanthology.org/jlcl-multiple-ingestion/2023.humeval-1.4/) (Belz & Thomson, HumEval 2023)
ACL