% ARGENT paper (Zhang et al.), GEM workshop proceedings 2025; ACL Anthology ID 2025.gem-1.8.
% The url field uses the canonical aclanthology.org address, not a temporary preview-branch build.
@inproceedings{zhang-etal-2025-argent,
  title     = {{ARGENT}: Automatic Reference-free Evaluation for Open-Ended Text Generation without Source Inputs},
  author    = {Zhang, Xinyue and
               Zecevic, Agathe and
               Zeki, Sebastian and
               Roberts, Angus},
  editor    = {Dhole, Kaustubh and
               Clinciu, Miruna},
  booktitle = {Proceedings of the Fourth Workshop on Generation, Evaluation and Metrics (GEM{\texttwosuperior})},
  month     = jul,
  year      = {2025},
  address   = {Vienna, Austria and virtual meeting},
  publisher = {Association for Computational Linguistics},
  url       = {https://aclanthology.org/2025.gem-1.8/},
  pages     = {82--98},
  isbn      = {979-8-89176-261-9},
  abstract  = {With increased accessibility of machine-generated texts, the need for their evaluation has also grown. There are broadly two types of text generation tasks. In open-ended generation tasks (OGTs), the model generates de novo text without any input on which to base it, such as story generation. In reflective generation tasks (RGTs), the model output is generated to reflect an input sequence, such as in machine translation. There are many studies on RGT evaluation, where the metrics typically compare one or more gold-standard references to the model output. Evaluation of OGTs has received less attention and is more challenging: since the task does not aim to reflect an input, there are usually no reference texts. In this paper, we propose a new perspective that unifies OGT evaluation with RGT evaluation, based on which we develop an automatic, reference-free generative text evaluation model (ARGENT), and review previous literature from this perspective. Our experiments demonstrate the effectiveness of these methods across informal, formal, and domain-specific texts. We conduct a meta-evaluation to compare existing and proposed metrics, finding that our approach aligns more closely with human judgement.},
}
Markdown (Informal)
[ARGENT: Automatic Reference-free Evaluation for Open-Ended Text Generation without Source Inputs](https://aclanthology.org/2025.gem-1.8/) (Zhang et al., GEM 2025)
ACL