% Ali et al. (2026): paper in the proceedings of the GEM workshop, pp. 990--998.
% NOTE(review): the url field points at a preview.aclanthology.org ingest branch,
% which looks like a staging address -- confirm and switch to the permanent URL
% once it is available.
@inproceedings{ali-etal-2026-reference,
  title     = {Reference Games as a Testbed for the Alignment of Model Uncertainty and Clarification Requests},
  author    = {Ali, Manar and
               Sieker, Judith and
               Zarrie{\ss}, Sina and
               Buschmeier, Hendrik},
  editor    = {Mille, Simon and
               Gehrmann, Sebastian and
               Schmidtov{\'a}, Patr{\'i}cia and
               Du{\v{s}}ek, Ond{\v{r}}ej and
               Fadaee, Marzieh and
               Lo, Kyle and
               Santus, Enrico and
               Stanovsky, Gabriel},
  booktitle = {Proceedings of the Fifth Workshop on Generation, Evaluation and Metrics ({GEM})},
  month     = jul,
  year      = {2026},
  address   = {San Diego, California, USA},
  publisher = {Association for Computational Linguistics},
  url       = {https://preview.aclanthology.org/ingest-acl-workshops/2026.gem-main.76/},
  pages     = {990--998},
  isbn      = {979-8-89176-423-1},
  abstract  = {In human conversation, both interlocutors play an active role in maintaining mutual understanding. When listeners are uncertain about what speakers mean, for example, they can request clarification. It is an open question for language models whether they can assume a similar listener role, recognizing and expressing their own uncertainty through clarification. We argue that reference games are a suitable testbed to approach this question as they are controlled, self-contained, and make clarification needs explicit and measurable. To test this, we evaluate three vision-language models comparing a baseline reference resolution task to an experiment where the models are instructed to request clarification when uncertain. The results suggest that even in such simple tasks, models often struggle to recognize internal uncertainty and translate it into adequate clarification behavior. This demonstrates the value of reference games as testbeds for interaction qualities of (vision and) language models.},
}
Markdown (Informal)
[Reference Games as a Testbed for the Alignment of Model Uncertainty and Clarification Requests](https://preview.aclanthology.org/ingest-acl-workshops/2026.gem-main.76/) (Ali et al., GEM 2026)
ACL