% INLG 2025 paper (ACL Anthology ID 2025.inlg-main.12).
% The url field uses the canonical Anthology address, not a temporary preview branch.
@inproceedings{wu-etal-2025-analysing,
  title     = {Analysing Reference Production of Large Language Models},
  author    = {Wu, Chengzhao and
               Chen, Guanyi and
               Same, Fahime and
               He, Tingting},
  editor    = {Flek, Lucie and
               Narayan, Shashi and
               Phương, L{\^e} Hồng and
               Pei, Jiahuan},
  booktitle = {Proceedings of the 18th International Natural Language Generation Conference},
  month     = oct,
  year      = {2025},
  address   = {Hanoi, Vietnam},
  publisher = {Association for Computational Linguistics},
  url       = {https://aclanthology.org/2025.inlg-main.12/},
  pages     = {182--194},
  abstract  = {This study investigates how large language models (LLMs) produce referring expressions (REs) and to what extent their behaviour aligns with human patterns. We evaluate LLM performance in two settings: slot filling, the conventional task of referring expression generation, where REs are generated within a fixed context, and language generation, where REs are analysed within fully generated texts. Using the WebNLG corpus, we assess how well LLMs capture human variation in reference production and analyse their behaviour by examining the influence of several factors known to affect human reference production, including referential form, syntactic position, recency, and discourse status. Our findings show that (1) task framing significantly affects LLMs' reference production; (2) while LLMs are sensitive to some of these factors, their referential behaviour consistently diverges from human use; and (3) larger model size does not necessarily yield more human-like variation. These results underscore key limitations in current LLMs' ability to replicate human referential choices.},
}
Markdown (Informal)
[Analysing Reference Production of Large Language Models](https://aclanthology.org/2025.inlg-main.12/) (Wu et al., INLG 2025)
ACL