% Conference paper in the DepLing / SyntaxFest 2025 proceedings (ACL Anthology ID 2025.depling-1.4).
% The url field holds the canonical Anthology address, not a preview-branch build.
% NOTE(review): address is "Ljubljana, Slovenia", which looks like the conference venue
% rather than the publisher's city; kept as exported -- confirm against the target style.
@inproceedings{taboas-garcia-wanner-2025-assessing,
  title     = {Assessing the Agreement Competence of Large Language Models},
  author    = {T{\'a}boas Garc{\'i}a, Alba and
               Wanner, Leo},
  editor    = {Haji{\v{c}}ov{\'a}, Eva and
               Kahane, Sylvain},
  booktitle = {Proceedings of the Eighth International Conference on Dependency Linguistics (Depling, SyntaxFest 2025)},
  month     = aug,
  year      = {2025},
  address   = {Ljubljana, Slovenia},
  publisher = {Association for Computational Linguistics},
  url       = {https://aclanthology.org/2025.depling-1.4/},
  pages     = {36--53},
  isbn      = {979-8-89176-290-9},
  abstract  = {While the competence of LLMs to cope with agreement constraints has been widely tested in English, only a very limited number of works deals with morphologically rich(er) languages. In this work, we experiment with 25 mono- and multilingual LLMs, applying them to a collection of more than 5,000 test examples that cover the main agreement phenomena in three Romance languages (Italian, Portuguese, and Spanish) and one Slavic Language (Russian). We identify which of the agreement phenomena are most difficult for which models and challenge some common assumptions of what makes a good model. The test suites into which the test examples are organized are openly available and can be easily adapted to other agreement phenomena and other languages for further research.},
}
Markdown (Informal)
[Assessing the Agreement Competence of Large Language Models](https://aclanthology.org/2025.depling-1.4/) (Táboas García & Wanner, DepLing-SyntaxFest 2025)
ACL