@inproceedings{farzi-etal-2026-sycophancy,
title = "Sycophancy Negatively Affects {LLM}-as-a-Judge in Conflict Evaluation",
author = "Farzi, Naghmeh and
Dietz, Laura and
Carton, Samuel",
editor = "Mille, Simon and
Gehrmann, Sebastian and
Schmidtov{\'a}, Patr{\'i}cia and
Du{\v{s}}ek, Ond{\v{r}}ej and
Fadaee, Marzieh and
Lo, Kyle and
Santus, Enrico and
Stanovsky, Gabriel",
booktitle = "Proceedings of the Fifth Workshop on Generation, Evaluation and Metrics ({GEM})",
month = jul,
year = "2026",
address = "San Diego, California, USA",
publisher = "Association for Computational Linguistics",
url = "https://preview.aclanthology.org/ingest-acl-workshops/2026.gem-main.45/",
pages = "490--501",
ISBN = "979-8-89176-423-1",
abstract = "LLM-as-Judge systems are increasingly used to generate labels and evaluate conversational data, yet their susceptibility to narrative framing remains underexplored. We study whether replacing one speaker{'}s username with the first-person identifier `Me' systematically biases model judgments independent of the underlying evidence. Using the Conversations Gone Awry corpus, we evaluate four LLMs across three judgment tasks (attack detection, attacker identification, and blame attribution), three perspective conditions, and two evidence visibility settings. Our results show that narrative perspective induces strong, task-dependent distortions, particularly in more subjective judgment tasks. We find that models systematically favor the narrator when a speaker is presented as `Me', reducing blame and responsibility attribution toward that speaker even when the underlying evidence is unchanged. These findings raise concerns about using LLMs to judge or moderate first-person conversational data."
}Markdown (Informal)
[Sycophancy Negatively Affects LLM-as-a-Judge in Conflict Evaluation](https://preview.aclanthology.org/ingest-acl-workshops/2026.gem-main.45/) (Farzi et al., GEM 2026)
ACL