% EMNLP 2025 main-conference paper (ACL Anthology ID 2025.emnlp-main.1742).
% The url field uses the canonical Anthology address, not a branch-preview host.
% The abstract is reproduced verbatim from the published record.
@inproceedings{kurfali-2025-conflicting,
  title     = {Conflicting Needles in a Haystack: How {LLMs} behave when faced with contradictory information},
  author    = {Kurfali, Murathan and
               {\"O}stling, Robert},
  editor    = {Christodoulopoulos, Christos and
               Chakraborty, Tanmoy and
               Rose, Carolyn and
               Peng, Violet},
  booktitle = {Proceedings of the 2025 Conference on Empirical Methods in Natural Language Processing},
  month     = nov,
  year      = {2025},
  address   = {Suzhou, China},
  publisher = {Association for Computational Linguistics},
  url       = {https://aclanthology.org/2025.emnlp-main.1742/},
  doi       = {10.18653/v1/2025.emnlp-main.1742},
  pages     = {34349--34364},
  isbn      = {979-8-89176-332-6},
  abstract  = {Large Language Models (LLMs) have demonstrated an impressive ability to retrieve and summarize complex information, but their reliability in conflicting contexts remains poorly understood. We introduce an adversarial extension of the Needle-in-a-Haystack framework in which three mutually exclusive ``needles'' are embedded within long documents. By systematically manipulating factors such as position, repetition, layout, and domain relevance, we evaluate how LLMs handle contradictions. We find that models almost always fail to signal uncertainty and instead confidently select a single answer, exhibiting strong and consistent biases toward repetition, recency, and particular surface forms. We further analyze whether these patterns persist across model families and sizes, and we evaluate both probability-based and generation-based retrieval. Our framework highlights critical limitations in the robustness of current LLMs{---}including commercial systems{---}to contradiction. These limitations reveal potential shortcomings in RAG systems' ability to handle noisy or manipulated inputs and exposes risks for deployment in high-stakes applications.},
}
Markdown (Informal)
[Conflicting Needles in a Haystack: How LLMs behave when faced with contradictory information](https://aclanthology.org/2025.emnlp-main.1742/) (Kurfali & Östling, EMNLP 2025)
ACL