@inproceedings{ortu-etal-2026-seeing,
title = "When Seeing Overrides Knowing: Disentangling Knowledge Conflicts in Vision-Language Models",
author = "Ortu, Francesco and
Jin, Zhijing and
Doimo, Diego and
Cazzaniga, Alberto",
editor = "Liakata, Maria and
Moreira, Viviane P. and
Zhang, Jiajun and
Jurgens, David",
booktitle = "Proceedings of the 64th Annual Meeting of the {A}ssociation for {C}omputational {L}inguistics (Volume 1: Long Papers)",
month = jul,
year = "2026",
address = "San Diego, California, United States",
publisher = "Association for Computational Linguistics",
url = "https://preview.aclanthology.org/ingest-acl/2026.acl-long.642/",
pages = "14109--14130",
ISBN = "979-8-89176-390-6",
abstract = "Vision-language models (VLMs) increasingly combine visual and textual information to perform complex tasks. However, conflicts between their internal knowledge and external visual input can lead to hallucinations and unreliable predictions. In this work, we investigate the mechanisms that VLMs use to resolve cross-modal conflicts by introducing WHOOPS-AHA!, a dataset of multimodal counterfactual queries that deliberately contradict internal commonsense knowledge. Through logit inspection, we identify a small set of attention heads that mediate this conflict. By intervening in these heads, we can steer the model towards its internal parametric knowledge or the visual information. Our results show that attention patterns on these heads effectively locate image regions that influence visual overrides, providing a more precise attribution compared to gradient-based methods."
}Markdown (Informal)
[When Seeing Overrides Knowing: Disentangling Knowledge Conflicts in Vision-Language Models](https://preview.aclanthology.org/ingest-acl/2026.acl-long.642/) (Ortu et al., ACL 2026)
ACL