@inproceedings{fazli-etal-2026-inject,
title = "Inject to Heal: Alleviating hallucination in {LVLM}s via Context Embedding Injection",
author = "Fazli, Mehrdad and
Wei, Bowen and
Zhu, Ziwei",
editor = "Liakata, Maria and
Moreira, Viviane P. and
Zhang, Jiajun and
Jurgens, David",
booktitle = "Findings of the {A}ssociation for {C}omputational {L}inguistics: {ACL} 2026",
month = jul,
year = "2026",
address = "San Diego, California, United States",
publisher = "Association for Computational Linguistics",
url = "https://preview.aclanthology.org/ingest-acl/2026.findings-acl.2048/",
pages = "41177--41193",
ISBN = "979-8-89176-395-1",
abstract = "Hallucinations{---}generating responses inconsistent with the visual input{---}remain a critical limitation of large vision-language models (LVLMs), especially in open-ended tasks such as image captioning and visual reasoning. In this work, we probe the layer-wise generation dynamics that drive hallucinations and propose a training-free mitigation strategy. Employing the Logit Lens, we examine how LVLMs construct next-token distributions across decoder layers, uncovering a pronounced commitment-depth gap: truthful tokens accumulate probability mass on their final candidates earlier than hallucinatory ones. Drawing on this discovery, we introduce Context Embedding injection (CEI), a lightweight method that harnesses the hidden state of the last input token{---}the context embedding{---}as a grounding signal to maintain visual fidelity throughout decoding and curb hallucinations. Evaluated on the CHAIR, AMBER, and MMHal-Bench benchmarks (with a maximum token length of 512), CEI outperforms state-of-the-art baselines across three LVLMs, with its dynamic variant yielding the lowest overall hallucination rates. By integrating novel mechanistic insights with a scalable intervention, this work advances the mitigation of hallucinations in LVLMs. Data and code are available at https://github.com/mehrdadfazli/CEI."
}Markdown (Informal)
[Inject to Heal: Alleviating hallucination in LVLMs via Context Embedding Injection](https://preview.aclanthology.org/ingest-acl/2026.findings-acl.2048/) (Fazli et al., Findings 2026)
ACL