@inproceedings{barreto-jana-2025-disimprovement,
title = "This is not a Disimprovement: Improving Negation Reasoning in Large Language Models via Prompt Engineering",
author = "Barreto, Joshua Jose Dias and
Jana, Abhik",
editor = "Christodoulopoulos, Christos and
Chakraborty, Tanmoy and
Rose, Carolyn and
Peng, Violet",
booktitle = "Findings of the Association for Computational Linguistics: EMNLP 2025",
month = nov,
year = "2025",
address = "Suzhou, China",
publisher = "Association for Computational Linguistics",
url = "https://preview.aclanthology.org/author-page-yu-wang-polytechnic/2025.findings-emnlp.761/",
doi = "10.18653/v1/2025.findings-emnlp.761",
pages = "14149--14156",
ISBN = "979-8-89176-335-7",
abstract = "Negation reasoning remains a challenge for large language models (LLMs), often causing incorrect interpretations of negated statements. In this study, we analyze various LLMs for their handling of negation and propose two genres of prompts (*Warning-based* and *Persona-based*), which improve overall absolute accuracy by up to 3.17{\%} and distractor negation accuracy by up to 25.14{\%} over most competitive baselines. Next, we assess the robustness of LLMs by reordering prompts while preserving meaning, observing instability linked to positional encoding schemes. Further, we introduce a negative token attention score (NTAS) to quantify attention to negation words. From the comprehensive analysis, we point out that within a specific LLM family, the performance of a model (measured using accuracy) correlates more with NTAS than with model size. The code is publicly available: [https://github.com/Joshua-Dias-Barreto/This-is-not-a-Disimprovement](https://github.com/Joshua-Dias-Barreto/This-is-not-a-Disimprovement)"
}
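The abstract introduces NTAS only at a high level; the exact definition is in the paper and the linked repository. The sketch below shows one plausible way such a score could be computed, measuring how much attention mass a model directs at negation tokens. Everything here, the model choice (`gpt2`), the negation word list, and the averaging scheme, is an assumption for illustration, not the authors' formula.

```python
# Minimal illustrative sketch, NOT the paper's implementation: NTAS is
# described only as a score quantifying attention to negation words, so
# the variant below (mean attention mass directed at negation tokens,
# averaged over layers, heads, and positions) is an assumption.
import torch
from transformers import AutoModel, AutoTokenizer

# Hypothetical negation list; the paper's actual lexicon may differ.
NEGATION_WORDS = {"not", "no", "never", "none", "nobody",
                  "nothing", "neither", "nor"}

def negation_attention_score(text: str, model_name: str = "gpt2") -> float:
    tokenizer = AutoTokenizer.from_pretrained(model_name)
    model = AutoModel.from_pretrained(model_name, output_attentions=True)
    model.eval()

    enc = tokenizer(text, return_tensors="pt")
    with torch.no_grad():
        out = model(**enc)

    # out.attentions: one (batch, heads, seq, seq) tensor per layer.
    attn = torch.stack(out.attentions).squeeze(1)  # (layers, heads, seq, seq)

    # Strip BPE/SentencePiece prefixes ("Ġ", "▁") before matching words.
    tokens = tokenizer.convert_ids_to_tokens(enc["input_ids"][0])
    neg_idx = [i for i, tok in enumerate(tokens)
               if tok.lstrip("Ġ▁").lower() in NEGATION_WORDS]
    if not neg_idx:
        return 0.0

    # Attention mass each position sends to negation tokens, then a global mean.
    mass_to_negation = attn[..., neg_idx].sum(dim=-1)  # (layers, heads, seq)
    return mass_to_negation.mean().item()

print(negation_attention_score("This is not a disimprovement."))
```

Comparing such a score across models within one family, alongside their accuracy on negation benchmarks, is the kind of analysis behind the abstract's claim that accuracy tracks NTAS more closely than model size.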