% Conference paper entry: "Rethinking Assessments of Prompt Injection Attacks"
% (Cui, Wu, Backes, Zhang), Findings of ACL 2026, pages 23773--23799.
% NOTE(review): the url field points at a preview host
% (preview.aclanthology.org/ingest-acl) -- confirm whether it should be
% replaced by a canonical (non-preview) URL or a DOI.
@inproceedings{cui-etal-2026-rethinking,
  title     = {Rethinking Assessments of Prompt Injection Attacks},
  author    = {Cui, Chi and
               Wu, Yixin and
               Backes, Michael and
               Zhang, Yang},
  editor    = {Liakata, Maria and
               Moreira, Viviane P. and
               Zhang, Jiajun and
               Jurgens, David},
  booktitle = {Findings of the {Association} for {Computational} {Linguistics}: {ACL} 2026},
  month     = jul,
  year      = {2026},
  address   = {San Diego, California, United States},
  publisher = {Association for Computational Linguistics},
  url       = {https://preview.aclanthology.org/ingest-acl/2026.findings-acl.1191/},
  pages     = {23773--23799},
  isbn      = {979-8-89176-395-1},
  abstract  = {Prompt injection attacks are recognized as one of the primary risks faced by LLM-integrated applications in recent years. However, common evaluation frameworks remain insufficient, lacking comprehensiveness and real-world relevance. To bridge this gap, we revisit the common evaluation framework and conduct an extensive evaluation across eight different evaluation settings, including 37 real-world applications, 185 injected tasks, 21 attack instructions, and a total of 143,745 queries. The evaluation highlights several findings. For example, real-world applications are more vulnerable to prompt injection attacks compared to those used in research settings. While complex attack instructions are more sophisticated, they are less effective than simple attack instructions. We further conduct an assessment of both prompt-level and model-level defense mechanisms and highlight their limitations in real-world applications. By exploring more diverse scenarios across different dimensions, our framework provides a solid foundation for assessing vulnerabilities in LLM-integrated applications and evaluating the efficacy of defensive strategies.},
}
Markdown (Informal)
[Rethinking Assessments of Prompt Injection Attacks](https://preview.aclanthology.org/ingest-acl/2026.findings-acl.1191/) (Cui et al., Findings 2026)
ACL
- Chi Cui, Yixin Wu, Michael Backes, and Yang Zhang. 2026. Rethinking Assessments of Prompt Injection Attacks. In Findings of the Association for Computational Linguistics: ACL 2026, pages 23773–23799, San Diego, California, United States. Association for Computational Linguistics.