@inproceedings{lee-etal-2025-vision,
title = "Are Vision-Language Models Safe in the Wild? A Meme-Based Benchmark Study",
author = "Lee, DongGeon and
Jang, Joonwon and
Jeong, Jihae and
Yu, Hwanjo",
editor = "Christodoulopoulos, Christos and
Chakraborty, Tanmoy and
Rose, Carolyn and
Peng, Violet",
booktitle = "Proceedings of the 2025 Conference on Empirical Methods in Natural Language Processing",
month = nov,
year = "2025",
address = "Suzhou, China",
publisher = "Association for Computational Linguistics",
url = "https://preview.aclanthology.org/ingest-emnlp/2025.emnlp-main.1555/",
pages = "30533--30576",
ISBN = "979-8-89176-332-6",
abstract = "Rapid deployment of vision-language models (VLMs) magnifies safety risks, yet most evaluations rely on artificial images. This study asks: How safe are current VLMs when confronted with meme images that ordinary users share? To investigate this question, we introduce MemeSafetyBench, a 50,430-instance benchmark pairing real meme images with both harmful and benign instructions. Using a comprehensive safety taxonomy and LLM-based instruction generation, we assess multiple VLMs across single and multi-turn interactions. We investigate how real-world memes influence harmful outputs, the mitigating effects of conversational context, and the relationship between model scale and safety metrics. Our findings demonstrate that VLMs are more vulnerable to meme-based harmful prompts than to synthetic or typographic images. Memes significantly increase harmful responses and decrease refusals compared to text-only inputs. Though multi-turn interactions provide partial mitigation, elevated vulnerability persists. These results highlight the need for ecologically valid evaluations and stronger safety mechanisms. MemeSafetyBench is publicly available at https://github.com/oneonlee/Meme-Safety-Bench."
}Markdown (Informal)
[Are Vision-Language Models Safe in the Wild? A Meme-Based Benchmark Study](https://preview.aclanthology.org/ingest-emnlp/2025.emnlp-main.1555/) (Lee et al., EMNLP 2025)
ACL