@comment{
  EACL 2026 long paper (Volume 1), record exported from the ACL Anthology.
  address holds the conference venue as exported, not a publisher city.
  NOTE(review): url points at the Anthology preview/ingest host; presumably it
  should be swapped for the canonical aclanthology.org URL once the volume is
  published -- confirm before relying on it.
}
@inproceedings{holtermann-etal-2026-sos,
  title     = {{SoS}: Analysis of Surface over Semantics in Multilingual Text-To-Image Generation},
  author    = {Holtermann, Carolin and
               Schneider, Florian and
               Lauscher, Anne},
  editor    = {Demberg, Vera and
               Inui, Kentaro and
               Marquez, Llu{\'\i}s},
  booktitle = {Proceedings of the 19th Conference of the {European} Chapter of the {Association} for {Computational} {Linguistics} (Volume 1: Long Papers)},
  month     = mar,
  year      = {2026},
  address   = {Rabat, Morocco},
  publisher = {Association for Computational Linguistics},
  url       = {https://preview.aclanthology.org/ingest-eacl/2026.eacl-long.185/},
  pages     = {3955--3995},
  isbn      = {979-8-89176-380-7},
  abstract  = {Text-to-image (T2I) models are increasingly employed by users worldwide. However, prior research has pointed to the high sensitivity of T2I towards particular input languages --- when faced with languages other than English (i.e., different surface forms of the same prompt), T2I models often produce culturally stereotypical depictions, prioritizing the surface over the prompt's semantics. Yet a comprehensive analysis of this behavior, which we dub Surface-over-Semantics (SoS), is missing. We present the first analysis of T2I models' SoS tendencies. To this end, we create a set of prompts covering 171 cultural identities, translated into 14 languages, and use it to prompt seven T2I models. To quantify SoS tendencies across models, languages, and cultures, we introduce a novel measure and analyze how the tendencies we identify manifest visually. We show that all but one model exhibit strong surface-level tendency in at least two languages, with this effect intensifying across the layers of T2I text encoders. Moreover, these surface tendencies frequently correlate with stereotypical visual depictions.},
}
Markdown (Informal)
[SoS: Analysis of Surface over Semantics in Multilingual Text-To-Image Generation](https://preview.aclanthology.org/ingest-eacl/2026.eacl-long.185/) (Holtermann et al., EACL 2026)
ACL