% Workshop paper from the Slavic NLP 2025 proceedings (ACL Anthology export).
% NOTE(review): the url field points at a preview.aclanthology.org ingestion
% path; confirm whether a canonical Anthology URL and/or DOI should replace it.
@inproceedings{derner-batistic-2025-gender,
  author    = {Derner, Erik and
               Batisti{\v{c}}, Kristina},
  title     = {Gender Representation Bias Analysis in {LLM}-Generated {Czech} and {Slovenian} Texts},
  editor    = {Piskorski, Jakub and
               P{\v{r}}ib{\'a}{\v{n}}, Pavel and
               Nakov, Preslav and
               Yangarber, Roman and
               Marcinczuk, Michal},
  booktitle = {Proceedings of the 10th Workshop on Slavic Natural Language Processing (Slavic NLP 2025)},
  month     = jul,
  year      = {2025},
  address   = {Vienna, Austria},
  publisher = {Association for Computational Linguistics},
  pages     = {124--135},
  isbn      = {978-1-959429-57-9},
  url       = {https://preview.aclanthology.org/acl25-workshop-ingestion/2025.bsnlp-1.15/},
  abstract  = {Large language models (LLMs) often reflect social biases present in their training data, including imbalances in how different genders are represented. While most prior work has focused on English, gender representation bias remains underexplored in morphologically rich languages where grammatical gender is pervasive. We present a method for detecting and quantifying such bias in Czech and Slovenian, using LLMs to classify gendered person references in LLM-generated narratives. Applying this method to outputs from a range of models, we find substantial variation in gender balance. While some models produce near-equal proportions of male and female references, others exhibit strong male overrepresentation. Our findings highlight the need for fine-grained bias evaluation in under-represented languages and demonstrate the potential of LLM-based annotation in this space. We make our code and data publicly available.},
}
Markdown (Informal)
[Gender Representation Bias Analysis in LLM-Generated Czech and Slovenian Texts](https://preview.aclanthology.org/acl25-workshop-ingestion/2025.bsnlp-1.15/) (Derner & Batistič, BSNLP 2025)
ACL