@inproceedings{fridriksdottir-einarsson-2024-gendered,
title = "Gendered Grammar or Ingrained Bias? Exploring Gender Bias in {I}celandic Language Models",
author = "Fri{\dh}riksd{\'o}ttir, Steinunn Rut and
Einarsson, Hafsteinn",
editor = "Calzolari, Nicoletta and
Kan, Min-Yen and
Hoste, Veronique and
Lenci, Alessandro and
Sakti, Sakriani and
Xue, Nianwen",
booktitle = "Proceedings of the 2024 Joint International Conference on Computational Linguistics, Language Resources and Evaluation (LREC-COLING 2024)",
month = may,
year = "2024",
address = "Torino, Italia",
publisher = "ELRA and ICCL",
url = "https://preview.aclanthology.org/add-emnlp-2024-awards/2024.lrec-main.671/",
pages = "7596--7610",
abstract = "Large language models, trained on vast datasets, exhibit increased output quality in proportion to the amount of data that is used to train them. This data-driven learning process has brought forth a pressing issue where these models may not only reflect but also amplify gender bias, racism, religious prejudice, and queerphobia present in their training data that may not always be recent. This study explores gender bias in language models trained on Icelandic, focusing on occupation-related terms. Icelandic is a highly grammatically gendered language that favors the masculine when referring to groups of people with indeterminable genders. Our aim is to explore whether language models merely mirror gender distributions within the corresponding professions or if they exhibit biases tied to their grammatical genders. Results indicate a significant overall predisposition towards the masculine but specific occupation terms consistently lean toward a particular gender, indicating complex interplays of societal and linguistic influences."
}
Markdown (Informal)
[Gendered Grammar or Ingrained Bias? Exploring Gender Bias in Icelandic Language Models](https://preview.aclanthology.org/add-emnlp-2024-awards/2024.lrec-main.671/) (Friðriksdóttir & Einarsson, LREC-COLING 2024)
ACL