@inproceedings{xiang-etal-2025-comparing,
title = "Comparing Moral Values in {W}estern {E}nglish-speaking societies and {LLM}s with Word Associations",
author = "Xiang, Chaoyi and
Liu, Chunhua and
De Deyne, Simon and
Frermann, Lea",
editor = "Che, Wanxiang and
Nabende, Joyce and
Shutova, Ekaterina and
Pilehvar, Mohammad Taher",
booktitle = "Proceedings of the 63rd Annual Meeting of the Association for Computational Linguistics (Volume 1: Long Papers)",
month = jul,
year = "2025",
address = "Vienna, Austria",
publisher = "Association for Computational Linguistics",
url = "https://preview.aclanthology.org/ingestion-acl-25/2025.acl-long.177/",
pages = "3521--3536",
ISBN = "979-8-89176-251-0",
abstract = "As the impact of large language models increases, understanding the moral values they encode becomes ever more important. Assessing moral values encoded in these models via direct prompting is challenging due to potential leakage of human norms into model training data, and their sensitivity to prompt formulation. Instead, we propose to use word associations, which have been shown to reflect moral reasoning in humans, as low-level underlying representations to obtain a more robust picture of LLMs' moral reasoning. We study moral differences in associations from western English-speaking communities and LLMs trained predominantly on English data. First, we create a large dataset of $\textit{LLM-generated}$ word associations, resembling an existing data set of $\textit{human}$ word associations. Next, we propose a novel method to propagate moral values based on seed words derived from Moral Foundation Theory through the human and LLM-generated association graphs. Finally, we compare the resulting moral representations, highlighting detailed but systematic differences between moral values emerging from English speakers and LLM associations."
}
Markdown (Informal)
[Comparing Moral Values in Western English-speaking societies and LLMs with Word Associations](https://preview.aclanthology.org/ingestion-acl-25/2025.acl-long.177/) (Xiang et al., ACL 2025)
ACL