@inproceedings{lee-etal-2026-inertia,
title = "Inertia in Moral and Value Judgments of Large Language Models",
author = "Lee, Bruce W. and
Lee, Yeongheon and
Cho, Hyunsoo",
editor = "Liakata, Maria and
Moreira, Viviane P. and
Zhang, Jiajun and
Jurgens, David",
booktitle = "Proceedings of the 64th Annual Meeting of the {A}ssociation for {C}omputational {L}inguistics (Volume 1: Long Papers)",
month = jul,
year = "2026",
address = "San Diego, California, United States",
publisher = "Association for Computational Linguistics",
url = "https://preview.aclanthology.org/ingest-acl/2026.acl-long.1246/",
pages = "27053--27075",
ISBN = "979-8-89176-390-6",
abstract = "Large Language Models (LLMs) behave non-deterministically, and prompting has become a common method for steering their outputs.A popular strategy is to assign a persona to the model to produce more varied, context-sensitive responses, similar to how responses vary across human individuals.Against the expectation that persona prompting yields a wide range of opinions, our experiments show that LLMs keep consistent value orientations.We observe a persistent inertia in their responses, where certain moral and value dimensions (especially harm avoidance and fairness) stay skewed in one direction across persona settings.To study this, we use role-play at scale, which pairs randomized persona prompts with a macro-level analysis of model outputs.Our results point to strong internal biases and value preferences in LLMs, which we call value orientation and inertia. These models warrant scrutiny and adjustment before use in applications where balanced outputs matter."
}Markdown (Informal)
[Inertia in Moral and Value Judgments of Large Language Models](https://preview.aclanthology.org/ingest-acl/2026.acl-long.1246/) (Lee et al., ACL 2026)
ACL
- Bruce W. Lee, Yeongheon Lee, and Hyunsoo Cho. 2026. Inertia in Moral and Value Judgments of Large Language Models. In Proceedings of the 64th Annual Meeting of the Association for Computational Linguistics (Volume 1: Long Papers), pages 27053–27075, San Diego, California, United States. Association for Computational Linguistics.