@inproceedings{tehenan-etal-2025-mpta,
title = "{MPTA}: {M}ulti{T}ask Personalization Assessment",
author = "Tehenan, Matthieu and
Chamoun, Eric and
Vlachos, Andreas",
editor = "Christodoulopoulos, Christos and
Chakraborty, Tanmoy and
Rose, Carolyn and
Peng, Violet",
booktitle = "Findings of the Association for Computational Linguistics: EMNLP 2025",
month = nov,
year = "2025",
address = "Suzhou, China",
publisher = "Association for Computational Linguistics",
url = "https://preview.aclanthology.org/name-variant-enfa-fane/2025.findings-emnlp.640/",
doi = "10.18653/v1/2025.findings-emnlp.640",
pages = "11982--11992",
ISBN = "979-8-89176-335-7",
abstract = "Large language models are increasingly expected to adapt to individual users, reflecting differences in preferences, values, and communication styles. To evaluate whether models can serve diverse populations, we introduce MTPA, a benchmark that leverages large-scale survey data (WVS, EVS, GSS) to construct real, hyper-granular personas spanning demographics, beliefs, and values. Unlike prior benchmarks that rely on synthetic profiles or narrow trait prediction, MTPA conditions models on real personas and systematically tests their behavior across core alignment tasks. We show that persona conditioning exposes pluralistic misalignment: while aggregate metrics suggest models are truthful and safe, subgroup-specific evaluations reveal hidden pockets of degraded factuality, fairness disparities, and inconsistent value alignment. Alongside the benchmark, we release a dataset, toolkit, and baseline evaluations. MTPA is designed with extensibility and sustainability in mind: as the underlying survey datasets are regularly updated, MTPA supports regular integration of new populations and user traits."
}Markdown (Informal)
[MPTA: MultiTask Personalization Assessment](https://preview.aclanthology.org/name-variant-enfa-fane/2025.findings-emnlp.640/) (Tehenan et al., Findings 2025)
ACL
- Matthieu Tehenan, Eric Chamoun, and Andreas Vlachos. 2025. MPTA: MultiTask Personalization Assessment. In Findings of the Association for Computational Linguistics: EMNLP 2025, pages 11982–11992, Suzhou, China. Association for Computational Linguistics.