@inproceedings{lin-etal-2026-safo,
title = "{SAFO}: Stable Adaptive Fairness Optimization for {LLM}-Based Social Survey Simulation",
author = "Lin, Chenxi and
Jiang, Zhuoren and
Song, Kaisong and
Wu, Yiquan",
editor = "Liakata, Maria and
Moreira, Viviane P. and
Zhang, Jiajun and
Jurgens, David",
booktitle = "Proceedings of the 64th Annual Meeting of the {A}ssociation for {C}omputational {L}inguistics (Volume 1: Long Papers)",
month = jul,
year = "2026",
address = "San Diego, California, United States",
publisher = "Association for Computational Linguistics",
url = "https://preview.aclanthology.org/ingest-acl/2026.acl-long.1458/",
pages = "31626--31654",
ISBN = "979-8-89176-390-6",
abstract = "Ensuring fairness in social survey simulation is critical, as biased outputs can misrepresent underrepresented groups. This issue is growing as large language models (LLMs) are increasingly used for this task. However, standard fine-tuning based on Empirical Risk Minimization (ERM) often under-optimizes minority groups, causing substantial subgroup disparities. Distributionally robust Optimization (DRO) methods reduce worst-case errors, but their strict worst-case selection can lead to noisy and unstable optimization under demographic sparsity. These issues create intertwined challenges for fairness, convergence and stability. We propose SAFO, a dynamic utility{--}fairness optimization framework for LLM-based survey simulation that explicitly targets both fairness and training stability. SAFO combines (i) an Optimizer that preserves mean-loss utility, (ii) an Adversary that performs temperature-controlled, EMA-smoothed and loss-driven group reweighting, and (iii) a Nash-inspired Regulator that adaptively adjusts the utility{--}fairness trade-off by tracking weak-group gains and collateral utility damages. Experiments on three large-scale survey datasets from China, the U.S., and Europe show that SAFO consistently improves minority performance and social-welfare metrics. It reduces worst-group gaps by up to 12.7{\%}, maintains overall accuracy with a mean change of less than 0.3{\%} and lowers variance across random seeds. Our code is available at https://github.com/PiLab-ZJU/SAFO."
}Markdown (Informal)
[SAFO: Stable Adaptive Fairness Optimization for LLM-Based Social Survey Simulation](https://preview.aclanthology.org/ingest-acl/2026.acl-long.1458/) (Lin et al., ACL 2026)
ACL