% ACL 2025 long paper, Anthology ID 2025.acl-long.1594.
% The url field uses the canonical Anthology address rather than the
% temporary ingestion-preview host, which is not a stable citation target.
@inproceedings{wu-etal-2025-socialcc,
  author    = {Wu, Jincenzi and
               Lian, Jianxun and
               Wang, Dingdong and
               Meng, Helen M.},
  title     = {{SocialCC}: Interactive Evaluation for Cultural Competence in Language Agents},
  editor    = {Che, Wanxiang and
               Nabende, Joyce and
               Shutova, Ekaterina and
               Pilehvar, Mohammad Taher},
  booktitle = {Proceedings of the 63rd Annual Meeting of the Association for Computational Linguistics (Volume 1: Long Papers)},
  month     = jul,
  year      = {2025},
  address   = {Vienna, Austria},
  publisher = {Association for Computational Linguistics},
  pages     = {33242--33271},
  isbn      = {979-8-89176-251-0},
  url       = {https://aclanthology.org/2025.acl-long.1594/},
  abstract  = {Large Language Models (LLMs) are increasingly deployed worldwide, yet their ability to navigate cultural nuances remains underexplored. Misinterpreting cultural content can lead to AI-generated responses that are offensive or inappropriate, limiting their usability in global applications such as customer service, diplomatic communication, and online education. While prior research has evaluated cultural knowledge of LLMs, existing benchmarks fail to assess dynamic cultural competence---the ability to apply cultural knowledge effectively in real-world interactions. To address this gap, we introduce SocialDuolingo, a novel benchmark designed to evaluate cultural competence through multi-turn interactive intercultural scenarios. It comprises 3,060 human-written scenarios spanning 60 countries across six continents. Through extensive experiments on eight prominent LLMs, our findings reveal a significant gap between the cultural knowledge stored in these models and their ability to apply it effectively in cross-cultural communication.},
}
Markdown (Informal)
[SocialCC: Interactive Evaluation for Cultural Competence in Language Agents](https://aclanthology.org/2025.acl-long.1594/) (Wu et al., ACL 2025)
ACL