% Conference paper in the Findings of ACL 2025 volume (pages 21865--21881).
% The url field points at the permanent ACL Anthology record for paper id
% 2025.findings-acl.1126, not at a temporary preview-branch build.
% NOTE(review): address holds the value exported with the record
% ("Vienna, Austria"); confirm whether the target style expects the
% publisher's city here instead.
@inproceedings{wang-etal-2025-adversarial,
  author    = {Wang, Yuanfu and Wang, Pengyu and Xi, Chenyang and Tang, Bo and
               Zhu, Junyi and Wei, Wenqiang and Chen, Chen and Yang, Chao and
               Zhang, Jingfeng and Lu, Chaochao and Niu, Yijun and Mao, Keming and
               Li, Zhiyu and Xiong, Feiyu and Hu, Jie and Yang, Mingchuan},
  title     = {Adversarial Preference Learning for Robust {LLM} Alignment},
  editor    = {Che, Wanxiang and Nabende, Joyce and Shutova, Ekaterina and
               Pilehvar, Mohammad Taher},
  booktitle = {Findings of the Association for Computational Linguistics: {ACL} 2025},
  month     = jul,
  year      = {2025},
  address   = {Vienna, Austria},
  publisher = {Association for Computational Linguistics},
  pages     = {21865--21881},
  isbn      = {979-8-89176-256-5},
  url       = {https://aclanthology.org/2025.findings-acl.1126/},
}