% Conference paper record (inproceedings) for "TriPlay-RL", ACL 2026, Volume 1: Long Papers.
% Case-sensitive tokens in title/booktitle are protected as whole words so that
% sentence-casing styles keep them intact without mid-word brace groups.
% NOTE(review): url points at a preview/ingest host -- confirm the canonical
% Anthology URL (and add a doi, if one is assigned) once the volume is published.
% NOTE(review): address appears to hold the conference venue rather than the
% publisher's city; left unchanged -- confirm against the bibliography style in use.
@inproceedings{tan-etal-2026-triplay,
  title     = {{TriPlay-RL}: Tri-Role Self-Play Reinforcement Learning for {LLM} Safety Alignment},
  author    = {Tan, Zhewen and
               Yu, Wenhan and
               Si, Jianfeng and
               Liu, Tongxin and
               Guan, Kaiqi and
               Jin, Huiyan and
               Tao, Jiawen and
               Yuan, Xiaokun and
               Zhang, Xiangzheng and
               Ma, Duohe and
               Yang, Tong and
               Sun, Lin},
  editor    = {Liakata, Maria and
               Moreira, Viviane P. and
               Zhang, Jiajun and
               Jurgens, David},
  booktitle = {Proceedings of the 64th Annual Meeting of the {Association} for {Computational} {Linguistics} (Volume 1: Long Papers)},
  month     = jul,
  year      = {2026},
  address   = {San Diego, California, United States},
  publisher = {Association for Computational Linguistics},
  url       = {https://preview.aclanthology.org/ingest-acl/2026.acl-long.1216/},
  pages     = {26415--26429},
  isbn      = {979-8-89176-390-6},
}