% Conference paper entry; Anthology path in the url is 2026.findings-acl.841.
% Case-sensitive words in title/booktitle are protected with whole-word braces
% so sentence-casing styles keep them intact.
% NOTE(review): the url points at the Anthology preview/ingest host -- confirm
% whether a canonical aclanthology.org URL (or a DOI) should replace it.
@inproceedings{gu-etal-2026-qarl,
  title     = {{QaRL}: Rollout-Aligned Quantization-Aware {RL} for Fast and Stable Training under Training--Inference Mismatch},
  author    = {Gu, Hao and
               Wang, Hao and
               Liu, Jiacheng and
               Li, Lujun and
               Zhu, Qiyuan and
               Liu, Bei and
               Xu, Binxing and
               Wang, Lei and
               Yang, Xintong and
               Lin, Sida and
               Han, Sirui and
               Guo, Yike},
  editor    = {Liakata, Maria and
               Moreira, Viviane P. and
               Zhang, Jiajun and
               Jurgens, David},
  booktitle = {Findings of the {Association} for {Computational} {Linguistics}: {ACL} 2026},
  month     = jul,
  year      = {2026},
  address   = {San Diego, California, United States},
  publisher = {Association for Computational Linguistics},
  url       = {https://preview.aclanthology.org/ingest-acl/2026.findings-acl.841/},
  pages     = {17051--17064},
  isbn      = {979-8-89176-395-1},
}