% Survey paper in the ACL 2026 main proceedings (Volume 1: Long Papers).
% NOTE(review): the url was normalized from the preview.aclanthology.org
% staging host (path ingest-acl/2026.acl-long.1045/) to the canonical
% aclanthology.org form -- confirm it resolves once the volume is published.
% The address field holds the conference venue, as in ACL Anthology exports.
@inproceedings{yu-etal-2026-survey,
  author    = {Yu, Zhiyin and Mou, Yuchen and Yan, Juncheng and Luo, Junyu and
               Chen, Chunchun and Wei, Xing and Liu, Yunhui and Sun, Hongru and
               Zhang, Yuxing and Xu, Jun and Bian, Yatao and Zhang, Ming and
               Ye, Wei and He, Tieke and Yang, Jie and Zheng, Guanjie and
               Wu, Zhonghai and Zhang, Bo and Bai, Lei and Luo, Xiao},
  title     = {A Survey of Reinforcement Learning for Large Language Models under Data Scarcity: Challenges and Solutions},
  editor    = {Liakata, Maria and Moreira, Viviane P. and Zhang, Jiajun and Jurgens, David},
  booktitle = {Proceedings of the 64th Annual Meeting of the {Association} for {Computational} {Linguistics} (Volume 1: Long Papers)},
  month     = jul,
  year      = {2026},
  address   = {San Diego, California, United States},
  publisher = {Association for Computational Linguistics},
  pages     = {22823--22846},
  url       = {https://aclanthology.org/2026.acl-long.1045/},
  isbn      = {979-8-89176-390-6},
}