% ACL 2026 long paper (Anthology ID 2026.acl-long.1045).
% The url field uses the canonical aclanthology.org address instead of the
% temporary preview/ingest build the entry was exported from.
% NOTE(review): confirm the canonical page is live once the volume is published.
@inproceedings{yu-etal-2026-survey,
    title     = {A Survey of Reinforcement Learning for Large Language Models under Data Scarcity: Challenges and Solutions},
    author    = {Yu, Zhiyin and
                 Mou, Yuchen and
                 Yan, Juncheng and
                 Luo, Junyu and
                 Chen, Chunchun and
                 Wei, Xing and
                 Liu, Yunhui and
                 Sun, Hongru and
                 Zhang, Yuxing and
                 Xu, Jun and
                 Bian, Yatao and
                 Zhang, Ming and
                 Ye, Wei and
                 He, Tieke and
                 Yang, Jie and
                 Zheng, Guanjie and
                 Wu, Zhonghai and
                 Zhang, Bo and
                 Bai, Lei and
                 Luo, Xiao},
    editor    = {Liakata, Maria and
                 Moreira, Viviane P. and
                 Zhang, Jiajun and
                 Jurgens, David},
    booktitle = {Proceedings of the 64th Annual Meeting of the {Association} for {Computational} {Linguistics} (Volume 1: Long Papers)},
    month     = jul,
    year      = {2026},
    address   = {San Diego, California, United States},
    publisher = {Association for Computational Linguistics},
    url       = {https://aclanthology.org/2026.acl-long.1045/},
    pages     = {22823--22846},
    isbn      = {979-8-89176-390-6}
}