% ACL Anthology record 2024.findings-acl.338 (conference paper, Findings of ACL 2024).
@inproceedings{chen-etal-2024-improving,
  author    = {Chen, Zhipeng and Zhou, Kun and Zhao, Xin and Wan, Junchen and Zhang, Fuzheng and Zhang, Di and Wen, Ji-Rong},
  title     = {Improving Large Language Models via Fine-grained Reinforcement Learning with Minimum Editing Constraint},
  editor    = {Ku, Lun-Wei and Martins, Andre and Srikumar, Vivek},
  booktitle = {Findings of the Association for Computational Linguistics: {ACL} 2024},
  month     = aug,
  year      = {2024},
  address   = {Bangkok, Thailand},
  publisher = {Association for Computational Linguistics},
  pages     = {5694--5711},
  doi       = {10.18653/v1/2024.findings-acl.338},
  url       = {https://aclanthology.org/2024.findings-acl.338/},
}