% Conference paper from the Findings of ACL 2025 volume.
% The url field uses the canonical aclanthology.org landing page; the
% preview.aclanthology.org host is a staging build and is not a stable link.
@inproceedings{chen-etal-2025-better-process,
  author    = {Chen, Wenxiang and He, Wei and Xi, Zhiheng and Guo, Honglin and Hong, Boyang and Zhang, Jiazheng and Li, Nijun and Gui, Tao and Li, Yun and Zhang, Qi and Huang, Xuanjing},
  title     = {Better Process Supervision with Bi-directional Rewarding Signals},
  editor    = {Che, Wanxiang and Nabende, Joyce and Shutova, Ekaterina and Pilehvar, Mohammad Taher},
  booktitle = {Findings of the Association for Computational Linguistics: {ACL} 2025},
  month     = jul,
  year      = {2025},
  address   = {Vienna, Austria},
  publisher = {Association for Computational Linguistics},
  pages     = {14471--14485},
  isbn      = {979-8-89176-256-5},
  url       = {https://aclanthology.org/2025.findings-acl.747/},
}