% NAACL 2025 (Volume 1: Long Papers), ACL Anthology ID 2025.naacl-long.573.
% The url field uses the stable aclanthology.org address, not a preview build.
@inproceedings{yu-etal-2025-self,
  title     = {Self-Generated Critiques Boost Reward Modeling for Language Models},
  author    = {Yu, Yue and Chen, Zhengxing and Zhang, Aston and Tan, Liang and
               Zhu, Chenguang and Pang, Richard Yuanzhe and Qian, Yundi and
               Wang, Xuewei and Gururangan, Suchin and Zhang, Chao and
               Kambadur, Melanie and Mahajan, Dhruv and Hou, Rui},
  editor    = {Chiruzzo, Luis and Ritter, Alan and Wang, Lu},
  booktitle = {Proceedings of the 2025 Conference of the Nations of the Americas Chapter of the Association for Computational Linguistics: Human Language Technologies (Volume 1: Long Papers)},
  month     = apr,
  year      = {2025},
  address   = {Albuquerque, New Mexico},
  publisher = {Association for Computational Linguistics},
  url       = {https://aclanthology.org/2025.naacl-long.573/},
  pages     = {11499--11514},
  isbn      = {979-8-89176-189-6},
}