% Step-KTO workshop paper, MathNLP 2025 proceedings (ACL Anthology id 2025.mathnlp-main.2).
% The url field uses the canonical aclanthology.org address; the original pointed at a
% temporary preview/ingestion build of the Anthology.
@inproceedings{lin-etal-2025-step,
  author    = {Lin, Yen-Ting and
               Jin, Di and
               Xu, Tengyu and
               Wu, Tianhao and
               Sukhbaatar, Sainbayar and
               Zhu, Chen and
               He, Yun and
               Chen, Yun-Nung and
               Weston, Jason E. and
               Tian, Yuandong and
               Rahnama, Arash and
               Wang, Sinong and
               Ma, Hao and
               Fang, Han},
  title     = {{Step-KTO}: Optimizing Mathematical Reasoning through Stepwise Binary Feedback},
  editor    = {Valentino, Marco and
               Ferreira, Deborah and
               Thayaparan, Mokanarangan and
               Ranaldi, Leonardo and
               Freitas, Andre},
  booktitle = {Proceedings of The 3rd Workshop on Mathematical Natural Language Processing ({MathNLP} 2025)},
  month     = nov,
  year      = {2025},
  address   = {Suzhou, China},
  publisher = {Association for Computational Linguistics},
  pages     = {15--33},
  isbn      = {979-8-89176-348-7},
  url       = {https://aclanthology.org/2025.mathnlp-main.2/},
}