@inproceedings{zhao-etal-2024-sego,
title = "{SEGO}: Sequential Subgoal Optimization for Mathematical Problem-Solving",
author = "Zhao, Xueliang and
Huang, Xinting and
Bi, Wei and
Kong, Lingpeng",
editor = "Ku, Lun-Wei and
Martins, Andre and
Srikumar, Vivek",
booktitle = "Proceedings of the 62nd Annual Meeting of the Association for Computational Linguistics (Volume 1: Long Papers)",
month = aug,
year = "2024",
address = "Bangkok, Thailand",
publisher = "Association for Computational Linguistics",
url = "https://preview.aclanthology.org/fix-sig-urls/2024.acl-long.407/",
doi = "10.18653/v1/2024.acl-long.407",
pages = "7544--7565",
abstract = "Large Language Models (LLMs) have driven substantial progress in artificial intelligence in recent years, exhibiting impressive capabilities across a wide range of tasks, including mathematical problem-solving. Inspired by the success of subgoal-based methods, we propose a novel framework called \textbf{SE}quential sub\textbf{G}oal \textbf{O}ptimization (SEGO) to enhance LLMs' ability to solve mathematical problems. By establishing a connection between the subgoal breakdown process and the probability of solving problems, SEGO aims to identify better subgoals with theoretical guarantees. Addressing the challenge of identifying suitable subgoals in a large solution space, our framework generates problem-specific subgoals and adjusts them according to carefully designed criteria. Incorporating these optimized subgoals into the policy model training leads to significant improvements in problem-solving performance. We validate SEGO{'}s efficacy through experiments on two benchmarks, GSM8K and MATH, where our approach outperforms existing methods, highlighting the potential of SEGO in AI-driven mathematical problem-solving."
}
Markdown (Informal)
[SEGO: Sequential Subgoal Optimization for Mathematical Problem-Solving](https://preview.aclanthology.org/fix-sig-urls/2024.acl-long.407/) (Zhao et al., ACL 2024)
ACL