% Conference paper from the ACL 2026 proceedings (Volume 1: Long Papers); the abstract introduces a method called FIGR.
@inproceedings{chen-etal-2026-figure,
  title     = {Figure It Out: Improve the Frontier of Reasoning with Executable Visual States},
  author    = {Chen, Meiqi and
               Meng, Fandong and
               Zhou, Jie},
  editor    = {Liakata, Maria and
               Moreira, Viviane P. and
               Zhang, Jiajun and
               Jurgens, David},
  booktitle = {Proceedings of the 64th Annual Meeting of the {A}ssociation for {C}omputational {L}inguistics (Volume 1: Long Papers)},
  month     = jul,
  year      = {2026},
  address   = {San Diego, California, United States},
  publisher = {Association for Computational Linguistics},
  url       = {https://preview.aclanthology.org/ingest-acl/2026.acl-long.1827/},
  pages     = {39375--39388},
  isbn      = {979-8-89176-390-6},
  abstract  = {Complex reasoning problems often involve implicit spatial and geometric relationships that are not explicitly encoded in text. While recent reasoning models perform well across many domains, purely text-based reasoning struggles to capture structural constraints in complex settings. In this paper, we introduce FIGR, which integrates executable visual construction into multi-turn reasoning via end-to-end reinforcement learning. Rather than relying solely on textual chains of thought, FIGR externalizes intermediate hypotheses by generating executable code that constructs diagrams within the reasoning loop. An adaptive reward mechanism selectively regulates when visual construction is invoked, enabling more consistent reasoning over latent global properties that are difficult to infer from text alone. Experiments on seven challenging mathematical benchmarks demonstrate that FIGR outperforms strong text-only chain-of-thought baselines, improving the base model by 13.12{\%} on AIME 2025 and 11.00{\%} on BeyondAIME. These results highlight the effectiveness of precise, controllable figure construction of FIGR in enhancing complex reasoning ability.},
}
Markdown (Informal)
[Figure It Out: Improve the Frontier of Reasoning with Executable Visual States](https://preview.aclanthology.org/ingest-acl/2026.acl-long.1827/) (Chen et al., ACL 2026)
ACL