% Wang et al., INREACT -- Findings of EMNLP 2025 (ACL Anthology ID 2025.findings-emnlp.486).
% The url field uses the canonical aclanthology.org address rather than a preview-branch mirror.
@inproceedings{wang-etal-2025-inreact,
  title     = {{INREACT}: An Inspire-Then-Reinforce Training Framework For Multimodal {GUI} Agent},
  author    = {Wang, Yuanlei and
               Zhang, Liuzhou and
               Luo, Haohao and
               Shen, Ying},
  editor    = {Christodoulopoulos, Christos and
               Chakraborty, Tanmoy and
               Rose, Carolyn and
               Peng, Violet},
  booktitle = {Findings of the Association for Computational Linguistics: EMNLP 2025},
  month     = nov,
  year      = {2025},
  address   = {Suzhou, China},
  publisher = {Association for Computational Linguistics},
  url       = {https://aclanthology.org/2025.findings-emnlp.486/},
  doi       = {10.18653/v1/2025.findings-emnlp.486},
  pages     = {9148--9160},
  isbn      = {979-8-89176-335-7},
  abstract  = {Graphical User Interface (GUI) interaction, which aims to develop an intelligent GUI agent that executes user instructions to perform tasks such as installing applications by controlling digital devices, has gained significant attention due to its practical value. Although current advanced multimodal large language models (LLMs) provide GUI agents with robust perception and reasoning capabilities, they often struggle with the precise localization of small elements. To tackle this problem, we propose InReAct, a multimodal GUI agent framework that unifies observing, thinking, and acting for precise and interpretable decision-making. It is trained via a two-stage process: curriculum learning to progressively build perception, grounding, and reasoning abilities, followed by reinforcement learning to refine pixel-level grounding with an outcome-based reward. We introduce a rule-based reward function that jointly optimizes action-type selection and pixel-level localization accuracy. Experimental results on multiple datasets demonstrate the superiority of InReAct in both grounding and navigation tasks.},
}
Markdown (Informal)
[INREACT: An Inspire-Then-Reinforce Training Framework For Multimodal GUI Agent](https://aclanthology.org/2025.findings-emnlp.486/) (Wang et al., Findings 2025)
ACL