@inproceedings{wei-etal-2026-anchor,
title = "Anchor: Branch-Point Data Generation for {GUI} Agents",
author = "Wei, Jinbiao and
Zhao, Yilun and
Ni, Kangqi and
Cohan, Arman",
editor = "Liakata, Maria and
Moreira, Viviane P. and
Zhang, Jiajun and
Jurgens, David",
booktitle = "Proceedings of the 64th Annual Meeting of the {A}ssociation for {C}omputational {L}inguistics (Volume 1: Long Papers)",
month = jul,
year = "2026",
address = "San Diego, California, United States",
publisher = "Association for Computational Linguistics",
url = "https://preview.aclanthology.org/ingest-acl/2026.acl-long.774/",
pages = "17031--17047",
ISBN = "979-8-89176-390-6",
abstract = "End-to-end GUI agents for real desktop environments require large amounts of high-quality interaction data, yet collecting human demonstrations is expensive and existing synthetic pipelines often suffer from limited task diversity or noisy, goal-drifting trajectories. We present a trajectory expansion framework Anchor that bootstraps scalable desktop supervision from a small set of verified seed demonstrations. Starting from each seed, we identify branch points that correspond to meaningful state changes and propose new, state-grounded task variants conditioned on the current GUI context. An executing agent then follows the proposed instructions to generate new trajectories, while a verifier enforces task completion via state-aware checks and trajectory-level consistency. To improve supervision quality, we further apply task-conditioned step-level filtering to remove ungrounded actions and denoise post-branch segments to maintain coherent intent. Experiments on standard desktop benchmarks, OSWorld and WindowsAgentArena, show that models fine-tuned on our expanded corpus achieve consistent improvements over zero-shot agents and representative synthesis baselines, and generalize across applications and operating systems."
}Markdown (Informal)
[Anchor: Branch-Point Data Generation for GUI Agents](https://preview.aclanthology.org/ingest-acl/2026.acl-long.774/) (Wei et al., ACL 2026)
ACL
- Jinbiao Wei, Yilun Zhao, Kangqi Ni, and Arman Cohan. 2026. Anchor: Branch-Point Data Generation for GUI Agents. In Proceedings of the 64th Annual Meeting of the Association for Computational Linguistics (Volume 1: Long Papers), pages 17031–17047, San Diego, California, United States. Association for Computational Linguistics.