@inproceedings{xiang-etal-2026-llm,
title = "{LLM}-as-Scheduler: Agentic Workflow Dynamic Scheduling",
author = "Xiang, Dawei and
Chu, Kexin and
Xu, Wenyan and
Zhang, Wenhui and
Zhang, Wei",
editor = "Liakata, Maria and
Moreira, Viviane P. and
Zhang, Jiajun and
Jurgens, David",
booktitle = "Proceedings of the 64th Annual Meeting of the {A}ssociation for {C}omputational {L}inguistics (Volume 1: Long Papers)",
month = jul,
year = "2026",
address = "San Diego, California, United States",
publisher = "Association for Computational Linguistics",
url = "https://preview.aclanthology.org/ingest-acl/2026.acl-long.581/",
pages = "12752--12763",
ISBN = "979-8-89176-390-6",
abstract = "As large language models (LLMs) improve, many applications are moving from a single LLM call to multi-agent systems. These systems often rely on either hand-designed or automatically optimized workflows with multiple verification and testing steps. While those extra steps can improve accuracy, they also increase latency and token costs. In practice, many queries do not need such heavy processing and can be handled well by a single strong agent.To address this inefficiency, we propose LLM-as-Scheduler (LAS), a system that dynamically chooses the right workflow for each query. LAS uses a two-stage cascade: first, a lightweight gate quickly evaluates each agent{'}s output; then, an LLM-based scheduler uses query features and gate signals to make more detailed routing decisions. Experiments show that LAS cuts token usage by 43{\%} and reduces end-to-end latency by more than 36{\%}, while causing at most a 1.4 percentage-point drop in accuracy compared with a strong fixed workflow."
}Markdown (Informal)
[LLM-as-Scheduler: Agentic Workflow Dynamic Scheduling](https://preview.aclanthology.org/ingest-acl/2026.acl-long.581/) (Xiang et al., ACL 2026)
ACL
- Dawei Xiang, Kexin Chu, Wenyan Xu, Wenhui Zhang, and Wei Zhang. 2026. LLM-as-Scheduler: Agentic Workflow Dynamic Scheduling. In Proceedings of the 64th Annual Meeting of the Association for Computational Linguistics (Volume 1: Long Papers), pages 12752–12763, San Diego, California, United States. Association for Computational Linguistics.