@inproceedings{wang-etal-2026-ro,
title = "Ro-{SLM}: Onboard Small Language Models for Robot Task Planning and Operation Code Generation",
author = "Wang, Wenhao and
Li, Yanyan and
Jiao, Long and
Yuan, Jiawei",
editor = "Liakata, Maria and
Moreira, Viviane P. and
Zhang, Jiajun and
Jurgens, David",
booktitle = "Findings of the {A}ssociation for {C}omputational {L}inguistics: {ACL} 2026",
month = jul,
year = "2026",
address = "San Diego, California, United States",
publisher = "Association for Computational Linguistics",
url = "https://preview.aclanthology.org/ingest-acl/2026.findings-acl.1720/",
pages = "34436--34460",
ISBN = "979-8-89176-395-1",
abstract = "Recent advances in large language models (LLMs) provide robots with contextual reasoning abilities to comprehend human instructions. Yet, current LLM-enabled robots typically depend on cloud-based models or high-performance computing infrastructure, which limit their deployment on robots under unreliable internet environments or with constrained computational resources, such as UAVs and small ground vehicles. Thus, deploying fine-tuned small language models (SLMs) that support onboard deployment offers a promising alternative. This paper introduces Ro-SLM, a framework that enables reliable SLM-driven robot operation by distilling LLMs' knowledge and reasoning. Ro-SLM starts from dataset synthesis by leveraging LLMs to generate diverse task instructions, produce corresponding ground truth code with minimal human assistance, and augment instructions into real-world application scenarios. Ro-SLM is then fine-tuned with the dataset, in which LLM serves as a reward function to guide the training. Extensive experiments on UAV operation tasks demonstrate that Ro-SLM improves the performance of SLM from being incapable of supporting robotic task planning and code generation to achieving performance that approaches LLM."
}Markdown (Informal)
[Ro-SLM: Onboard Small Language Models for Robot Task Planning and Operation Code Generation](https://preview.aclanthology.org/ingest-acl/2026.findings-acl.1720/) (Wang et al., Findings 2026)
ACL