% ACL 2025 System Demonstrations paper (Anthology ID 2025.acl-demo.16).
% The url field uses the permanent aclanthology.org landing page; the
% ingestion preview host is a temporary staging branch and is not stable.
@inproceedings{she-etal-2025-token,
  author    = {She, Jianshu and Zheng, Wenhao and Liu, Zhengzhong and Wang, Hongyi and Xing, Eric P. and Yao, Huaxiu and Ho, Qirong},
  title     = {Token Level Routing Inference System for Edge Devices},
  editor    = {Mishra, Pushkar and Muresan, Smaranda and Yu, Tao},
  booktitle = {Proceedings of the 63rd Annual Meeting of the Association for Computational Linguistics (Volume 3: System Demonstrations)},
  month     = jul,
  year      = {2025},
  address   = {Vienna, Austria},
  publisher = {Association for Computational Linguistics},
  pages     = {159--166},
  isbn      = {979-8-89176-253-4},
  url       = {https://aclanthology.org/2025.acl-demo.16/},
}