% Conference paper entry for ArcLight (ACL 2026, System Demonstrations volume).
% Case-sensitive words in title/booktitle are brace-protected as whole words so
% sentence-casing styles keep their capitals without breaking kerning.
% NOTE(review): the url below uses the Anthology preview/ingest host, which looks
% like a staging link -- confirm the canonical address before relying on it.
@inproceedings{xu-etal-2026-arclight,
  title     = {{ArcLight}: A Lightweight {LLM} Inference Architecture for Many-Core {CPUs}},
  author    = {Xu, Yuzhuang and Han, Xu and Li, Yuxuan and Che, Wanxiang},
  editor    = {Durrett, Greg and Jian, Ping},
  booktitle = {Proceedings of the 64th Annual Meeting of the {Association} for {Computational} {Linguistics} (Volume 3: System Demonstrations)},
  month     = jul,
  year      = {2026},
  address   = {San Diego, California, United States},
  publisher = {Association for Computational Linguistics},
  url       = {https://preview.aclanthology.org/ingest-acl/2026.acl-demo.18/},
  pages     = {178--186},
  isbn      = {979-8-89176-392-0},
}