% CLaSp paper, ACL 2025 main conference proceedings (Volume 1: Long Papers).
% The url field is the canonical ACL Anthology landing page, not a preview host.
@inproceedings{chen-etal-2025-clasp,
  author    = {Chen, Longze and
               Shan, Renke and
               Wang, Huiming and
               Wang, Lu and
               Liu, Ziqiang and
               Luo, Run and
               Wang, Jiawei and
               Alinejad-Rokny, Hamid and
               Yang, Min},
  title     = {{CLaSp}: In-Context Layer Skip for Self-Speculative Decoding},
  editor    = {Che, Wanxiang and
               Nabende, Joyce and
               Shutova, Ekaterina and
               Pilehvar, Mohammad Taher},
  booktitle = {Proceedings of the 63rd Annual Meeting of the Association for Computational Linguistics (Volume 1: Long Papers)},
  month     = jul,
  year      = {2025},
  address   = {Vienna, Austria},
  publisher = {Association for Computational Linguistics},
  pages     = {31608--31618},
  isbn      = {979-8-89176-251-0},
  url       = {https://aclanthology.org/2025.acl-long.1525/},
}