% FR-Spec (ACL 2025, Volume 1: Long Papers), Anthology ID 2025.acl-long.198.
% The url field uses the canonical aclanthology.org address, not the
% preview/staging host. The method name is braced as a whole word so that
% sentence-casing styles do not lowercase "Spec".
@inproceedings{zhao-etal-2025-fr,
  author    = {Zhao, Weilin and Pan, Tengyu and Han, Xu and Zhang, Yudi and
               Ao, Sun and Huang, Yuxiang and Zhang, Kaihuo and Zhao, Weilun and
               Li, Yuxuan and Zhou, Jie and Zhou, Hao and Wang, Jianyong and
               Sun, Maosong and Liu, Zhiyuan},
  title     = {{FR-Spec}: Accelerating Large-Vocabulary Language Models via Frequency-Ranked Speculative Sampling},
  editor    = {Che, Wanxiang and Nabende, Joyce and Shutova, Ekaterina and
               Pilehvar, Mohammad Taher},
  booktitle = {Proceedings of the 63rd Annual Meeting of the Association for Computational Linguistics (Volume 1: Long Papers)},
  month     = jul,
  year      = {2025},
  address   = {Vienna, Austria},
  publisher = {Association for Computational Linguistics},
  pages     = {3909--3921},
  isbn      = {979-8-89176-251-0},
  url       = {https://aclanthology.org/2025.acl-long.198/},
}