% Findings of ACL 2025 paper. The url field uses the canonical ACL Anthology
% address (not a preview/staging build) so the link stays stable.
@inproceedings{holsman-etal-2025-fuzzy,
  author    = {Holsman, Maximilian and Huang, Yukun and Dhingra, Bhuwan},
  title     = {Fuzzy Speculative Decoding for a Tunable Accuracy-Runtime Tradeoff},
  editor    = {Che, Wanxiang and Nabende, Joyce and Shutova, Ekaterina and Pilehvar, Mohammad Taher},
  booktitle = {Findings of the Association for Computational Linguistics: {ACL} 2025},
  month     = jul,
  year      = {2025},
  address   = {Vienna, Austria},
  publisher = {Association for Computational Linguistics},
  pages     = {26257--26273},
  doi       = {10.18653/v1/2025.findings-acl.1346},
  url       = {https://aclanthology.org/2025.findings-acl.1346/},
  isbn      = {979-8-89176-256-5},
}