% Amphista (Li et al., 2025): long paper in the NAACL 2025 main proceedings.
% The url field uses the canonical ACL Anthology address; preview.aclanthology.org
% links are staging builds and are not stable.
@inproceedings{li-etal-2025-amphista,
  author    = {Li, Zeping and Yang, Xinlong and Gao, Ziheng and Liu, Ji and Li, Guanchen and Liu, Zhuang and Li, Dong and Peng, Jinzhang and Tian, Lu and Barsoum, Emad},
  title     = {Amphista: Bi-directional Multi-head Decoding for Accelerating {LLM} Inference},
  editor    = {Chiruzzo, Luis and Ritter, Alan and Wang, Lu},
  booktitle = {Proceedings of the 2025 Conference of the Nations of the Americas Chapter of the Association for Computational Linguistics: Human Language Technologies (Volume 1: Long Papers)},
  month     = apr,
  year      = {2025},
  address   = {Albuquerque, New Mexico},
  publisher = {Association for Computational Linguistics},
  pages     = {8925--8938},
  isbn      = {979-8-89176-189-6},
  url       = {https://aclanthology.org/2025.naacl-long.450/},
}