% Conference paper, ACL Anthology ID 2026.acl-industry.57.
% - Case-sensitive title words (Ascend, NPUs, HiFloat) are braced as whole
%   words so sentence-casing styles keep their capitalisation.
% - url uses the canonical Anthology host instead of the preview/ingest
%   staging host. NOTE(review): confirm the page is live at this address.
% - NOTE(review): address appears to hold the conference venue rather than a
%   publisher city; kept unchanged -- confirm against the target style.
@inproceedings{zhao-etal-2026-unleashing-low,
  author    = {Zhao, Pengxiang and
               Zhen, Hui-Ling and
               Li, Xing and
               Bao, Han and
               Lin, Weizhe and
               Yang, Zhiyuan and
               Wei, Yu Zi and
               Wang, Xin and
               Yuan, Mingxuan and
               Yu, Xianzhi and
               Dong, Zhenhua},
  title     = {Unleashing Low-Bit Inference on {Ascend} {NPUs}: A Comprehensive Evaluation of {HiFloat} Formats},
  editor    = {Li, Yunyao and
               Rehm, Georg and
               Tu, Mei},
  booktitle = {Proceedings of the 64th Annual Meeting of the {Association} for {Computational} {Linguistics} ({ACL} 2026)},
  month     = jul,
  year      = {2026},
  address   = {San Diego, California, USA},
  publisher = {Association for Computational Linguistics},
  pages     = {844--864},
  isbn      = {979-8-89176-394-4},
  url       = {https://aclanthology.org/2026.acl-industry.57/},
}