% TAGQuant (Lee et al.) -- paper in the EACL 2026 proceedings, Volume 5: Industry Track.
% NOTE(review): url uses the canonical ACL Anthology address for this paper ID instead of a
% temporary preview.aclanthology.org ingest branch; confirm it resolves once the volume is live.
@inproceedings{lee-etal-2026-tagquant,
  author    = {Lee, Jaeseong and Hwang, Seung-won and Qiao, Aurick and Yao, Zhewei and He, Yuxiong},
  title     = {{TAGQuant}: Token-Aware Clustering for Group-Wise Quantization},
  editor    = {Matusevych, Yevgen and Eryi{\u{g}}it, G{\"u}l{\c{s}}en and Aletras, Nikolaos},
  booktitle = {Proceedings of the 19th Conference of the {European} Chapter of the {Association} for {Computational} {Linguistics} (Volume 5: Industry Track)},
  month     = mar,
  year      = {2026},
  address   = {Rabat, Morocco},
  publisher = {Association for Computational Linguistics},
  pages     = {253--262},
  isbn      = {979-8-89176-384-5},
  url       = {https://aclanthology.org/2026.eacl-industry.18/},
}