% Slender-Mamba paper in the COLING 2025 proceedings (ACL Anthology ID 2025.coling-main.316).
@inproceedings{yu-etal-2025-slender,
  author    = {Yu, Zhenxuan and Kojima, Takeshi and Matsuo, Yutaka and Iwasawa, Yusuke},
  title     = {{Slender-Mamba}: Fully Quantized {Mamba} in 1.58 Bits From Head to Toe},
  editor    = {Rambow, Owen and Wanner, Leo and Apidianaki, Marianna and Al-Khalifa, Hend and Di Eugenio, Barbara and Schockaert, Steven},
  booktitle = {Proceedings of the 31st International Conference on Computational Linguistics},
  month     = jan,
  year      = {2025},
  address   = {Abu Dhabi, UAE},
  publisher = {Association for Computational Linguistics},
  url       = {https://aclanthology.org/2025.coling-main.316/},
  pages     = {4715--4724},
}