% ESPnet-SpeechLM toolkit paper, NAACL 2025 System Demonstrations, pages 116--124.
% The url field uses the canonical ACL Anthology address for ID 2025.naacl-demo.12;
% preview-branch mirrors of the Anthology are temporary and should not be cited.
% The toolkit name is brace-protected as a whole word so styles keep its casing.
@inproceedings{tian-etal-2025-espnet,
  title     = {{ESPnet-SpeechLM}: An Open Speech Language Model Toolkit},
  author    = {Tian, Jinchuan and
               Shi, Jiatong and
               Chen, William and
               Arora, Siddhant and
               Masuyama, Yoshiki and
               Maekaku, Takashi and
               Wu, Yihan and
               Peng, Junyi and
               Bharadwaj, Shikhar and
               Zhao, Yiwen and
               Cornell, Samuele and
               Peng, Yifan and
               Yue, Xiang and
               Yang, Chao-Han Huck and
               Neubig, Graham and
               Watanabe, Shinji},
  editor    = {Dziri, Nouha and
               Ren, Sean (Xiang) and
               Diao, Shizhe},
  booktitle = {Proceedings of the 2025 Conference of the Nations of the Americas Chapter of the Association for Computational Linguistics: Human Language Technologies (System Demonstrations)},
  month     = apr,
  year      = {2025},
  address   = {Albuquerque, New Mexico},
  publisher = {Association for Computational Linguistics},
  url       = {https://aclanthology.org/2025.naacl-demo.12/},
  pages     = {116--124},
  isbn      = {979-8-89176-191-9},
}