% VERSA evaluation toolkit paper, NAACL 2025 System Demonstrations.
% The url field uses the canonical ACL Anthology address, not a temporary preview build.
@inproceedings{shi-etal-2025-versa,
  author    = {Shi, Jiatong and Shim, Hye-jin and Tian, Jinchuan and Arora, Siddhant and Wu, Haibin and Petermann, Darius and Yip, Jia Qi and Zhang, You and Tang, Yuxun and Zhang, Wangyou and Alharthi, Dareen Safar and Huang, Yichen and Saito, Koichi and Han, Jionghao and Zhao, Yiwen and Donahue, Chris and Watanabe, Shinji},
  title     = {{VERSA}: A Versatile Evaluation Toolkit for Speech, Audio, and Music},
  editor    = {Dziri, Nouha and Ren, Sean (Xiang) and Diao, Shizhe},
  booktitle = {Proceedings of the 2025 Conference of the Nations of the Americas Chapter of the Association for Computational Linguistics: Human Language Technologies (System Demonstrations)},
  month     = apr,
  year      = {2025},
  address   = {Albuquerque, New Mexico},
  publisher = {Association for Computational Linguistics},
  pages     = {191--209},
  isbn      = {979-8-89176-191-9},
  url       = {https://aclanthology.org/2025.naacl-demo.19/},
}