% ProsodyFlow paper, COLING 2025 main proceedings (ACL Anthology ID 2025.coling-main.518).
% The url field is the permanent Anthology address, not a preview-branch link.
@inproceedings{wang-etal-2025-prosodyflow,
  title     = {{ProsodyFlow}: High-fidelity Text-to-Speech through Conditional Flow Matching and Prosody Modeling with Large Speech Language Models},
  author    = {Wang, Haoyu and Shan, Sizhe and Guo, Yinlin and Wang, Yuehai},
  editor    = {Rambow, Owen and Wanner, Leo and Apidianaki, Marianna and Al-Khalifa, Hend and Di Eugenio, Barbara and Schockaert, Steven},
  booktitle = {Proceedings of the 31st International Conference on Computational Linguistics},
  month     = jan,
  year      = {2025},
  address   = {Abu Dhabi, UAE},
  publisher = {Association for Computational Linguistics},
  url       = {https://aclanthology.org/2025.coling-main.518/},
  pages     = {7748--7753},
}