% Conference paper in the LREC-COLING 2024 proceedings (ACL Anthology id 2024.lrec-main.1230).
% The url field holds the canonical aclanthology.org address rather than a temporary preview build.
@inproceedings{tannander-etal-2024-revisiting,
  title     = {Revisiting Three Text-to-Speech Synthesis Experiments with a Web-Based Audience Response System},
  author    = {T{\r{a}}nnander, Christina and
               Edlund, Jens and
               Gustafson, Joakim},
  editor    = {Calzolari, Nicoletta and
               Kan, Min-Yen and
               Hoste, Veronique and
               Lenci, Alessandro and
               Sakti, Sakriani and
               Xue, Nianwen},
  booktitle = {Proceedings of the 2024 Joint International Conference on Computational Linguistics, Language Resources and Evaluation ({LREC-COLING} 2024)},
  month     = may,
  year      = {2024},
  address   = {Torino, Italia},
  publisher = {ELRA and ICCL},
  url       = {https://aclanthology.org/2024.lrec-main.1230/},
  pages     = {14111--14121},
  abstract  = {In order to investigate the strengths and weaknesses of Audience Response System (ARS) in text-to-speech synthesis (TTS) evaluations, we revisit three previously published TTS studies and perform an ARS-based evaluation on the stimuli used in each study. The experiments are performed with a participant pool of 39 respondents, using a web-based tool that emulates an ARS experiment. The results of the first experiment confirms that ARS is highly useful for evaluating long and continuous stimuli, particularly if we wish for a diagnostic result rather than a single overall metric, while the second and third experiments highlight weaknesses in ARS with unsuitable materials as well as the importance of framing and instruction when conducting ARS-based evaluation.},
}
Markdown (Informal)
[Revisiting Three Text-to-Speech Synthesis Experiments with a Web-Based Audience Response System](https://aclanthology.org/2024.lrec-main.1230/) (Tånnander et al., LREC-COLING 2024)
ACL