@inproceedings{masson-carson-berndsen-2023-investigating,
title = "Investigating Phoneme Similarity with Artificially Accented Speech",
author = "Masson, Margot and
Carson-berndsen, Julie",
editor = {Nicolai, Garrett and
Chodroff, Eleanor and
Mailhot, Frederic and
{\c{C}}{\"o}ltekin, {\c{C}}a{\u{g}}r{\i}},
booktitle = "Proceedings of the 20th SIGMORPHON workshop on Computational Research in Phonetics, Phonology, and Morphology",
month = jul,
year = "2023",
address = "Toronto, Canada",
publisher = "Association for Computational Linguistics",
url = "https://preview.aclanthology.org/add-emnlp-2024-awards/2023.sigmorphon-1.6/",
doi = "10.18653/v1/2023.sigmorphon-1.6",
pages = "49--57",
abstract = "While the deep learning revolution has led to significant performance improvements in speech recognition, accented speech remains a challenge. Current approaches to this challenge typically do not seek to understand and provide explanations for the variations of accented speech, whether they stem from native regional variation or non-native error patterns. This paper seeks to address non-native speaker variations from both a knowledge-based and a data-driven perspective. We propose to approximate non-native accented-speech pronunciation patterns by the means of two approaches: based on phonetic and phonological knowledge on the one hand and inferred from a text-to-speech system on the other. Artificial speech is then generated with a range of variants which have been captured in confusion matrices representing phoneme similarities. We then show that non-native accent confusions actually propagate to the transcription from the ASR, thus suggesting that the inference of accent specific phoneme confusions is achievable from artificial speech."
}
Markdown (Informal)
[Investigating Phoneme Similarity with Artificially Accented Speech](https://preview.aclanthology.org/add-emnlp-2024-awards/2023.sigmorphon-1.6/) (Masson & Carson-berndsen, SIGMORPHON 2023)
ACL