@inproceedings{le-ferrand-etal-2024-modern,
title = "Are modern neural {ASR} architectures robust for polysynthetic languages?",
author = "Le Ferrand, Eric and
Liu, Zoey and
Arppe, Antti and
Prud{'}hommeaux, Emily",
editor = "Al-Onaizan, Yaser and
Bansal, Mohit and
Chen, Yun-Nung",
booktitle = "Findings of the Association for Computational Linguistics: EMNLP 2024",
month = nov,
year = "2024",
address = "Miami, Florida, USA",
publisher = "Association for Computational Linguistics",
url = "https://preview.aclanthology.org/add-emnlp-2024-awards/2024.findings-emnlp.166/",
doi = "10.18653/v1/2024.findings-emnlp.166",
pages = "2953--2963",
abstract = "Automatic speech recognition (ASR) technology is frequently proposed as a means of preservation and documentation of endangered languages, with promising results thus far. Among the endangered languages spoken today, a significant number exhibit complex morphology. The models employed in contemporary language documentation pipelines that utilize ASR, however, are predominantly based on isolating or inflectional languages, often from the Indo-European family. This raises a critical concern: building models exclusively on such languages may introduce a bias, resulting in better performance with simpler morphological structures. In this paper, we investigate the performance of modern ASR architectures on morphologically complex languages. Results indicate that modern ASR architectures appear less robust in managing high OOV rates for morphologically complex languages in terms of word error rate, while character error rates are consistently higher for isolating languages."
}
Markdown (Informal)
[Are modern neural ASR architectures robust for polysynthetic languages?](https://preview.aclanthology.org/add-emnlp-2024-awards/2024.findings-emnlp.166/) (Le Ferrand et al., Findings 2024)
ACL