@inproceedings{le-ferrand-etal-2024-enenlhet,
title = "Enenlhet as a case-study to investigate {ASR} model generalizability for language documentation",
author = "Le Ferrand, {\'E}ric and
Heaton, Raina and
Prud{'}hommeaux, Emily",
editor = "Mager, Manuel and
Ebrahimi, Abteen and
Rijhwani, Shruti and
Oncevay, Arturo and
Chiruzzo, Luis and
Pugh, Robert and
von der Wense, Katharina",
booktitle = "Proceedings of the 4th Workshop on Natural Language Processing for Indigenous Languages of the Americas (AmericasNLP 2024)",
month = jun,
year = "2024",
address = "Mexico City, Mexico",
publisher = "Association for Computational Linguistics",
url = "https://preview.aclanthology.org/add-emnlp-2024-awards/2024.americasnlp-1.15/",
doi = "10.18653/v1/2024.americasnlp-1.15",
pages = "132--137",
abstract = "Although both linguists and language community members recognize the potential utility of automatic speech recognition (ASR) for documentation, one of the obstacles to using these technologies is the scarcity of data necessary to train effective systems. Recent advances in ASR, particularly the ability to fine-tune large multilingual acoustic models to small amounts of data from a new language, have demonstrated the potential of ASR for transcription. However, many proof-of-concept demonstrations of ASR in low-resource settings rely on a single data collection project, which may yield models that are biased toward that particular data scenario, whether in content, recording quality, transcription conventions, or speaker population. In this paper, we investigate the performance of two state-of-the art ASR architectures for fine-tuning acoustic models to small speech datasets with the goal of transcribing recordings of Enenlhet, an endangered Indigenous language spoken in South America. Our results suggest that while ASR offers utility for generating first-pass transcriptions of speech collected in the course of linguistic fieldwork, individual vocabulary diversity and data quality have an outsized impact on ASR accuracy."
}
Markdown (Informal)
[Enenlhet as a case-study to investigate ASR model generalizability for language documentation](https://preview.aclanthology.org/add-emnlp-2024-awards/2024.americasnlp-1.15/) (Le Ferrand et al., AmericasNLP 2024)
ACL