@inproceedings{pugh-etal-2024-wav2pos,
title = "Wav2pos: Exploring syntactic analysis from audio for {H}ighland {P}uebla {N}ahuatl",
author = "Pugh, Robert and
Sreedhar, Varun and
Tyers, Francis",
editor = "Mager, Manuel and
Ebrahimi, Abteen and
Rijhwani, Shruti and
Oncevay, Arturo and
Chiruzzo, Luis and
Pugh, Robert and
von der Wense, Katharina",
booktitle = "Proceedings of the 4th Workshop on Natural Language Processing for Indigenous Languages of the Americas (AmericasNLP 2024)",
month = jun,
year = "2024",
address = "Mexico City, Mexico",
publisher = "Association for Computational Linguistics",
url = "https://preview.aclanthology.org/fix-sig-urls/2024.americasnlp-1.13/",
doi = "10.18653/v1/2024.americasnlp-1.13",
pages = "121--126",
abstract = "We describe an approach to part-of-speech tagging from audio with very little human-annotated data, for Highland Puebla Nahuatl, a low-resource language of Mexico. While automatic morphosyntactic analysis is typically trained on annotated textual data, large amounts of text is rarely available for low-resource, marginalized, and/or minority languages, and morphosyntactically-annotated data is even harder to come by. Much of the data from these languages may exist in the form of recordings, often only partially-transcribed or analyzed by field linguists working on language documentation projects. Given this relatively low-availability of text in the low-resource language scenario, we explore end-to-end automated morphosyntactic analysis directly from audio. The experiments described in this paper focus on one piece of morphosyntax, part-of-speech tagging, and builds on existing work in a high-resource setting. We use weak supervision to increase training volume, and explore a few techniques for generating word-level predictions from the acoustic features. Our experiments show promising results, despite less than 400 sentences of audio-aligned, manually-labeled text."
}
Markdown (Informal)
[Wav2pos: Exploring syntactic analysis from audio for Highland Puebla Nahuatl](https://preview.aclanthology.org/fix-sig-urls/2024.americasnlp-1.13/) (Pugh et al., AmericasNLP 2024)
ACL