@inproceedings{kumar-etal-2024-beyond,
title = "Beyond Common Words: Enhancing {ASR} Cross-Lingual Proper Noun Recognition Using Large Language Models",
author = "Kumar, Rishabh and
Ghosh, Sabyasachi and
Ramakrishnan, Ganesh",
editor = "Al-Onaizan, Yaser and
Bansal, Mohit and
Chen, Yun-Nung",
booktitle = "Findings of the Association for Computational Linguistics: EMNLP 2024",
month = nov,
year = "2024",
address = "Miami, Florida, USA",
publisher = "Association for Computational Linguistics",
url = "https://preview.aclanthology.org/add-emnlp-2024-awards/2024.findings-emnlp.399/",
doi = "10.18653/v1/2024.findings-emnlp.399",
pages = "6821--6828",
abstract = "In this work, we address the challenge of cross-lingual proper noun recognition in automatic speech recognition (ASR), where proper nouns in an utterance may originate from a language different from the language in which the ASR system is trained. We enhance the performance of end-to-end ASR systems by instructing a large language model (LLM) to correct the ASR model`s predictions. The LLM`s context is augmented with a dictionary of cross-lingual words that are phonetically and graphemically similar to the potentially incorrect proper nouns in the ASR predictions. Our dictionary-based method DiP-ASR (Dictionary-based Prompting for Automatic Speech Recognition) significantly reduces word error rates compared to both the end-to-end ASR baseline and instruction-based prompting of the LLM without the dictionary across cross-lingual proper noun recognition tasks involving three secondary languages."
}
Markdown (Informal)
[Beyond Common Words: Enhancing ASR Cross-Lingual Proper Noun Recognition Using Large Language Models](https://preview.aclanthology.org/add-emnlp-2024-awards/2024.findings-emnlp.399/) (Kumar et al., Findings 2024)
ACL