@inproceedings{swain-etal-2024-mitigating,
title = "On Mitigating Performance Disparities in Multilingual Speech Recognition",
author = "Swain, Monorama and
Zee, Anna Katrine Van and
S{\o}gaard, Anders",
editor = "Al-Onaizan, Yaser and
Bansal, Mohit and
Chen, Yun-Nung",
booktitle = "Proceedings of the 2024 Conference on Empirical Methods in Natural Language Processing",
month = nov,
year = "2024",
address = "Miami, Florida, USA",
publisher = "Association for Computational Linguistics",
url = "https://preview.aclanthology.org/jlcl-multiple-ingestion/2024.emnlp-main.323/",
doi = "10.18653/v1/2024.emnlp-main.323",
pages = "5647--5655",
abstract = "How far have we come in mitigating performance disparities across genders in multilingual speech recognition? We compare the impact on gender disparity of different fine-tuning algorithms for automated speech recognition across model sizes, languages and gender. We look at both performance-focused and fairness-promoting algorithms. Across languages, we see slightly better performance for female speakers for larger models regardless of the fine-tuning algorithm. The best trade-off between performance and parity is found using adapter fusion. Fairness-promoting fine-tuning algorithms (Group-DRO and Spectral Decoupling) hurt performance compared to adapter fusion with only slightly better performance parity. LoRA increases disparities slightly. Fairness-mitigating fine-tuning techniques led to slightly higher variance in performance across languages, with the exception of adapter fusion."
}
Markdown (Informal)
[On Mitigating Performance Disparities in Multilingual Speech Recognition](https://preview.aclanthology.org/jlcl-multiple-ingestion/2024.emnlp-main.323/) (Swain et al., EMNLP 2024)
ACL