% Conference paper from the ArabicNLP 2023 proceedings (ACL Anthology ID 2023.arabicnlp-1.24).
% The url field holds the canonical Anthology address; the doi is the stable identifier.
@inproceedings{al-kharusi-aalabdulsalam-2023-machine,
  title     = {Machine Translation of {Omani} {Arabic} Dialect from Social Media},
  author    = {Al-Kharusi, Khoula and
               AAlAbdulsalam, Abdurahman},
  editor    = {Sawaf, Hassan and
               El-Beltagy, Samhaa and
               Zaghouani, Wajdi and
               Magdy, Walid and
               Abdelali, Ahmed and
               Tomeh, Nadi and
               Abu Farha, Ibrahim and
               Habash, Nizar and
               Khalifa, Salam and
               Keleg, Amr and
               Haddad, Hatem and
               Zitouni, Imed and
               Mrini, Khalil and
               Almatham, Rawan},
  booktitle = {Proceedings of {ArabicNLP} 2023},
  month     = dec,
  year      = {2023},
  address   = {Singapore (Hybrid)},
  publisher = {Association for Computational Linguistics},
  url       = {https://aclanthology.org/2023.arabicnlp-1.24/},
  doi       = {10.18653/v1/2023.arabicnlp-1.24},
  pages     = {302--309},
  abstract  = {Research studies on Machine Translation (MT) between Modern Standard Arabic (MSA) and English are abundant. However, studies on MT between Omani Arabic (OA) dialects and English are very scarce. This research study focuses on the lack of availability of an Omani dialect parallel dataset, as well as MT of OA to English. The study uses social media data from X (formerly Twitter) to build an authentic parallel text of the Omani dialects. The research presents baseline results on this dataset using Google Translate, Microsoft Translation, and Marian NMT. A taxonomy of the most common linguistic errors is used to analyze the translations made by the NMT systems to provide insights on future improvements. Finally, transfer learning is used to adapt Marian NMT to the Omani dialect, which significantly improved by 9.88 points in the BLEU score.},
}
Markdown (Informal)
[Machine Translation of Omani Arabic Dialect from Social Media](https://aclanthology.org/2023.arabicnlp-1.24/) (Al-Kharusi & AAlAbdulsalam, ArabicNLP 2023)
ACL