@inproceedings{alshenaifi-azmi-2022-arabic,
title = "{A}rabic dialect identification using machine learning and transformer-based models: Submission to the {NADI} 2022 Shared Task",
author = "AlShenaifi, Nouf and
Azmi, Aqil",
editor = "Bouamor, Houda and
Al-Khalifa, Hend and
Darwish, Kareem and
Rambow, Owen and
Bougares, Fethi and
Abdelali, Ahmed and
Tomeh, Nadi and
Khalifa, Salam and
Zaghouani, Wajdi",
booktitle = "Proceedings of the Seventh Arabic Natural Language Processing Workshop (WANLP)",
month = dec,
year = "2022",
address = "Abu Dhabi, United Arab Emirates (Hybrid)",
publisher = "Association for Computational Linguistics",
url = "https://preview.aclanthology.org/add-emnlp-2024-awards/2022.wanlp-1.50/",
doi = "10.18653/v1/2022.wanlp-1.50",
pages = "464--467",
abstract = "Arabic has a wide range of dialects. Dialect is the language variation of a specific community. In this paper, we show the models we created to participate in the third Nuanced Arabic Dialect Identification (NADI) shared task (Subtask 1) that involves developing a system to classify a tweet into a country-level dialect. We utilized a number of machine learning techniques as well as deep learning transformer-based models. For the machine learning approach, we build an ensemble classifier of various machine learning models. In our deep learning approach, we consider bidirectional LSTM model and AraBERT pretrained model. The results demonstrate that the deep learning approach performs noticeably better than the other machine learning approaches with 68.7{\%} accuracy on the development set."
}
Markdown (Informal)
[Arabic dialect identification using machine learning and transformer-based models: Submission to the NADI 2022 Shared Task](https://preview.aclanthology.org/add-emnlp-2024-awards/2022.wanlp-1.50/) (AlShenaifi & Azmi, WANLP 2022)
ACL