@inproceedings{nayel-etal-2021-machine,
title = "Machine Learning-Based Approach for {A}rabic Dialect Identification",
author = "Nayel, Hamada and
Hassan, Ahmed and
Sobhi, Mahmoud and
El-Sawy, Ahmed",
editor = "Habash, Nizar and
Bouamor, Houda and
Hajj, Hazem and
Magdy, Walid and
Zaghouani, Wajdi and
Bougares, Fethi and
Tomeh, Nadi and
Abu Farha, Ibrahim and
Touileb, Samia",
booktitle = "Proceedings of the Sixth Arabic Natural Language Processing Workshop",
month = apr,
year = "2021",
address = "Kyiv, Ukraine (Virtual)",
publisher = "Association for Computational Linguistics",
url = "https://preview.aclanthology.org/jlcl-multiple-ingestion/2021.wanlp-1.34/",
pages = "287--290",
abstract = {This paper describes our systems submitted to the Second Nuanced Arabic Dialect Identification Shared Task (NADI 2021). Dialect identification is the task of automatically detecting the source variety of a given text or speech segment. There are four subtasks, two subtasks for country-level identification and the other two subtasks for province-level identification. The data in this task covers a total of 100 provinces from all 21 Arab countries and come from the Twitter domain. The proposed systems depend on five machine-learning approaches namely Complement Na{\"i}ve Bayes, Support Vector Machine, Decision Tree, Logistic Regression and Random Forest Classifiers. F1 macro-averaged score of Na{\"i}ve Bayes classifier outperformed all other classifiers for development and test data.}
}
Markdown (Informal)
[Machine Learning-Based Approach for Arabic Dialect Identification](https://preview.aclanthology.org/jlcl-multiple-ingestion/2021.wanlp-1.34/) (Nayel et al., WANLP 2021)
ACL