% WANLP 2020 workshop paper (ACL Anthology ID 2020.wanlp-1.25).
% The url field uses the canonical Anthology address rather than a temporary
% preview build; the abstract is reproduced verbatim from the Anthology record.
@inproceedings{appiah-balaji-b-2020-semi,
  title     = {Semi-supervised Fine-grained Approach for {Arabic} dialect detection task},
  author    = {Appiah Balaji, Nitin Nikamanth and
               B, Bharathi},
  editor    = {Zitouni, Imed and
               Abdul-Mageed, Muhammad and
               Bouamor, Houda and
               Bougares, Fethi and
               El-Haj, Mahmoud and
               Tomeh, Nadi and
               Zaghouani, Wajdi},
  booktitle = {Proceedings of the Fifth Arabic Natural Language Processing Workshop},
  month     = dec,
  year      = {2020},
  address   = {Barcelona, Spain (Online)},
  publisher = {Association for Computational Linguistics},
  url       = {https://aclanthology.org/2020.wanlp-1.25/},
  pages     = {257--261},
  abstract  = {Arabic being a language with numerous different dialects, it becomes extremely important to device a technique to distinguish each dialect efficiently. This paper focuses on the fine-grained country level and province level classification of Arabic dialects. The experiments in this paper are submissions done to the NADI 2020 shared Dialect detection task. Various text feature extraction techniques such as TF-IDF, AraVec, multilingual BERT and Fasttext embedding models are studied. We thereby, propose an approach of text embedding based model with macro average F1 score of 0.2232 for task1 and 0.0483 for task2, with the help of semi supervised learning approach.},
}
Markdown (Informal)
[Semi-supervised Fine-grained Approach for Arabic dialect detection task](https://preview.aclanthology.org/jlcl-multiple-ingestion/2020.wanlp-1.25/) (Appiah Balaji & B, WANLP 2020)
ACL