@inproceedings{mulki-etal-2019-syntax,
title = "Syntax-Ignorant N-gram Embeddings for Sentiment Analysis of {A}rabic Dialects",
author = "Mulki, Hala and
Haddad, Hatem and
Gridach, Mourad and
Babao{\u{g}}lu, Ismail",
editor = "El-Hajj, Wassim and
Belguith, Lamia Hadrich and
Bougares, Fethi and
Magdy, Walid and
Zitouni, Imed and
Tomeh, Nadi and
El-Haj, Mahmoud and
Zaghouani, Wajdi",
booktitle = "Proceedings of the Fourth Arabic Natural Language Processing Workshop",
month = aug,
year = "2019",
address = "Florence, Italy",
publisher = "Association for Computational Linguistics",
url = "https://preview.aclanthology.org/jlcl-multiple-ingestion/W19-4604/",
doi = "10.18653/v1/W19-4604",
pages = "30--39",
abstract = "Arabic sentiment analysis models have employed compositional embedding features to represent the Arabic dialectal content. These embeddings are usually composed via ordered, syntax-aware composition functions and learned within deep neural frameworks. With the free word order and the varying syntax nature across the different Arabic dialects, a sentiment analysis system developed for one dialect might not be efficient for the others. Here we present syntax-ignorant n-gram embeddings to be used in sentiment analysis of several Arabic dialects. The proposed embeddings were composed and learned using an unordered composition function and a shallow neural model. Five datasets of different dialects were used to evaluate the produced embeddings in the sentiment analysis task. The obtained results revealed that, our syntax-ignorant embeddings could outperform word2vec model and doc2vec both variant models in addition to hand-crafted system baselines, while a competent performance was noticed towards baseline systems that adopted more complicated neural architectures."
}
Markdown (Informal)
[Syntax-Ignorant N-gram Embeddings for Sentiment Analysis of Arabic Dialects](https://preview.aclanthology.org/jlcl-multiple-ingestion/W19-4604/) (Mulki et al., WANLP 2019)
ACL