% Abo Mokh, Dakota & Kübler (WANLP 2022), ACL Anthology ID 2022.wanlp-1.22.
% The url field uses the canonical Anthology address rather than a preview-branch build.
@inproceedings{abo-mokh-etal-2022-improving,
  title     = {Improving {POS} Tagging for {Arabic} Dialects on Out-of-Domain Texts},
  author    = {Abo Mokh, Noor and
               Dakota, Daniel and
               K{\"u}bler, Sandra},
  editor    = {Bouamor, Houda and
               Al-Khalifa, Hend and
               Darwish, Kareem and
               Rambow, Owen and
               Bougares, Fethi and
               Abdelali, Ahmed and
               Tomeh, Nadi and
               Khalifa, Salam and
               Zaghouani, Wajdi},
  booktitle = {Proceedings of the Seventh Arabic Natural Language Processing Workshop (WANLP)},
  month     = dec,
  year      = {2022},
  address   = {Abu Dhabi, United Arab Emirates (Hybrid)},
  publisher = {Association for Computational Linguistics},
  url       = {https://aclanthology.org/2022.wanlp-1.22/},
  doi       = {10.18653/v1/2022.wanlp-1.22},
  pages     = {238--248},
  abstract  = {We investigate part of speech tagging for four Arabic dialects (Gulf, Levantine, Egyptian, and Maghrebi), in an out-of-domain setting. More specifically, we look at the effectiveness of 1) upsampling the target dialect in the training data of a joint model, 2) increasing the consistency of the annotations, and 3) using word embeddings pre-trained on a large corpus of dialectal Arabic. We increase the accuracy on average by about 20 percentage points.},
}
Markdown (Informal)
[Improving POS Tagging for Arabic Dialects on Out-of-Domain Texts](https://aclanthology.org/2022.wanlp-1.22/) (Abo Mokh et al., WANLP 2022)
ACL