@comment{
  salama-etal-2014-youdacc: conference paper (LREC 2014) introducing the
  YouDACC corpus. The url field uses the canonical ACL Anthology address for
  paper ID L14-1456 rather than a temporary preview-build address. Title
  words that must keep their capitalisation are protected with whole-word
  braces so sentence-casing styles leave them intact.
}
@inproceedings{salama-etal-2014-youdacc,
  title     = {{YouDACC}: the {Youtube} Dialectal {Arabic} Comment Corpus},
  author    = {Salama, Ahmed and
               Bouamor, Houda and
               Mohit, Behrang and
               Oflazer, Kemal},
  editor    = {Calzolari, Nicoletta and
               Choukri, Khalid and
               Declerck, Thierry and
               Loftsson, Hrafn and
               Maegaard, Bente and
               Mariani, Joseph and
               Moreno, Asuncion and
               Odijk, Jan and
               Piperidis, Stelios},
  booktitle = {Proceedings of the Ninth International Conference on Language Resources and Evaluation ({LREC}'14)},
  month     = may,
  year      = {2014},
  address   = {Reykjavik, Iceland},
  publisher = {European Language Resources Association (ELRA)},
  url       = {https://aclanthology.org/L14-1456/},
  pages     = {1246--1251},
  abstract  = {This paper presents YOUDACC, an automatically annotated large-scale multi-dialectal Arabic corpus collected from user comments on Youtube videos. Our corpus covers different groups of dialects: Egyptian (EG), Gulf (GU), Iraqi (IQ), Maghrebi (MG) and Levantine (LV). We perform an empirical analysis on the crawled corpus and demonstrate that our location-based proposed method is effective for the task of dialect labeling.},
}
Markdown (Informal)
[YouDACC: the Youtube Dialectal Arabic Comment Corpus](https://aclanthology.org/L14-1456/) (Salama et al., LREC 2014)
ACL
- Ahmed Salama, Houda Bouamor, Behrang Mohit, and Kemal Oflazer. 2014. YouDACC: the Youtube Dialectal Arabic Comment Corpus. In Proceedings of the Ninth International Conference on Language Resources and Evaluation (LREC'14), pages 1246–1251, Reykjavik, Iceland. European Language Resources Association (ELRA).