% AfricaNLP 2026 workshop paper introducing the Sudanese-Flores benchmark.
% NOTE(review): the url field points at an ACL Anthology preview build
% ("manual-author-scripts"); confirm the canonical aclanthology.org URL
% and switch to it once verified.
@inproceedings{samil-adelani-2026-sudanese,
  title     = {{Sudanese-Flores}: Extending {FLORES}+ to {Sudanese} {Arabic} Dialect},
  author    = {Samil, Hadia Mohmmedosman Ahmed and
               Adelani, David Ifeoluwa},
  editor    = {Chimoto, Everlyn Asiko and
               Lignos, Constantine and
               Muhammad, Shamsuddeen and
               Abdulmumin, Idris and
               Siro, Clemencia and
               Adelani, David Ifeoluwa},
  booktitle = {Proceedings of the 7th Workshop on {African} Natural Language Processing ({AfricaNLP} 2026)},
  month     = mar,
  year      = {2026},
  address   = {Rabat, Morocco},
  publisher = {Association for Computational Linguistics},
  url       = {https://preview.aclanthology.org/manual-author-scripts/2026.africanlp-main.25/},
  pages     = {243--247},
  isbn      = {979-8-89176-364-7},
  abstract  = {In this work, we introduce Sudanese-Flores, an extension of the popular Flores+ machine translation (MT) benchmark to the Sudanese Arabic dialect. We translate both the DEV and DEVTEST splits of the Modern Standard Arabic dataset into the corresponding Sudanese dialect, resulting in a total of 2,009 sentences. While the dialect was recently introduced in Google Translate, there are no available benchmark in this dialect despite spoken by over 40 million people. Our evaluation on two leading LLMs such as GPT-4.1 and Gemini 2.5 Flash showed that while the performance English to Arabic is impressive (more than 23 BLEU), they struggle on Sudanese dialect (less than 11 BLEU) in zero-shot settings. In few-shot scenario, we achieved only a slight boost in performance.},
}
Markdown (Informal)
[Sudanese-Flores: Extending FLORES+ to Sudanese Arabic Dialect](https://preview.aclanthology.org/manual-author-scripts/2026.africanlp-main.25/) (Samil & Adelani, AfricaNLP 2026)
ACL