% Entry for Anthology paper 2026.abjadnlp-1.33 (ID taken from the url field).
% Proper nouns and acronyms are protected as whole words ({Arabic}, {NLP}) so
% that sentence-casing bibliography styles keep their capitals.
% NOTE(review): the url host is preview.aclanthology.org - presumably a staging
% build; confirm and switch to the canonical Anthology URL once it is available.
@inproceedings{karout-etal-2026-arabic,
  author    = {Karout, Youssef and
               Hammoud, Hadi and
               Zaraket, Fadi},
  title     = {{Arabic} Citation Parsing using Part of Speech and Named Entity Recognition},
  booktitle = {Proceedings of the 2nd Workshop on {NLP} for Languages Using {Arabic} Script},
  month     = mar,
  year      = {2026},
  address   = {Rabat, Morocco},
  publisher = {Association for Computational Linguistics},
  pages     = {245--252},
  url       = {https://preview.aclanthology.org/manual-author-scripts/2026.abjadnlp-1.33/},
  abstract  = {This paper introduces an industry level citation element extractor from Arabic text. Citation element extraction enables editorial task automation for publishing houses, creation of citation networks, and automatic citation analytics for impact analysis firms. Citation library tools help users manage their citations. However, for Arabic, these tools lack basic support to identify and extract citation elements. Consequently, researchers, editors and reviewers manually manage Arabic citations tasks. We present a novel Arabic citation element dataset, use it to train a citation element extraction model, and use named entity recognition, morphological analysis, and keyword detection to improve the results for practical use. The paper reports industry ready performance with F1 scores ranging between .80 and .95 for interesting citation elements.},
}
Markdown (Informal)
[Arabic Citation Parsing using Part of Speech and Named Entity Recognition](https://preview.aclanthology.org/manual-author-scripts/2026.abjadnlp-1.33/) (Karout et al., AbjadNLP 2026)
ACL