@inproceedings{abdul-rauf-hira-2023-development,
title = "Development of {U}rdu-{E}nglish Religious Domain Parallel Corpus",
author = "Abdul Rauf, Sadaf and
Hira, Noor e",
booktitle = "Proceedings of the Second Workshop on Corpus Generation and Corpus Augmentation for Machine Translation",
month = sep,
year = "2023",
address = "Macau SAR, China",
publisher = "Asia-Pacific Association for Machine Translation",
url = "https://aclanthology.org/2023.mtsummit-coco4mt.2",
pages = "14--21",
abstract = "Despite the abundance of monolingual corpora accessible online, there remains a scarcity of domain specific parallel corpora. This scarcity poses a challenge in the development of robust translation systems tailored for such specialized domains. Addressing this gap, we have developed a parallel religious domain corpus for Urdu-English. This corpus consists of 18,426 parallel sentences from Sunan Daud, carefully curated to capture the unique linguistic and contextual aspects of religious texts. The developed corpus is then used to train Urdu-English religious domain Neural Machine Translation (NMT) systems, the best system scored 27.9 BLEU points",
}
Markdown (Informal)
[Development of Urdu-English Religious Domain Parallel Corpus](https://aclanthology.org/2023.mtsummit-coco4mt.2) (Abdul Rauf & Hira, MTSummit 2023)
ACL