% Workshop paper (RAIL 2024) introducing Tswana-Popapolelo, a UD treebank for Tswana.
% The url field uses the permanent ACL Anthology address rather than a preview build.
% Whole words are brace-protected in the title so sentence-casing styles keep the
% proper nouns and the treebank name intact.
@inproceedings{gaustad-etal-2024-first,
  title     = {The First {Universal} {Dependency} Treebank for {Tswana}: {Tswana-Popapolelo}},
  author    = {Gaustad, Tanja and
               Berg, Ansu and
               Pretorius, Rigardt and
               Eiselen, Roald},
  editor    = {Mabuya, Rooweither and
               Matfunjwa, Muzi and
               Setaka, Mmasibidi and
               van Zaanen, Menno},
  booktitle = {Proceedings of the Fifth Workshop on Resources for African Indigenous Languages @ {LREC-COLING} 2024},
  month     = may,
  year      = {2024},
  address   = {Torino, Italia},
  publisher = {ELRA and ICCL},
  url       = {https://aclanthology.org/2024.rail-1.7/},
  pages     = {55--65},
  abstract  = {This paper presents the first publicly available UD treebank for Tswana, Tswana-Popapolelo. The data used consists of the 20 Cairo CICLing sentences translated to Tswana. After pre-processing these sentences with detailed POS (XPOS) and converting them to universal POS (UPOS), we proceeded to annotate the data with dependency relations, documenting decisions for the language specific constructions. Linguistic issues encountered are described in detail as this is the first application of the UD framework to produce a dependency treebank for the Bantu language family in general and for Tswana specifically.},
}
Markdown (Informal)
[The First Universal Dependency Treebank for Tswana: Tswana-Popapolelo](https://aclanthology.org/2024.rail-1.7/) (Gaustad et al., RAIL 2024)
ACL