% Workshop paper (WILDRE5, 2020). The url field holds the canonical ACL Anthology
% address for record 2020.wildre-1.8 instead of a short-lived preview-build link.
% The proper noun in the title is brace-protected as a whole word so that
% sentence-casing bibliography styles keep its capital.
@inproceedings{nallani-etal-2020-fully,
  title     = {A Fully Expanded Dependency Treebank for {Telugu}},
  author    = {Nallani, Sneha and
               Shrivastava, Manish and
               Sharma, Dipti},
  editor    = {Jha, Girish Nath and
               Bali, Kalika and
               L., Sobha and
               Agrawal, S. S. and
               Ojha, Atul Kr.},
  booktitle = {Proceedings of the WILDRE5{--} 5th Workshop on Indian Language Data: Resources and Evaluation},
  month     = may,
  year      = {2020},
  address   = {Marseille, France},
  publisher = {European Language Resources Association (ELRA)},
  url       = {https://aclanthology.org/2020.wildre-1.8/},
  pages     = {39--44},
  language  = {eng},
  isbn      = {979-10-95546-67-2},
  abstract  = {Treebanks are an essential resource for syntactic parsing. The available Paninian dependency treebank(s) for Telugu is annotated only with inter-chunk dependency relations and not all words of a sentence are part of the parse tree. In this paper, we automatically annotate the intra-chunk dependencies in the treebank using a Shift-Reduce parser based on Context Free Grammar rules for Telugu chunks. We also propose a few additional intra-chunk dependency relations for Telugu apart from the ones used in Hindi treebank. Annotating intra-chunk dependencies finally provides a complete parse tree for every sentence in the treebank. Having a fully expanded treebank is crucial for developing end to end parsers which produce complete trees. We present a fully expanded dependency treebank for Telugu consisting of 3220 sentences. In this paper, we also convert the treebank annotated with Anncorra part-of-speech tagset to the latest BIS tagset. The BIS tagset is a hierarchical tagset adopted as a unified part-of-speech standard across all Indian Languages. The final treebank is made publicly available.},
}
Markdown (Informal)
[A Fully Expanded Dependency Treebank for Telugu](https://aclanthology.org/2020.wildre-1.8/) (Nallani et al., WILDRE 2020)
ACL
- Sneha Nallani, Manish Shrivastava, and Dipti Sharma. 2020. A Fully Expanded Dependency Treebank for Telugu. In Proceedings of the WILDRE5– 5th Workshop on Indian Language Data: Resources and Evaluation, pages 39–44, Marseille, France. European Language Resources Association (ELRA).