@inproceedings{muradoglu-etal-2020-compress,
title = "To compress or not to compress? A Finite-State approach to {N}en verbal morphology",
author = "Muradoglu, Saliha and
Evans, Nicholas and
Suominen, Hanna",
editor = "Rijhwani, Shruti and
Liu, Jiangming and
Wang, Yizhong and
Dror, Rotem",
booktitle = "Proceedings of the 58th Annual Meeting of the Association for Computational Linguistics: Student Research Workshop",
month = jul,
year = "2020",
address = "Online",
publisher = "Association for Computational Linguistics",
url = "https://preview.aclanthology.org/Author-page-Marten-During-lu/2020.acl-srw.28/",
doi = "10.18653/v1/2020.acl-srw.28",
pages = "207--213",
abstract = "This paper describes the development of a verbal morphological parser for an under-resourced Papuan language, Nen. Nen verbal morphology is particularly complex, with a transitive verb taking up to 1,740 unique features. The structural properties exhibited by Nen verbs raises interesting choices for analysis. Here we compare two possible methods of analysis: {\textquoteleft}Chunking' and decomposition. {\textquoteleft}Chunking' refers to the concept of collating morphological segments into one, whereas the decomposition model follows a more classical linguistic approach. Both models are built using the Finite-State Transducer toolkit foma. The resultant architecture shows differences in size and structural clarity. While the {\textquoteleft}Chunking' model is under half the size of the full de-composed counterpart, the decomposition displays higher structural order. In this paper, we describe the challenges encountered when modelling a language exhibiting distributed exponence and present the first morphological analyser for Nen, with an overall accuracy of 80.3{\%}."
}
Markdown (Informal)
[To compress or not to compress? A Finite-State approach to Nen verbal morphology](https://preview.aclanthology.org/Author-page-Marten-During-lu/2020.acl-srw.28/) (Muradoglu et al., ACL 2020)
ACL