@comment{ACL-IJCNLP 2021 short paper. The url field uses the canonical ACL Anthology permalink, not a preview-build address; the doi is the stable identifier.}
@inproceedings{wang-etal-2021-input,
  title     = {Input Representations for Parsing Discourse Representation Structures: Comparing {English} with {Chinese}},
  author    = {Wang, Chunliu and
               van Noord, Rik and
               Bisazza, Arianna and
               Bos, Johan},
  editor    = {Zong, Chengqing and
               Xia, Fei and
               Li, Wenjie and
               Navigli, Roberto},
  booktitle = {Proceedings of the 59th Annual Meeting of the Association for Computational Linguistics and the 11th International Joint Conference on Natural Language Processing (Volume 2: Short Papers)},
  month     = aug,
  year      = {2021},
  address   = {Online},
  publisher = {Association for Computational Linguistics},
  url       = {https://aclanthology.org/2021.acl-short.97/},
  doi       = {10.18653/v1/2021.acl-short.97},
  pages     = {767--775},
  abstract  = {Neural semantic parsers have obtained acceptable results in the context of parsing DRSs (Discourse Representation Structures). In particular models with character sequences as input showed remarkable performance for English. But how does this approach perform on languages with a different writing system, like Chinese, a language with a large vocabulary of characters? Does rule-based tokenisation of the input help, and which granularity is preferred: characters, or words? The results are promising. Even with DRSs based on English, good results for Chinese are obtained. Tokenisation offers a small advantage for English, but not for Chinese. Overall, characters are preferred as input, both for English and Chinese.},
}
Markdown (Informal)
[Input Representations for Parsing Discourse Representation Structures: Comparing English with Chinese](https://aclanthology.org/2021.acl-short.97/) (Wang et al., ACL-IJCNLP 2021)
ACL