@inproceedings{hou-li-2024-character,
title = "Character-Level {C}hinese Dependency Parsing via Modeling Latent Intra-Word Structure",
author = "Hou, Yang and
Li, Zhenghua",
editor = "Ku, Lun-Wei and
Martins, Andre and
Srikumar, Vivek",
booktitle = "Findings of the Association for Computational Linguistics: ACL 2024",
month = aug,
year = "2024",
address = "Bangkok, Thailand",
publisher = "Association for Computational Linguistics",
url = "https://preview.aclanthology.org/jlcl-multiple-ingestion/2024.findings-acl.173/",
doi = "10.18653/v1/2024.findings-acl.173",
pages = "2943--2956",
abstract = "Revealing the syntactic structure of sentences in Chinese poses significant challenges for word-level parsers due to the absence of clear word boundaries. To facilitate a transition from word-level to character-level Chinese dependency parsing, this paper proposes modeling latent internal structures within words. In this way, each word-level dependency tree is interpreted as a forest of character-level trees. A constrained Eisner algorithm is implemented to ensure the compatibility of character-level trees, guaranteeing a single root for intra-word structures and establishing inter-word dependencies between these roots. Experiments on Chinese treebanks demonstrate the superiority of our method over both the pipeline framework and previous joint models. A detailed analysis reveals that a coarse-to-fine parsing strategy empowers the model to predict more linguistically plausible intra-word structures."
}
Markdown (Informal)
[Character-Level Chinese Dependency Parsing via Modeling Latent Intra-Word Structure](https://preview.aclanthology.org/jlcl-multiple-ingestion/2024.findings-acl.173/) (Hou & Li, Findings 2024)
ACL