@inproceedings{li-etal-2021-segmenting-natural,
title = "Segmenting Natural Language Sentences via Lexical Unit Analysis",
author = "Li, Yangming and
Liu, Lemao and
Shi, Shuming",
editor = "Moens, Marie-Francine and
Huang, Xuanjing and
Specia, Lucia and
Yih, Scott Wen-tau",
booktitle = "Findings of the Association for Computational Linguistics: EMNLP 2021",
month = nov,
year = "2021",
address = "Punta Cana, Dominican Republic",
publisher = "Association for Computational Linguistics",
url = "https://preview.aclanthology.org/landing_page/2021.findings-emnlp.18/",
doi = "10.18653/v1/2021.findings-emnlp.18",
pages = "181--187",
abstract = "The span-based model enjoys great popularity in recent works of sequence segmentation. However, each of these methods suffers from its own defects, such as invalid predictions. In this work, we introduce a unified span-based model, lexical unit analysis (LUA), that addresses all these matters. Segmenting a lexical unit sequence involves two steps. Firstly, we embed every span by using the representations from a pretraining language model. Secondly, we define a score for every segmentation candidate and apply dynamic programming (DP) to extract the candidate with the maximum score. We have conducted extensive experiments on 3 tasks, (e.g., syntactic chunking), across 7 datasets. LUA has established new state-of-the-art performances on 6 of them. We have achieved even better results through incorporating label correlations."
}
Markdown (Informal)
[Segmenting Natural Language Sentences via Lexical Unit Analysis](https://preview.aclanthology.org/landing_page/2021.findings-emnlp.18/) (Li et al., Findings 2021)
ACL