% CWSeg paper (Li, Zhao, Tan) from the ACL 2023 Industry Track proceedings.
% Title words that must keep their case are braced as whole words so that
% sentence-casing styles leave them intact without breaking kerning.
@inproceedings{li-etal-2023-cwseg,
  author    = {Li, Dedong and Zhao, Rui and Tan, Fei},
  title     = {{CWSeg}: An Efficient and General Approach to {Chinese} Word Segmentation},
  editor    = {Sitaram, Sunayana and Beigman Klebanov, Beata and Williams, Jason D.},
  booktitle = {Proceedings of the 61st Annual Meeting of the Association for Computational Linguistics (Volume 5: Industry Track)},
  month     = jul,
  year      = {2023},
  address   = {Toronto, Canada},
  publisher = {Association for Computational Linguistics},
  pages     = {1--10},
  doi       = {10.18653/v1/2023.acl-industry.1},
  url       = {https://aclanthology.org/2023.acl-industry.1},
  abstract  = {In this work, we report our efforts in advancing Chinese Word Segmentation for the purpose of rapid deployment in different applications. The pre-trained language model (PLM) based segmentation methods have achieved state-of-the-art (SOTA) performance, whereas this paradigm also poses challenges in the deployment. It includes the balance between performance and cost, segmentation ambiguity due to domain diversity and vague words boundary, and multi-grained segmentation. In this context, we propose a simple yet effective approach, namely CWSeg, to augment PLM-based schemes by developing cohort training and versatile decoding strategies. Extensive experiments on benchmark datasets demonstrate the efficiency and generalization of our approach. The corresponding segmentation system is also implemented for practical usage and the demo is recorded.},
}
Markdown (Informal)
[CWSeg: An Efficient and General Approach to Chinese Word Segmentation](https://aclanthology.org/2023.acl-industry.1) (Li et al., ACL 2023)
ACL