@comment{
  ACL Anthology record W18-2905 (workshop paper, Melbourne, July 2018).
  The url field is the canonical Anthology address, not a preview build.
  Non-ASCII letters in names are written as BibTeX special characters
  so that sorting and label generation work under classic BibTeX.
}
@inproceedings{karpinska-etal-2018-subcharacter,
  title     = {Subcharacter Information in {Japanese} Embeddings: When Is It Worth It?},
  author    = {Karpinska, Marzena and
               Li, Bofang and
               Rogers, Anna and
               Drozd, Aleksandr},
  editor    = {Dinu, Georgiana and
               Ballesteros, Miguel and
               Sil, Avirup and
               Bowman, Sam and
               Hamza, Wael and
               S{\o}gaard, Anders and
               Naseem, Tahira and
               Goldberg, Yoav},
  booktitle = {Proceedings of the Workshop on the Relevance of Linguistic Structure in Neural Architectures for {NLP}},
  month     = jul,
  year      = {2018},
  address   = {Melbourne, Australia},
  publisher = {Association for Computational Linguistics},
  url       = {https://aclanthology.org/W18-2905/},
  doi       = {10.18653/v1/W18-2905},
  pages     = {28--37},
  abstract  = {Languages with logographic writing systems present a difficulty for traditional character-level models. Leveraging the subcharacter information was recently shown to be beneficial for a number of intrinsic and extrinsic tasks in Chinese. We examine whether the same strategies could be applied for Japanese, and contribute a new analogy dataset for this language.},
}
Markdown (Informal)
[Subcharacter Information in Japanese Embeddings: When Is It Worth It?](https://aclanthology.org/W18-2905/) (Karpinska et al., ACL 2018)
ACL