% TSAR-2022 workshop paper; this record corresponds to ACL Anthology ID 2022.tsar-1.2.
% Words that must keep their capitalisation are brace-protected as whole words.
@inproceedings{hatagaki-etal-2022-parallel,
  title     = {Parallel Corpus Filtering for {Japanese} Text Simplification},
  author    = {Hatagaki, Koki and
               Kajiwara, Tomoyuki and
               Ninomiya, Takashi},
  editor    = {{\v{S}}tajner, Sanja and
               Saggion, Horacio and
               Ferr{\'e}s, Daniel and
               Shardlow, Matthew and
               Sheang, Kim Cheng and
               North, Kai and
               Zampieri, Marcos and
               Xu, Wei},
  booktitle = {Proceedings of the Workshop on Text Simplification, Accessibility, and Readability ({TSAR-2022})},
  month     = dec,
  year      = {2022},
  address   = {Abu Dhabi, United Arab Emirates (Virtual)},
  publisher = {Association for Computational Linguistics},
  url       = {https://aclanthology.org/2022.tsar-1.2},
  doi       = {10.18653/v1/2022.tsar-1.2},
  pages     = {12--18},
  abstract  = {We propose a method of parallel corpus filtering for Japanese text simplification. The parallel corpus for this task contains some redundant wording. In this study, we first identify the type and size of noisy sentence pairs in the Japanese text simplification corpus. We then propose a method of parallel corpus filtering to remove each type of noisy sentence pair. Experimental results show that filtering the training parallel corpus with the proposed method improves simplification performance.},
}
Markdown (Informal)
[Parallel Corpus Filtering for Japanese Text Simplification](https://aclanthology.org/2022.tsar-1.2) (Hatagaki et al., TSAR 2022)
ACL
- Koki Hatagaki, Tomoyuki Kajiwara, and Takashi Ninomiya. 2022. Parallel Corpus Filtering for Japanese Text Simplification. In Proceedings of the Workshop on Text Simplification, Accessibility, and Readability (TSAR-2022), pages 12–18, Abu Dhabi, United Arab Emirates (Virtual). Association for Computational Linguistics.