% WiNLP 2020 workshop paper presenting the SIMPLEX-PB 2.0 dataset (ACL Anthology ID 2020.winlp-1.6).
% The url field uses the canonical aclanthology.org address rather than a preview.aclanthology.org branch build.
@inproceedings{hartmann-etal-2020-simplex,
  title     = {{SIMPLEX}-{PB} 2.0: A Reliable Dataset for Lexical Simplification in {Brazilian} {Portuguese}},
  author    = {Hartmann, Nathan and
               Paetzold, Gustavo Henrique and
               Alu{\'i}sio, Sandra},
  editor    = {Cunha, Rossana and
               Shaikh, Samira and
               Varis, Erika and
               Georgi, Ryan and
               Tsai, Alicia and
               Anastasopoulos, Antonios and
               Chandu, Khyathi Raghavi},
  booktitle = {Proceedings of the Fourth Widening Natural Language Processing Workshop},
  month     = jul,
  year      = {2020},
  address   = {Seattle, USA},
  publisher = {Association for Computational Linguistics},
  url       = {https://aclanthology.org/2020.winlp-1.6/},
  doi       = {10.18653/v1/2020.winlp-1.6},
  pages     = {18--22},
  abstract  = {Most research on Lexical Simplification (LS) addresses non-native speakers of English, since they are numerous and easy to recruit. This makes it difficult to create LS solutions for other languages and target audiences. This paper presents SIMPLEX-PB 2.0, a dataset for LS in Brazilian Portuguese that, unlike its predecessor SIMPLEX-PB, accurately captures the needs of Brazilian underprivileged children. To create SIMPLEX-PB 2.0, we addressed all limitations of the old SIMPLEX-PB through multiple rounds of manual annotation. As a result, SIMPLEX-PB 2.0 features much more reliable and numerous candidate substitutions to complex words, as well as word complexity rankings produced by a group underprivileged children.},
}
Markdown (Informal)
[SIMPLEX-PB 2.0: A Reliable Dataset for Lexical Simplification in Brazilian Portuguese](https://aclanthology.org/2020.winlp-1.6/) (Hartmann et al., WiNLP 2020)
ACL