% Conference paper record (ACL Anthology ID L16-1102, per the url field).
% Words in the title that must keep their capitals under sentence-casing
% styles are brace-protected; the url is the canonical Anthology address.
@inproceedings{daiber-van-der-goot-2016-denoised,
    title     = {The {Denoised} {Web} {Treebank}: Evaluating Dependency Parsing under Noisy Input Conditions},
    author    = {Daiber, Joachim and
                 van der Goot, Rob},
    editor    = {Calzolari, Nicoletta and
                 Choukri, Khalid and
                 Declerck, Thierry and
                 Goggi, Sara and
                 Grobelnik, Marko and
                 Maegaard, Bente and
                 Mariani, Joseph and
                 Mazo, Helene and
                 Moreno, Asuncion and
                 Odijk, Jan and
                 Piperidis, Stelios},
    booktitle = {Proceedings of the Tenth International Conference on Language Resources and Evaluation ({LREC}'16)},
    month     = may,
    year      = {2016},
    address   = {Portoro{\v{z}}, Slovenia},
    publisher = {European Language Resources Association (ELRA)},
    url       = {https://aclanthology.org/L16-1102/},
    pages     = {649--653},
    abstract  = {We introduce the Denoised Web Treebank: a treebank including a normalization layer and a corresponding evaluation metric for dependency parsing of noisy text, such as Tweets. This benchmark enables the evaluation of parser robustness as well as text normalization methods, including normalization as machine translation and unsupervised lexical normalization, directly on syntactic trees. Experiments show that text normalization together with a combination of domain-specific and generic part-of-speech taggers can lead to a significant improvement in parsing accuracy on this test set.},
}
Markdown (Informal)
[The Denoised Web Treebank: Evaluating Dependency Parsing under Noisy Input Conditions](https://aclanthology.org/L16-1102/) (Daiber & van der Goot, LREC 2016)
ACL