% Barbaresi & Lejeune (2020), paper 2 of the 12th Web as Corpus Workshop (WAC-XII).
% The url field uses the canonical ACL Anthology address rather than a preview-branch build.
% {Multilingual} is brace-protected so sentence-casing styles keep the capital after the "?".
@inproceedings{barbaresi-lejeune-2020-box,
  author    = {Barbaresi, Adrien and Lejeune, Ga{\"e}l},
  title     = {Out-of-the-Box and into the Ditch? {Multilingual} Evaluation of Generic Text Extraction Tools},
  editor    = {Barbaresi, Adrien and Bildhauer, Felix and Sch{\"a}fer, Roland and Stemle, Egon},
  booktitle = {Proceedings of the 12th Web as Corpus Workshop},
  month     = may,
  year      = {2020},
  address   = {Marseille, France},
  publisher = {European Language Resources Association},
  pages     = {5--13},
  isbn      = {979-10-95546-68-9},
  language  = {eng},
  url       = {https://aclanthology.org/2020.wac-1.2/},
}