% LREC-COLING 2024 main-conference paper; ACL Anthology ID 2024.lrec-main.465.
% The url field uses the canonical aclanthology.org address for that ID.
@inproceedings{van-noord-etal-2024-language,
  author    = {van Noord, Rik and
               Kuzman, Taja and
               Rupnik, Peter and
               Ljube{\v{s}}i{\'c}, Nikola and
               Espl{\`a}-Gomis, Miquel and
               Ram{\'i}rez-S{\'a}nchez, Gema and
               Toral, Antonio},
  title     = {Do Language Models Care about Text Quality? Evaluating Web-Crawled Corpora across 11 Languages},
  editor    = {Calzolari, Nicoletta and
               Kan, Min-Yen and
               Hoste, Veronique and
               Lenci, Alessandro and
               Sakti, Sakriani and
               Xue, Nianwen},
  booktitle = {Proceedings of the 2024 Joint International Conference on Computational Linguistics, Language Resources and Evaluation (LREC-COLING 2024)},
  month     = may,
  year      = {2024},
  address   = {Torino, Italia},
  publisher = {ELRA and ICCL},
  pages     = {5221--5234},
  url       = {https://aclanthology.org/2024.lrec-main.465/},
}