% Micallef et al. (2022): workshop paper introducing a new corpus and BERT models for Maltese.
% The url field uses the canonical ACL Anthology address (same identifier as the DOI suffix),
% not a temporary preview-branch link.
@inproceedings{micallef-etal-2022-pre,
  author    = {Micallef, Kurt and Gatt, Albert and Tanti, Marc and van der Plas, Lonneke and Borg, Claudia},
  title     = {Pre-training Data Quality and Quantity for a Low-Resource Language: New Corpus and {BERT} Models for {Maltese}},
  editor    = {Cherry, Colin and Fan, Angela and Foster, George and Haffari, Gholamreza (Reza) and Khadivi, Shahram and Peng, Nanyun (Violet) and Ren, Xiang and Shareghi, Ehsan and Swayamdipta, Swabha},
  booktitle = {Proceedings of the Third Workshop on Deep Learning for Low-Resource Natural Language Processing},
  month     = jul,
  year      = {2022},
  address   = {Hybrid},
  publisher = {Association for Computational Linguistics},
  pages     = {90--101},
  doi       = {10.18653/v1/2022.deeplo-1.10},
  url       = {https://aclanthology.org/2022.deeplo-1.10/},
}