% Gevers et al., paper in the EMNLP 2025 proceedings (ACL Anthology ID 2025.emnlp-main.1208).
% The url field uses the permanent aclanthology.org address; preview/ingest builds are temporary.
@inproceedings{gevers-etal-2025-benchmarks,
  title     = {In Benchmarks We Trust ... Or Not?},
  author    = {Gevers, Ine
               and De Marez, Victor
               and Van Nooten, Jens
               and Lemmens, Jens
               and Kosar, Andriy
               and Lotfi, Ehsan
               and Banar, Nikolay
               and Fivez, Pieter
               and De Bruyne, Luna
               and Daelemans, Walter},
  editor    = {Christodoulopoulos, Christos
               and Chakraborty, Tanmoy
               and Rose, Carolyn
               and Peng, Violet},
  booktitle = {Proceedings of the 2025 Conference on Empirical Methods in Natural Language Processing},
  month     = nov,
  year      = {2025},
  address   = {Suzhou, China},
  publisher = {Association for Computational Linguistics},
  url       = {https://aclanthology.org/2025.emnlp-main.1208/},
  pages     = {23673--23687},
  isbn      = {979-8-89176-332-6},
}