% Workshop paper, ACL Anthology ID 2025.eval4nlp-1.14.
% The url field uses the canonical aclanthology.org address instead of a
% preview.aclanthology.org ingestion build (presumably temporary staging).
% NOTE(review): address holds the conference venue, per ACL Anthology export
% convention, not the publisher's city.
@inproceedings{kranti-etal-2025-test,
  author    = {Kranti, Chalamalasetti and
               Bernier-Colborne, Gabriel and
               Gauthier, Yvan and
               Vajjala, Sowmya},
  title     = {Test Set Quality in Multilingual {LLM} Evaluation},
  editor    = {Akter, Mousumi and
               Chowdhury, Tahiya and
               Eger, Steffen and
               Leiter, Christoph and
               Opitz, Juri and
               {\c{C}}ano, Erion},
  booktitle = {Proceedings of the 5th Workshop on Evaluation and Comparison of {NLP} Systems},
  month     = dec,
  year      = {2025},
  address   = {Mumbai, India},
  publisher = {Association for Computational Linguistics},
  pages     = {167--178},
  isbn      = {979-8-89176-305-0},
  url       = {https://aclanthology.org/2025.eval4nlp-1.14/},
}