% Boubdir et al. (2023), paper in the GEM workshop proceedings.
% The url field uses the canonical ACL Anthology address instead of a
% branch-specific preview mirror; braces around Elo and GEM preserve their
% capitalisation under styles that sentence-case titles.
@inproceedings{boubdir-etal-2023-elo,
  author    = {Boubdir, Meriem and Kim, Edward and Ermis, Beyza and Hooker, Sara and Fadaee, Marzieh},
  title     = {{Elo} Uncovered: Robustness and Best Practices in Language Model Evaluation},
  editor    = {Gehrmann, Sebastian and Wang, Alex and Sedoc, Jo{\~a}o and Clark, Elizabeth and Dhole, Kaustubh and Chandu, Khyathi Raghavi and Santus, Enrico and Sedghamiz, Hooman},
  booktitle = {Proceedings of the Third Workshop on Natural Language Generation, Evaluation, and Metrics ({GEM})},
  month     = dec,
  year      = {2023},
  address   = {Singapore},
  publisher = {Association for Computational Linguistics},
  pages     = {339--352},
  url       = {https://aclanthology.org/2023.gem-1.28/},
}