% Workshop paper in the GEM 2025 proceedings (ACL Anthology ID 2025.gem-1.14).
% The url uses the canonical aclanthology.org host; the original export pointed
% at a branch-specific preview.aclanthology.org build, which is not a stable
% citation target.
% NOTE(review): the booktitle relies on \texttwosuperior, which presumably needs
% textcomp (or a recent LaTeX kernel) in the citing document -- confirm.
@inproceedings{wang-etal-2025-evaluating,
  author    = {Wang, Zhengxiang and Kodner, Jordan and Rambow, Owen},
  title     = {Evaluating {LLM}s with Multiple Problems at once},
  editor    = {Dhole, Kaustubh and Clinciu, Miruna},
  booktitle = {Proceedings of the Fourth Workshop on Generation, Evaluation and Metrics (GEM{\texttwosuperior})},
  pages     = {178--199},
  publisher = {Association for Computational Linguistics},
  address   = {Vienna, Austria and virtual meeting},
  month     = jul,
  year      = {2025},
  isbn      = {979-8-89176-261-9},
  url       = {https://aclanthology.org/2025.gem-1.14/},
}