% Conference paper in the Findings of ACL 2025 volume.
% The url field uses the canonical ACL Anthology address for this paper ID
% (2025.findings-acl.958) rather than a temporary preview-branch link.
% Braces in the title protect whole words whose capitalisation must survive
% sentence-casing bibliography styles.
@inproceedings{deshpande-etal-2025-multichallenge,
  author    = {Deshpande, Kaustubh and
               Sirdeshmukh, Ved and
               Mols, Johannes Baptist and
               Jin, Lifeng and
               Hernandez-Cardona, Ed-Yeremai and
               Lee, Dean and
               Kritz, Jeremy and
               Primack, Willow E. and
               Yue, Summer and
               Xing, Chen},
  title     = {{MultiChallenge}: A Realistic Multi-Turn Conversation Evaluation Benchmark Challenging to Frontier {LLMs}},
  editor    = {Che, Wanxiang and
               Nabende, Joyce and
               Shutova, Ekaterina and
               Pilehvar, Mohammad Taher},
  booktitle = {Findings of the Association for Computational Linguistics: ACL 2025},
  month     = jul,
  year      = {2025},
  address   = {Vienna, Austria},
  publisher = {Association for Computational Linguistics},
  pages     = {18632--18702},
  isbn      = {979-8-89176-256-5},
  url       = {https://aclanthology.org/2025.findings-acl.958/},
}