% Workshop paper in the Proceedings of the 9th Widening NLP Workshop (2025).
% The url field uses the canonical ACL Anthology address for this record
% instead of the temporary "ingest" preview host, which is a staging location.
@inproceedings{badshah-sajjad-2025-reference,
  title     = {Reference-Guided Verdict: {LLM}s-as-Judges in Automatic Evaluation of Free-Form {QA}},
  author    = {Badshah, Sher and
               Sajjad, Hassan},
  editor    = {Zhang, Chen and
               Allaway, Emily and
               Shen, Hua and
               Miculicich, Lesly and
               Li, Yinqiao and
               M'hamdi, Meryem and
               Limkonchotiwat, Peerat and
               Bai, Richard He and
               T.y.s.s., Santosh and
               Han, Sophia Simeng and
               Thapa, Surendrabikram and
               Rim, Wiem Ben},
  booktitle = {Proceedings of the 9th Widening NLP Workshop},
  month     = nov,
  year      = {2025},
  address   = {Suzhou, China},
  publisher = {Association for Computational Linguistics},
  url       = {https://aclanthology.org/2025.winlp-main.37/},
  pages     = {251--267},
  isbn      = {979-8-89176-351-7},
}