% Conference paper entry (Findings of ACL 2026).
% NOTE(review): `url` points at a preview/ingest host; confirm the canonical URL before relying on it.
% NOTE(review): `address` looks like the conference venue rather than the publisher's city; confirm.
@inproceedings{li-etal-2026-evaluating-impact,
  title     = {Evaluating the Impact of Reviewer Guideline Design on {LLM}-Based Automated Peer Review},
  author    = {Li, Haowen and
               Ishibashi, Yoichi and
               Oyamada, Masafumi},
  editor    = {Liakata, Maria and
               Moreira, Viviane P. and
               Zhang, Jiajun and
               Jurgens, David},
  booktitle = {Findings of the {Association} for {Computational} {Linguistics}: {ACL} 2026},
  month     = jul,
  year      = {2026},
  address   = {San Diego, California, United States},
  publisher = {Association for Computational Linguistics},
  url       = {https://preview.aclanthology.org/ingest-acl/2026.findings-acl.1511/},
  pages     = {30223--30240},
  isbn      = {979-8-89176-395-1},
  abstract  = {Peer review is an essential process in scientific research, yet the growing workload has made its automation increasingly necessary. In this study, we analyze how different types of reviewer guidelines, such as official conference guidelines and reviewer-imitating ones distilled from high-quality human reviews, affect automated peer review. Our experiments show that official conference guidelines produce review results most consistent with human judgments, suggesting that evaluation criteria refined through conference practice serve as effective guidance for automated reviewing as well. In contrast, reviewer-imitating guidelines, especially those enforcing strict rubric-style scoring, consistently degraded automated review performance, highlighting the importance of allowing subjective and holistic scoring.},
}
Markdown (Informal)
[Evaluating the Impact of Reviewer Guideline Design on LLM-Based Automated Peer Review](https://preview.aclanthology.org/ingest-acl/2026.findings-acl.1511/) (Li et al., Findings 2026)
ACL