% Conference-paper record for the AdaJudge paper (ACL 2026, Volume 1: Long Papers).
% Case-sensitive words in title and booktitle are protected as whole words so that
% sentence-casing styles keep their capitals without splitting the word mid-letter.
% NOTE(review): url points at a preview.aclanthology.org ingest path; presumably it
% should be switched to the canonical Anthology URL once one exists -- confirm.
% NOTE(review): address looks like the meeting location rather than the
% publisher's city; kept as exported -- confirm against the target style.
@inproceedings{miao-etal-2026-adajudge,
  title     = {{AdaJudge}: Adaptive Multi-Perspective Judging for Reward Modeling},
  author    = {Miao, Yongliang and
               Liang, Yangyang and
               Du, Mengnan},
  editor    = {Liakata, Maria and
               Moreira, Viviane P. and
               Zhang, Jiajun and
               Jurgens, David},
  booktitle = {Proceedings of the 64th Annual Meeting of the {Association} for {Computational} {Linguistics} (Volume 1: Long Papers)},
  month     = jul,
  year      = {2026},
  address   = {San Diego, California, United States},
  publisher = {Association for Computational Linguistics},
  url       = {https://preview.aclanthology.org/ingest-acl/2026.acl-long.440/},
  pages     = {9712--9724},
  isbn      = {979-8-89176-390-6},
  abstract  = {Reward modeling is essential for aligning large language models with human preferences, yet predominant architectures rely on a static pooling strategy to condense sequences into scalar scores. This paradigm, however, suffers from two key limitations: a static inductive bias that misaligns with the task-dependent preference signals, and a representational mismatch, as the backbone{'}s optimization for generation leaves its representations ill-suited to fine-grained discrimination. To address this, we propose AdaJudge, a unified framework that jointly adapts representation and aggregation. AdaJudge first improves backbone representations into a discrimination-oriented space via gated refinement blocks. It then replaces the static readout with an adaptive multi-view pooling module, which dynamically routes and combines evidence. Extensive experiments on RM-Bench and JudgeBench show that AdaJudge outperforms strong off-the-shelf reward models and traditional pooling baselines.},
}
Markdown (Informal)
[AdaJudge: Adaptive Multi-Perspective Judging for Reward Modeling](https://preview.aclanthology.org/ingest-acl/2026.acl-long.440/) (Miao et al., ACL 2026)
ACL
- Yongliang Miao, Yangyang Liang, and Mengnan Du. 2026. AdaJudge: Adaptive Multi-Perspective Judging for Reward Modeling. In Proceedings of the 64th Annual Meeting of the Association for Computational Linguistics (Volume 1: Long Papers), pages 9712–9724, San Diego, California, United States. Association for Computational Linguistics.