@inproceedings{jiang-etal-2026-cat,
title = "{CAT}: Confidence-Adaptive Thinking for Efficient Reasoning of Large Reasoning Models",
author = "Jiang, Qizhi and
Wang, Shuo and
Ke, Pei and
Song, Yuhang and
Qin, Ke",
editor = "Li, Yunyao and
Rehm, Georg and
Tu, Mei",
booktitle = "Proceedings of the 64th Annual Meeting of the {A}ssociation for {C}omputational {L}inguistics ({ACL} 2026)",
month = jul,
year = "2026",
address = "San Diego, California, USA",
publisher = "Association for Computational Linguistics",
url = "https://preview.aclanthology.org/ingest-acl/2026.acl-industry.152/",
pages = "2271--2283",
ISBN = "979-8-89176-394-4",
abstract = "Large Reasoning Models (LRMs) have achieved remarkable success on complex tasks by leveraging long chain-of-thought (CoT) trajectories, yet they frequently exhibit overthinking on simple queries, resulting in significant token overhead and reduced inference efficiency. However, existing compression methods predominantly apply uniform length reduction or rely on coarse-grained difficulty estimation, often leading to performance degradation on difficult problems. To address this limitation, we propose Confidence-Adaptive Thinking (CAT), a framework that incorporates the model{'}s intrinsic self-certainty signals as confidence into the preference optimization process, which autonomously modulates reasoning lengths based on problem difficulty. Experimental results show that CAT consistently outperforms state-of-the-art baselines on reasoning accuracy across multiple benchmarks on different base models. Our work enables LRMs to effectively compress confident responses while deliberating on uncertain ones, offering a potentially robust solution for balancing accuracy and latency in practical industrial scenarios."
}Markdown (Informal)
[CAT: Confidence-Adaptive Thinking for Efficient Reasoning of Large Reasoning Models](https://preview.aclanthology.org/ingest-acl/2026.acl-industry.152/) (Jiang et al., ACL 2026)
ACL