% Conference paper in the ACL 2026 main proceedings (Volume 1: Long Papers).
% The citation key is kept as exported so existing citations keep resolving.
% The u-umlaut in the second author's surname is written as the BibTeX
% special character {\"u} so it sorts and labels as a single letter.
% NOTE(review): the url points at a preview/ingest host; confirm the
% canonical Anthology URL (and add a doi, if one exists) before publishing.
@inproceedings{singh-hakkani-t-ur-2026-llms,
  title     = {Do {LLMs} Encode Functional Importance of Reasoning Tokens?},
  author    = {Singh, Janvijay and
               Hakkani-T{\"u}r, Dilek},
  editor    = {Liakata, Maria and
               Moreira, Viviane P. and
               Zhang, Jiajun and
               Jurgens, David},
  booktitle = {Proceedings of the 64th Annual Meeting of the {A}ssociation for {C}omputational {L}inguistics (Volume 1: Long Papers)},
  month     = jul,
  year      = {2026},
  address   = {San Diego, California, United States},
  publisher = {Association for Computational Linguistics},
  url       = {https://preview.aclanthology.org/ingest-acl/2026.acl-long.1419/},
  pages     = {30749--30773},
  isbn      = {979-8-89176-390-6},
  abstract  = {Large language models solve complex tasks by generating long reasoning chains, achieving higher accuracy at the cost of increased computational cost and reduced ability to isolate functionally relevant reasoning. Prior work on compact reasoning shortens such chains through probabilistic sampling, heuristics, or supervision from frontier models, but offers limited insight into whether models internally encode token-level functional importance for answer generation. We address this gap diagnostically and propose greedy pruning, a likelihood-preserving deletion procedure that iteratively removes reasoning tokens whose removal minimally degrades model likelihood under a specified objective, yielding length-controlled reasoning chains. We evaluate pruned reasoning in a distillation framework and show that students trained on pruned chains outperform a frontier-model{--}supervised compression baseline at matched reasoning lengths. Finally, our analysis reveals systematic pruning patterns and shows that attention scores can predict greedy pruning ranks, further suggesting that models encode a nontrivial functional importance structure over reasoning tokens.},
}
Markdown (Informal)
[Do LLMs Encode Functional Importance of Reasoning Tokens?](https://preview.aclanthology.org/ingest-acl/2026.acl-long.1419/) (Singh & Hakkani-Tür, ACL 2026)
ACL
- Janvijay Singh and Dilek Hakkani-Tür. 2026. Do LLMs Encode Functional Importance of Reasoning Tokens? In Proceedings of the 64th Annual Meeting of the Association for Computational Linguistics (Volume 1: Long Papers), pages 30749–30773, San Diego, California, United States. Association for Computational Linguistics.