% Conference paper (ACL 2026, Volume 1: Long Papers) introducing Deco-G.
% NOTE(review): the url field points at a preview.aclanthology.org ingest
% build; presumably it should be swapped for the canonical Anthology link
% once the volume is published -- confirm before citing.
% NOTE(review): address holds the conference venue as exported, not the
% publisher's city -- keep or move depending on the target style.
@inproceedings{deng-etal-2026-decoupling,
  author    = {Deng, Haikang and
               Kung, Po-Nien and
               Peng, Nanyun},
  title     = {Decoupling Task-Solving and Output Formatting in {LLM} Generation},
  editor    = {Liakata, Maria and
               Moreira, Viviane P. and
               Zhang, Jiajun and
               Jurgens, David},
  booktitle = {Proceedings of the 64th Annual Meeting of the {Association} for {Computational} {Linguistics} (Volume 1: Long Papers)},
  month     = jul,
  year      = {2026},
  address   = {San Diego, California, United States},
  publisher = {Association for Computational Linguistics},
  pages     = {16764--16781},
  isbn      = {979-8-89176-390-6},
  url       = {https://preview.aclanthology.org/ingest-acl/2026.acl-long.764/},
  abstract  = {Large language models (LLMs) are increasingly adept at solving complex problems, such as mathematical reasoning and automatic evaluation. However, performance often degrades when prompts intertwine task instructions with rigid formatting requirements. This entanglement creates competing goals for the model, hindering its reasoning capabilities. To address this, we introduce Deco-G, a decoding framework that explicitly decouples format adherence from problem solving. Deco-G delegates format adherence to a separate Format Estimation Module (FEM), which performs probabilistic lookahead to estimate future format compliance rate and reweighs token probabilities, allowing the LLM to focus solely on task resolution. To make this approach both practical and efficient, we introduce three key innovations: instruction-aware distillation, a flexible trie-building algorithm, and HMM state pruning. Experiments across mathematical reasoning, event argument extraction, and LLM-as-a-judge demonstrate that Deco-G constantly gains over prompting or structured generation baselines, with guaranteed format compliance.},
}
Markdown (Informal)
[Decoupling Task-Solving and Output Formatting in LLM Generation](https://preview.aclanthology.org/ingest-acl/2026.acl-long.764/) (Deng et al., ACL 2026)
ACL
- Haikang Deng, Po-Nien Kung, and Nanyun Peng. 2026. Decoupling Task-Solving and Output Formatting in LLM Generation. In Proceedings of the 64th Annual Meeting of the Association for Computational Linguistics (Volume 1: Long Papers), pages 16764–16781, San Diego, California, United States. Association for Computational Linguistics.