@inproceedings{wong-etal-2026-models,
title = "When Models Decide and When They Bind: A Two-Stage Computation for Multiple-Choice Question Answering",
author = "Wong, Hugh Mee and
Nouwen, Rick and
Gatt, Albert",
editor = "Liakata, Maria and
Moreira, Viviane P. and
Zhang, Jiajun and
Jurgens, David",
booktitle = "Findings of the {A}ssociation for {C}omputational {L}inguistics: {ACL} 2026",
month = jul,
year = "2026",
address = "San Diego, California, United States",
publisher = "Association for Computational Linguistics",
url = "https://preview.aclanthology.org/ingest-acl/2026.findings-acl.1144/",
pages = "22804--22821",
ISBN = "979-8-89176-395-1",
abstract = "Multiple-choice question answering (MCQA) is easy to evaluate but adds a meta-task: models must both solve the problem and output the symbol that represents the answer, conflating reasoning errors with symbol-binding failures. We study how language models implement MCQA internally using representational analyses (PCA, linear probes) as well as causal interventions. We find that option-boundary (newline) residual states often contain strong linearly decodable signals related to per-option correctness. Winner-identity probing reveals a two-stage progression: the winning content position becomes decodable immediately after the final option is processed, while the output symbol is represented closer to the answer emission position. Tests under symbol and content permutations support a two-stage mechanism in which models first select a winner in content space and then bind or route that winner to the appropriate symbol to emit."
}Markdown (Informal)
[When Models Decide and When They Bind: A Two-Stage Computation for Multiple-Choice Question Answering](https://preview.aclanthology.org/ingest-acl/2026.findings-acl.1144/) (Wong et al., Findings 2026)
ACL