% Conference paper from the Findings of ACL 2026 volume.
% The abstract is stored as plain text (no inline formatting macros), and
% case protection in booktitle wraps whole words rather than single letters.
@inproceedings{zhou-etal-2026-dos,
  title     = {{DOS}: Dependency-Oriented Sampler for Masked Diffusion Language Models},
  author    = {Zhou, Xueyu and
               Hu, Yangrong and
               Huang, Jian},
  editor    = {Liakata, Maria and
               Moreira, Viviane P. and
               Zhang, Jiajun and
               Jurgens, David},
  booktitle = {Findings of the {Association} for {Computational} {Linguistics}: {ACL} 2026},
  month     = jul,
  year      = {2026},
  address   = {San Diego, California, United States},
  publisher = {Association for Computational Linguistics},
  url       = {https://preview.aclanthology.org/ingest-acl/2026.findings-acl.861/},
  pages     = {17404--17419},
  isbn      = {979-8-89176-395-1},
  abstract  = {Masked diffusion language models (MDLMs) have recently emerged as a new paradigm in language modeling, offering flexible generation dynamics and enabling efficient parallel decoding. However, existing decoding strategies for pre-trained MDLMs predominantly rely on token-level uncertainty criteria, while largely overlooking sequence-level information and inter-token dependencies. To address this limitation, we propose Dependency-Oriented Sampler (DOS), a training-free decoding strategy that leverages inter-token dependencies to inform token updates during generation. Specifically, DOS exploits attention matrices from transformer blocks to approximate inter-token dependencies, emphasizing information from unmasked tokens when updating masked positions. Empirical results demonstrate that DOS consistently achieves superior performance on both code generation and mathematical reasoning tasks. Moreover, DOS can be seamlessly integrated with existing parallel sampling methods, leading to improved generation efficiency without sacrificing generation quality.},
}
Markdown (Informal)
[DOS: Dependency-Oriented Sampler for Masked Diffusion Language Models](https://preview.aclanthology.org/ingest-acl/2026.findings-acl.861/) (Zhou et al., Findings 2026)
ACL