% Findings of ACL 2026 paper by Kathuria and Kumar on Glauber dynamics text diffusion.
% "Glauber" is brace-protected in the title so that sentence-casing bibliography
% styles keep the proper noun capitalised.
% NOTE(review): the url field points at the preview.aclanthology.org ingest host --
% confirm the canonical address before relying on this entry.
@inproceedings{kathuria-kumar-2026-leveraging,
  title     = {Leveraging Pretrained Language Models as Energy Functions for {Glauber} Dynamics Text Diffusion},
  author    = {Kathuria, Tarun and Kumar, Sachin},
  editor    = {Liakata, Maria and Moreira, Viviane P. and Zhang, Jiajun and Jurgens, David},
  booktitle = {Findings of the {Association} for {Computational} {Linguistics}: {ACL} 2026},
  month     = jul,
  year      = {2026},
  address   = {San Diego, California, United States},
  publisher = {Association for Computational Linguistics},
  url       = {https://preview.aclanthology.org/ingest-acl/2026.findings-acl.2117/},
  pages     = {42625--42643},
  isbn      = {979-8-89176-395-1},
  abstract  = {We present a discrete diffusion-based generative model for text generation using Glauber dynamics from statistical physics. Our main insight is that instead of trying to train a discrete state space diffusion model using Glauber dynamics with a uniform transition kernel as the forward process, one can set up an ``energy function'' based on pretrained causal/masked language models, which, when viewed as the stationary distribution, allows us to significantly improve the quality of the generated text. Using UL2 as our pretrained models and modifying and incorporating it into our diffusion pipeline, we obtain significantly better perplexities than prior diffusion-based text generative models and are competitive with the perplexities of GPT-2-medium and GPT-2-large for comparable model sizes. Furthermore, our models outperform prior diffusion models and GPT-2 style auto-regressive models on some zero-shot common sense reasoning tasks as well as some planning/search tasks.},
}
Markdown (Informal)
[Leveraging Pretrained Language Models as Energy Functions for Glauber Dynamics Text Diffusion](https://preview.aclanthology.org/ingest-acl/2026.findings-acl.2117/) (Kathuria & Kumar, Findings 2026)
ACL