@inproceedings{lovelace-etal-2024-diffusion,
title = "Diffusion Guided Language Modeling",
author = "Lovelace, Justin and
Kishore, Varsha and
Chen, Yiwei and
Weinberger, Kilian",
editor = "Ku, Lun-Wei and
Martins, Andre and
Srikumar, Vivek",
booktitle = "Findings of the Association for Computational Linguistics: ACL 2024",
month = aug,
year = "2024",
address = "Bangkok, Thailand",
publisher = "Association for Computational Linguistics",
url = "https://preview.aclanthology.org/jlcl-multiple-ingestion/2024.findings-acl.887/",
doi = "10.18653/v1/2024.findings-acl.887",
pages = "14936--14952",
abstract = "Current language models demonstrate remarkable proficiency in text generation. However, for many applications it is desirable to control attributes, such as sentiment, or toxicity, of the generated language{---}ideally tailored towards each specific use case and target audience. For auto-regressive language models, existing guidance methods are prone to decoding errors that cascade during generation and degrade performance. In contrast, text diffusion models can easily be guided with, for example, a simple linear sentiment classifier{---}however they do suffer from significantly higher perplexity than auto-regressive alternatives. In this paper we use a guided diffusion model to produce a latent proposal that steers an auto-regressive language model to generate text with desired properties. Our model inherits the unmatched fluency of the auto-regressive approach and the plug-and-play flexibility of diffusion. We show that it outperforms previous plug-and-play guidance methods across a wide range of benchmark data sets. Further, controlling a new attribute in our framework is reduced to training a single logistic regression classifier."
}
Markdown (Informal)
[Diffusion Guided Language Modeling](https://preview.aclanthology.org/jlcl-multiple-ingestion/2024.findings-acl.887/) (Lovelace et al., Findings 2024)
ACL
- Justin Lovelace, Varsha Kishore, Yiwei Chen, and Kilian Weinberger. 2024. Diffusion Guided Language Modeling. In Findings of the Association for Computational Linguistics: ACL 2024, pages 14936–14952, Bangkok, Thailand. Association for Computational Linguistics.