% EACL 2024 Student Research Workshop paper (ACL Anthology export).
@inproceedings{demirag-etal-2024-benchmarking,
  title     = {Benchmarking Diffusion Models for Machine Translation},
  author    = {Demirag, Yunus and
               Liu, Danni and
               Niehues, Jan},
  editor    = {Falk, Neele and
               Papi, Sara and
               Zhang, Mike},
  booktitle = {Proceedings of the 18th Conference of the European Chapter of the Association for Computational Linguistics: Student Research Workshop},
  month     = mar,
  year      = {2024},
  address   = {St. Julian{'}s, Malta},
  publisher = {Association for Computational Linguistics},
  url       = {https://preview.aclanthology.org/Ingest-2025-COMPUTEL/2024.eacl-srw.25/},
  pages     = {313--324},
  abstract  = {Diffusion models have recently shown great potential on many generative tasks. In this work, we explore diffusion models for machine translation (MT). We adapt two prominent diffusion-based text generation models, Diffusion-LM and DiffuSeq, to perform machine translation. As the diffusion models generate non-autoregressively (NAR), we draw parallels to NAR machine translation models. With a comparison to conventional Transformer-based translation models, as well as to the Levenshtein Transformer, an established NAR MT model, we show that the multimodality problem that limits NAR machine translation performance is also a challenge to diffusion models. We demonstrate that knowledge distillation from an autoregressive model improves the performance of diffusion-based MT. A thorough analysis on the translation quality of inputs of different lengths shows that the diffusion models struggle more on long-range dependencies than other models.},
}
Markdown (Informal)
[Benchmarking Diffusion Models for Machine Translation](https://preview.aclanthology.org/Ingest-2025-COMPUTEL/2024.eacl-srw.25/) (Demirag et al., EACL 2024)
ACL
- Yunus Demirag, Danni Liu, and Jan Niehues. 2024. Benchmarking Diffusion Models for Machine Translation. In Proceedings of the 18th Conference of the European Chapter of the Association for Computational Linguistics: Student Research Workshop, pages 313–324, St. Julian’s, Malta. Association for Computational Linguistics.