@inproceedings{du-etal-2024-revisiting,
title = "Revisiting the {M}arkov Property for Machine Translation",
author = "Du, Cunxiao and
Zhou, Hao and
Tu, Zhaopeng and
Jiang, Jing",
editor = "Graham, Yvette and
Purver, Matthew",
booktitle = "Findings of the Association for Computational Linguistics: EACL 2024",
month = mar,
year = "2024",
address = "St. Julian{'}s, Malta",
publisher = "Association for Computational Linguistics",
url = "https://preview.aclanthology.org/jlcl-multiple-ingestion/2024.findings-eacl.40/",
pages = "582--588",
abstract = "In this paper, we re-examine the Markov property in the context of neural machine translation. We design a Markov Autoregressive Transformer (MAT) and undertake a comprehensive assessment of its performance across four WMT benchmarks. Our findings indicate that MAT with an order larger than 4 can generate translations with quality on par with that of conventional autoregressive transformers. In addition, counter-intuitively, we also find that the advantages of utilizing a higher-order MAT do not specifically contribute to the translation of longer sentences."
}
Markdown (Informal)
[Revisiting the Markov Property for Machine Translation](https://preview.aclanthology.org/jlcl-multiple-ingestion/2024.findings-eacl.40/) (Du et al., Findings 2024)
ACL