% Park & Tsvetkov, workshop paper in the 3rd Workshop on Neural Generation and
% Translation (2019). The url field uses the permanent ACL Anthology address
% for D19-5626 instead of a temporary preview-build link.
@inproceedings{park-tsvetkov-2019-learning,
  author    = {Park, Chan Young and
               Tsvetkov, Yulia},
  title     = {Learning to Generate Word- and Phrase-Embeddings for Efficient Phrase-Based Neural Machine Translation},
  editor    = {Birch, Alexandra and
               Finch, Andrew and
               Hayashi, Hiroaki and
               Konstas, Ioannis and
               Luong, Thang and
               Neubig, Graham and
               Oda, Yusuke and
               Sudoh, Katsuhito},
  booktitle = {Proceedings of the 3rd Workshop on Neural Generation and Translation},
  month     = nov,
  year      = {2019},
  address   = {Hong Kong},
  publisher = {Association for Computational Linguistics},
  pages     = {241--248},
  doi       = {10.18653/v1/D19-5626},
  url       = {https://aclanthology.org/D19-5626/},
  abstract  = {Neural machine translation (NMT) often fails in one-to-many translation, e.g., in the translation of multi-word expressions, compounds, and collocations. To improve the translation of phrases, phrase-based NMT systems have been proposed; these typically combine word-based NMT with external phrase dictionaries or with phrase tables from phrase-based statistical MT systems. These solutions introduce a significant overhead of additional resources and computational costs. In this paper, we introduce a phrase-based NMT model built upon continuous-output NMT, in which the decoder generates embeddings of words or phrases. The model uses a fertility module, which guides the decoder to generate embeddings of sequences of varying lengths. We show that our model learns to translate phrases better, performing on par with state of the art phrase-based NMT. Since our model does not resort to softmax computation over a huge vocabulary of phrases, its training time is about 112x faster than the baseline.},
}
Markdown (Informal)
[Learning to Generate Word- and Phrase-Embeddings for Efficient Phrase-Based Neural Machine Translation](https://aclanthology.org/D19-5626/) (Park & Tsvetkov, NGT 2019)
ACL