@inproceedings{currey-etal-2020-distilling,
title = "Distilling Multiple Domains for Neural Machine Translation",
author = "Currey, Anna and
Mathur, Prashant and
Dinu, Georgiana",
editor = "Webber, Bonnie and
Cohn, Trevor and
He, Yulan and
Liu, Yang",
booktitle = "Proceedings of the 2020 Conference on Empirical Methods in Natural Language Processing (EMNLP)",
month = nov,
year = "2020",
address = "Online",
publisher = "Association for Computational Linguistics",
url = "https://preview.aclanthology.org/jlcl-multiple-ingestion/2020.emnlp-main.364/",
doi = "10.18653/v1/2020.emnlp-main.364",
pages = "4500--4511",
abstract = "Neural machine translation achieves impressive results in high-resource conditions, but performance often suffers when the input domain is low-resource. The standard practice of adapting a separate model for each domain of interest does not scale well in practice from both a quality perspective (brittleness under domain shift) as well as a cost perspective (added maintenance and inference complexity). In this paper, we propose a framework for training a single multi-domain neural machine translation model that is able to translate several domains without increasing inference time or memory usage. We show that this model can improve translation on both high- and low-resource domains over strong multi-domain baselines. In addition, our proposed model is effective when domain labels are unknown during training, as well as robust under noisy data conditions."
}
Markdown (Informal)
[Distilling Multiple Domains for Neural Machine Translation](https://preview.aclanthology.org/jlcl-multiple-ingestion/2020.emnlp-main.364/) (Currey et al., EMNLP 2020)
ACL