@inproceedings{del-etal-2018-phrase,
title = "Phrase-based Unsupervised Machine Translation with Compositional Phrase Embeddings",
author = {Del, Maksym and
T{\"a}ttar, Andre and
Fishel, Mark},
booktitle = "Proceedings of the Third Conference on Machine Translation: Shared Task Papers",
month = oct,
year = "2018",
address = "Belgium, Brussels",
publisher = "Association for Computational Linguistics",
url = "https://aclanthology.org/W18-6407",
doi = "10.18653/v1/W18-6407",
pages = "361--367",
abstract = "This paper describes the University of Tartu{'}s submission to the unsupervised machine translation track of WMT18 news translation shared task. We build several baseline translation systems for both directions of the English-Estonian language pair using monolingual data only; the systems belong to the phrase-based unsupervised machine translation paradigm where we experimented with phrase lengths of up to 3. As a main contribution, we performed a set of standalone experiments with compositional phrase embeddings as a substitute for phrases as individual vocabulary entries. Results show that reasonable n-gram vectors can be obtained by simply summing up individual word vectors which retains or improves the performance of phrase-based unsupervised machine translation systems while avoiding limitations of atomic phrase vectors.",
}
<?xml version="1.0" encoding="UTF-8"?>
<modsCollection xmlns="http://www.loc.gov/mods/v3">
<mods ID="del-etal-2018-phrase">
<titleInfo>
<title>Phrase-based Unsupervised Machine Translation with Compositional Phrase Embeddings</title>
</titleInfo>
<name type="personal">
<namePart type="given">Maksym</namePart>
<namePart type="family">Del</namePart>
<role>
<roleTerm authority="marcrelator" type="text">author</roleTerm>
</role>
</name>
<name type="personal">
<namePart type="given">Andre</namePart>
<namePart type="family">Tättar</namePart>
<role>
<roleTerm authority="marcrelator" type="text">author</roleTerm>
</role>
</name>
<name type="personal">
<namePart type="given">Mark</namePart>
<namePart type="family">Fishel</namePart>
<role>
<roleTerm authority="marcrelator" type="text">author</roleTerm>
</role>
</name>
<originInfo>
<dateIssued>2018-oct</dateIssued>
</originInfo>
<typeOfResource>text</typeOfResource>
<relatedItem type="host">
<titleInfo>
<title>Proceedings of the Third Conference on Machine Translation: Shared Task Papers</title>
</titleInfo>
<originInfo>
<publisher>Association for Computational Linguistics</publisher>
<place>
<placeTerm type="text">Belgium, Brussels</placeTerm>
</place>
</originInfo>
<genre authority="marcgt">conference publication</genre>
</relatedItem>
<abstract>This paper describes the University of Tartu’s submission to the unsupervised machine translation track of WMT18 news translation shared task. We build several baseline translation systems for both directions of the English-Estonian language pair using monolingual data only; the systems belong to the phrase-based unsupervised machine translation paradigm where we experimented with phrase lengths of up to 3. As a main contribution, we performed a set of standalone experiments with compositional phrase embeddings as a substitute for phrases as individual vocabulary entries. Results show that reasonable n-gram vectors can be obtained by simply summing up individual word vectors which retains or improves the performance of phrase-based unsupervised machine translation systems while avoiding limitations of atomic phrase vectors.</abstract>
<identifier type="citekey">del-etal-2018-phrase</identifier>
<identifier type="doi">10.18653/v1/W18-6407</identifier>
<location>
<url>https://aclanthology.org/W18-6407</url>
</location>
<part>
<date>2018-oct</date>
<extent unit="page">
<start>361</start>
<end>367</end>
</extent>
</part>
</mods>
</modsCollection>
%0 Conference Proceedings
%T Phrase-based Unsupervised Machine Translation with Compositional Phrase Embeddings
%A Del, Maksym
%A Tättar, Andre
%A Fishel, Mark
%S Proceedings of the Third Conference on Machine Translation: Shared Task Papers
%D 2018
%8 oct
%I Association for Computational Linguistics
%C Belgium, Brussels
%F del-etal-2018-phrase
%X This paper describes the University of Tartu’s submission to the unsupervised machine translation track of WMT18 news translation shared task. We build several baseline translation systems for both directions of the English-Estonian language pair using monolingual data only; the systems belong to the phrase-based unsupervised machine translation paradigm where we experimented with phrase lengths of up to 3. As a main contribution, we performed a set of standalone experiments with compositional phrase embeddings as a substitute for phrases as individual vocabulary entries. Results show that reasonable n-gram vectors can be obtained by simply summing up individual word vectors which retains or improves the performance of phrase-based unsupervised machine translation systems while avoiding limitations of atomic phrase vectors.
%R 10.18653/v1/W18-6407
%U https://aclanthology.org/W18-6407
%U https://doi.org/10.18653/v1/W18-6407
%P 361-367
Markdown (Informal)
[Phrase-based Unsupervised Machine Translation with Compositional Phrase Embeddings](https://aclanthology.org/W18-6407) (Del et al., 2018)
ACL