% ACL Anthology W19-5365: NTT's system description for the WMT19 robustness shared task.
@inproceedings{murakami-etal-2019-ntts,
    author    = {Murakami, Soichiro and
                 Morishita, Makoto and
                 Hirao, Tsutomu and
                 Nagata, Masaaki},
    title     = {{NTT}{'}s Machine Translation Systems for {WMT}19 Robustness Task},
    booktitle = {Proceedings of the Fourth Conference on Machine Translation (Volume 2: Shared Task Papers, Day 1)},
    month     = aug,
    year      = {2019},
    address   = {Florence, Italy},
    publisher = {Association for Computational Linguistics},
    pages     = {544--551},
    doi       = {10.18653/v1/W19-5365},
    url       = {https://aclanthology.org/W19-5365},
    abstract  = {This paper describes NTT{'}s submission to the WMT19 robustness task. This task mainly focuses on translating noisy text (e.g., posts on Twitter), which presents different difficulties from typical translation tasks such as news. Our submission combined techniques including utilization of a synthetic corpus, domain adaptation, and a placeholder mechanism, which significantly improved over the previous baseline. Experimental results revealed the placeholder mechanism, which temporarily replaces the non-standard tokens including emojis and emoticons with special placeholder tokens during translation, improves translation accuracy even with noisy texts.},
}
<?xml version="1.0" encoding="UTF-8"?>
<!-- MODS v3 bibliographic record; citekey: murakami-etal-2019-ntts. -->
<modsCollection xmlns="http://www.loc.gov/mods/v3">
  <mods ID="murakami-etal-2019-ntts">
    <titleInfo>
      <title>NTT’s Machine Translation Systems for WMT19 Robustness Task</title>
    </titleInfo>
    <!-- Authors: four personal names, each with the marcrelator role "author". -->
    <name type="personal">
      <namePart type="given">Soichiro</namePart>
      <namePart type="family">Murakami</namePart>
      <role>
        <roleTerm authority="marcrelator" type="text">author</roleTerm>
      </role>
    </name>
    <name type="personal">
      <namePart type="given">Makoto</namePart>
      <namePart type="family">Morishita</namePart>
      <role>
        <roleTerm authority="marcrelator" type="text">author</roleTerm>
      </role>
    </name>
    <name type="personal">
      <namePart type="given">Tsutomu</namePart>
      <namePart type="family">Hirao</namePart>
      <role>
        <roleTerm authority="marcrelator" type="text">author</roleTerm>
      </role>
    </name>
    <name type="personal">
      <namePart type="given">Masaaki</namePart>
      <namePart type="family">Nagata</namePart>
      <role>
        <roleTerm authority="marcrelator" type="text">author</roleTerm>
      </role>
    </name>
    <originInfo>
      <dateIssued>2019-aug</dateIssued>
    </originInfo>
    <typeOfResource>text</typeOfResource>
    <!-- Host item: the proceedings volume this paper appears in. -->
    <relatedItem type="host">
      <titleInfo>
        <title>Proceedings of the Fourth Conference on Machine Translation (Volume 2: Shared Task Papers, Day 1)</title>
      </titleInfo>
      <originInfo>
        <publisher>Association for Computational Linguistics</publisher>
        <place>
          <placeTerm type="text">Florence, Italy</placeTerm>
        </place>
      </originInfo>
      <genre authority="marcgt">conference publication</genre>
    </relatedItem>
    <abstract>This paper describes NTT’s submission to the WMT19 robustness task. This task mainly focuses on translating noisy text (e.g., posts on Twitter), which presents different difficulties from typical translation tasks such as news. Our submission combined techniques including utilization of a synthetic corpus, domain adaptation, and a placeholder mechanism, which significantly improved over the previous baseline. Experimental results revealed the placeholder mechanism, which temporarily replaces the non-standard tokens including emojis and emoticons with special placeholder tokens during translation, improves translation accuracy even with noisy texts.</abstract>
    <!-- Identifiers and access location. -->
    <identifier type="citekey">murakami-etal-2019-ntts</identifier>
    <identifier type="doi">10.18653/v1/W19-5365</identifier>
    <location>
      <url>https://aclanthology.org/W19-5365</url>
    </location>
    <!-- Position within the host volume: issue date and page range. -->
    <part>
      <date>2019-aug</date>
      <extent unit="page">
        <start>544</start>
        <end>551</end>
      </extent>
    </part>
  </mods>
</modsCollection>
%0 Conference Proceedings
%T NTT’s Machine Translation Systems for WMT19 Robustness Task
%A Murakami, Soichiro
%A Morishita, Makoto
%A Hirao, Tsutomu
%A Nagata, Masaaki
%S Proceedings of the Fourth Conference on Machine Translation (Volume 2: Shared Task Papers, Day 1)
%D 2019
%8 aug
%I Association for Computational Linguistics
%C Florence, Italy
%F murakami-etal-2019-ntts
%X This paper describes NTT’s submission to the WMT19 robustness task. This task mainly focuses on translating noisy text (e.g., posts on Twitter), which presents different difficulties from typical translation tasks such as news. Our submission combined techniques including utilization of a synthetic corpus, domain adaptation, and a placeholder mechanism, which significantly improved over the previous baseline. Experimental results revealed the placeholder mechanism, which temporarily replaces the non-standard tokens including emojis and emoticons with special placeholder tokens during translation, improves translation accuracy even with noisy texts.
%R 10.18653/v1/W19-5365
%U https://aclanthology.org/W19-5365
%U https://doi.org/10.18653/v1/W19-5365
%P 544-551
Markdown (Informal)
[NTT’s Machine Translation Systems for WMT19 Robustness Task](https://aclanthology.org/W19-5365) (Murakami et al., 2019)
ACL
- Soichiro Murakami, Makoto Morishita, Tsutomu Hirao, and Masaaki Nagata. 2019. NTT’s Machine Translation Systems for WMT19 Robustness Task. In Proceedings of the Fourth Conference on Machine Translation (Volume 2: Shared Task Papers, Day 1), pages 544–551, Florence, Italy. Association for Computational Linguistics.