@inproceedings{yadav-shrivastava-2020-a3,
title = "A3-108 Machine Translation System for Similar Language Translation Shared Task 2020",
author = "Yadav, Saumitra and
Shrivastava, Manish",
booktitle = "Proceedings of the Fifth Conference on Machine Translation",
month = nov,
year = "2020",
address = "Online",
publisher = "Association for Computational Linguistics",
url = "https://aclanthology.org/2020.wmt-1.55",
pages = "451--455",
abstract = "In this paper, we describe our submissions for Similar Language Translation Shared Task 2020. We built 12 systems in each direction for Hindi⇐⇒Marathi language pair. This paper outlines initial baseline experiments with various tokenization schemes to train statistical models. Using optimal tokenization scheme among these we created synthetic source side text with back translation. And prune synthetic text with language model scores. This synthetic data was then used along with training data in various settings to build translation models. We also report configuration of the submitted systems and results produced by them.",
}
<?xml version="1.0" encoding="UTF-8"?>
<modsCollection xmlns="http://www.loc.gov/mods/v3">
<mods ID="yadav-shrivastava-2020-a3">
<titleInfo>
<title>A3-108 Machine Translation System for Similar Language Translation Shared Task 2020</title>
</titleInfo>
<name type="personal">
<namePart type="given">Saumitra</namePart>
<namePart type="family">Yadav</namePart>
<role>
<roleTerm authority="marcrelator" type="text">author</roleTerm>
</role>
</name>
<name type="personal">
<namePart type="given">Manish</namePart>
<namePart type="family">Shrivastava</namePart>
<role>
<roleTerm authority="marcrelator" type="text">author</roleTerm>
</role>
</name>
<originInfo>
<dateIssued>2020-nov</dateIssued>
</originInfo>
<typeOfResource>text</typeOfResource>
<relatedItem type="host">
<titleInfo>
<title>Proceedings of the Fifth Conference on Machine Translation</title>
</titleInfo>
<originInfo>
<publisher>Association for Computational Linguistics</publisher>
<place>
<placeTerm type="text">Online</placeTerm>
</place>
</originInfo>
<genre authority="marcgt">conference publication</genre>
</relatedItem>
<abstract>In this paper, we describe our submissions for Similar Language Translation Shared Task 2020. We built 12 systems in each direction for Hindi⇐⇒Marathi language pair. This paper outlines initial baseline experiments with various tokenization schemes to train statistical models. Using optimal tokenization scheme among these we created synthetic source side text with back translation. And prune synthetic text with language model scores. This synthetic data was then used along with training data in various settings to build translation models. We also report configuration of the submitted systems and results produced by them.</abstract>
<identifier type="citekey">yadav-shrivastava-2020-a3</identifier>
<location>
<url>https://aclanthology.org/2020.wmt-1.55</url>
</location>
<part>
<date>2020-nov</date>
<extent unit="page">
<start>451</start>
<end>455</end>
</extent>
</part>
</mods>
</modsCollection>
%0 Conference Proceedings
%T A3-108 Machine Translation System for Similar Language Translation Shared Task 2020
%A Yadav, Saumitra
%A Shrivastava, Manish
%S Proceedings of the Fifth Conference on Machine Translation
%D 2020
%8 nov
%I Association for Computational Linguistics
%C Online
%F yadav-shrivastava-2020-a3
%X In this paper, we describe our submissions for Similar Language Translation Shared Task 2020. We built 12 systems in each direction for Hindi⇐⇒Marathi language pair. This paper outlines initial baseline experiments with various tokenization schemes to train statistical models. Using optimal tokenization scheme among these we created synthetic source side text with back translation. And prune synthetic text with language model scores. This synthetic data was then used along with training data in various settings to build translation models. We also report configuration of the submitted systems and results produced by them.
%U https://aclanthology.org/2020.wmt-1.55
%P 451-455
Markdown (Informal)
[A3-108 Machine Translation System for Similar Language Translation Shared Task 2020](https://aclanthology.org/2020.wmt-1.55) (Yadav & Shrivastava, WMT 2020)
ACL