@inproceedings{singh-2012-addressing,
title = "Addressing some Issues of Data Sparsity towards Improving {E}nglish-{M}anipuri {SMT} using Morphological Information",
author = "Singh, Thoudam Doren",
booktitle = "Workshop on Monolingual Machine Translation",
month = oct # " 28-" # nov # " 1",
year = "2012",
address = "San Diego, California, USA",
publisher = "Association for Machine Translation in the Americas",
url = "https://aclanthology.org/2012.amta-monomt.6",
abstract = "The performance of an SMT system heavily depends on the availability of large parallel corpora. Unavailability of these resources in the required amount for many language pair is a challenging issue. The required size of the resource involving morphologically rich and highly agglutinative language is essentially much more for the SMT systems. This paper investigates on some of the issues on enriching the resource for this kind of languages. Handling of inflectional and derivational morphemes of the morphologically rich target language plays important role in the enrichment process. Mapping from the source to the target side is carried out for the English-Manipuri SMT task using factored model. The SMT system developed shows improvement in the performance both in terms of the automatic scoring and subjective evaluation over the baseline system.",
}
<?xml version="1.0" encoding="UTF-8"?>
<modsCollection xmlns="http://www.loc.gov/mods/v3">
<mods ID="singh-2012-addressing">
<titleInfo>
<title>Addressing some Issues of Data Sparsity towards Improving English-Manipuri SMT using Morphological Information</title>
</titleInfo>
<name type="personal">
<namePart type="given">Thoudam</namePart>
<namePart type="given">Doren</namePart>
<namePart type="family">Singh</namePart>
<role>
<roleTerm authority="marcrelator" type="text">author</roleTerm>
</role>
</name>
<originInfo>
<dateIssued>2012-10-28/2012-11-01</dateIssued>
</originInfo>
<typeOfResource>text</typeOfResource>
<relatedItem type="host">
<titleInfo>
<title>Workshop on Monolingual Machine Translation</title>
</titleInfo>
<originInfo>
<publisher>Association for Machine Translation in the Americas</publisher>
<place>
<placeTerm type="text">San Diego, California, USA</placeTerm>
</place>
</originInfo>
<genre authority="marcgt">conference publication</genre>
</relatedItem>
<abstract>The performance of an SMT system heavily depends on the availability of large parallel corpora. Unavailability of these resources in the required amount for many language pair is a challenging issue. The required size of the resource involving morphologically rich and highly agglutinative language is essentially much more for the SMT systems. This paper investigates on some of the issues on enriching the resource for this kind of languages. Handling of inflectional and derivational morphemes of the morphologically rich target language plays important role in the enrichment process. Mapping from the source to the target side is carried out for the English-Manipuri SMT task using factored model. The SMT system developed shows improvement in the performance both in terms of the automatic scoring and subjective evaluation over the baseline system.</abstract>
<identifier type="citekey">singh-2012-addressing</identifier>
<location>
<url>https://aclanthology.org/2012.amta-monomt.6</url>
</location>
<part>
<date>2012-10-28/2012-11-01</date>
</part>
</mods>
</modsCollection>
%0 Conference Proceedings
%T Addressing some Issues of Data Sparsity towards Improving English-Manipuri SMT using Morphological Information
%A Singh, Thoudam Doren
%S Workshop on Monolingual Machine Translation
%D 2012
%8 October 28-November 1
%I Association for Machine Translation in the Americas
%C San Diego, California, USA
%F singh-2012-addressing
%X The performance of an SMT system heavily depends on the availability of large parallel corpora. Unavailability of these resources in the required amount for many language pair is a challenging issue. The required size of the resource involving morphologically rich and highly agglutinative language is essentially much more for the SMT systems. This paper investigates on some of the issues on enriching the resource for this kind of languages. Handling of inflectional and derivational morphemes of the morphologically rich target language plays important role in the enrichment process. Mapping from the source to the target side is carried out for the English-Manipuri SMT task using factored model. The SMT system developed shows improvement in the performance both in terms of the automatic scoring and subjective evaluation over the baseline system.
%U https://aclanthology.org/2012.amta-monomt.6
Markdown (Informal)
[Addressing some Issues of Data Sparsity towards Improving English-Manipuri SMT using Morphological Information](https://aclanthology.org/2012.amta-monomt.6) (Singh, AMTA 2012)
ACL