@inproceedings{sorokin-2020-getting,
title = "Getting More Data for Low-resource Morphological Inflection: Language Models and Data Augmentation",
author = "Sorokin, Alexey",
booktitle = "Proceedings of the 12th Language Resources and Evaluation Conference",
month = may,
year = "2020",
address = "Marseille, France",
publisher = "European Language Resources Association",
url = "https://aclanthology.org/2020.lrec-1.490",
pages = "3978--3983",
abstract = "We investigate how to improve quality of low-resource morphological inflection without annotating more data. We examine two methods, language models and data augmentation. We show that the model whose decoder additionally uses the states of the language model improves the model quality by 1.5{\%} in combination with both baselines. We also demonstrate that the augmentation of data improves performance by 9{\%} on average when adding 1000 artificially generated word forms to the dataset.",
language = "English",
ISBN = "979-10-95546-34-4",
}
<?xml version="1.0" encoding="UTF-8"?>
<modsCollection xmlns="http://www.loc.gov/mods/v3">
<mods ID="sorokin-2020-getting">
<titleInfo>
<title>Getting More Data for Low-resource Morphological Inflection: Language Models and Data Augmentation</title>
</titleInfo>
<name type="personal">
<namePart type="given">Alexey</namePart>
<namePart type="family">Sorokin</namePart>
<role>
<roleTerm authority="marcrelator" type="text">author</roleTerm>
</role>
</name>
<originInfo>
<dateIssued>2020-may</dateIssued>
</originInfo>
<typeOfResource>text</typeOfResource>
<language>
<languageTerm type="text">English</languageTerm>
<languageTerm type="code" authority="iso639-2b">eng</languageTerm>
</language>
<relatedItem type="host">
<titleInfo>
<title>Proceedings of the 12th Language Resources and Evaluation Conference</title>
</titleInfo>
<originInfo>
<publisher>European Language Resources Association</publisher>
<place>
<placeTerm type="text">Marseille, France</placeTerm>
</place>
</originInfo>
<genre authority="marcgt">conference publication</genre>
<identifier type="isbn">979-10-95546-34-4</identifier>
</relatedItem>
<abstract>We investigate how to improve quality of low-resource morphological inflection without annotating more data. We examine two methods, language models and data augmentation. We show that the model whose decoder additionally uses the states of the language model improves the model quality by 1.5% in combination with both baselines. We also demonstrate that the augmentation of data improves performance by 9% on average when adding 1000 artificially generated word forms to the dataset.</abstract>
<identifier type="citekey">sorokin-2020-getting</identifier>
<location>
<url>https://aclanthology.org/2020.lrec-1.490</url>
</location>
<part>
<date>2020-may</date>
<extent unit="page">
<start>3978</start>
<end>3983</end>
</extent>
</part>
</mods>
</modsCollection>
%0 Conference Proceedings
%T Getting More Data for Low-resource Morphological Inflection: Language Models and Data Augmentation
%A Sorokin, Alexey
%S Proceedings of the 12th Language Resources and Evaluation Conference
%D 2020
%8 may
%I European Language Resources Association
%C Marseille, France
%@ 979-10-95546-34-4
%G English
%F sorokin-2020-getting
%X We investigate how to improve quality of low-resource morphological inflection without annotating more data. We examine two methods, language models and data augmentation. We show that the model whose decoder additionally uses the states of the language model improves the model quality by 1.5% in combination with both baselines. We also demonstrate that the augmentation of data improves performance by 9% on average when adding 1000 artificially generated word forms to the dataset.
%U https://aclanthology.org/2020.lrec-1.490
%P 3978-3983
Markdown (Informal)
[Getting More Data for Low-resource Morphological Inflection: Language Models and Data Augmentation](https://aclanthology.org/2020.lrec-1.490) (Sorokin, LREC 2020)
ACL