% EMNLP 2018 paper "LemmaTag" (joint POS tagging and lemmatization).
% The month range uses "--" so it typesets as an en dash; whole words are braced
% in the title so styles that apply sentence casing keep their capitalisation.
@inproceedings{kondratyuk-etal-2018-lemmatag,
    title     = {{LemmaTag}: Jointly Tagging and Lemmatizing for Morphologically Rich Languages with {BRNNs}},
    author    = {Kondratyuk, Daniel and
                 Gaven{\v{c}}iak, Tom{\'a}{\v{s}} and
                 Straka, Milan and
                 Haji{\v{c}}, Jan},
    booktitle = {Proceedings of the 2018 Conference on Empirical Methods in Natural Language Processing},
    month     = oct # "--" # nov,
    year      = {2018},
    address   = {Brussels, Belgium},
    publisher = {Association for Computational Linguistics},
    url       = {https://aclanthology.org/D18-1532},
    doi       = {10.18653/v1/D18-1532},
    pages     = {4921--4928},
    abstract  = {We present LemmaTag, a featureless neural network architecture that jointly generates part-of-speech tags and lemmas for sentences by using bidirectional RNNs with character-level and word-level embeddings. We demonstrate that both tasks benefit from sharing the encoding part of the network, predicting tag subcategories, and using the tagger output as an input to the lemmatizer. We evaluate our model across several languages with complex morphology, which surpasses state-of-the-art accuracy in both part-of-speech tagging and lemmatization in Czech, German, and Arabic.},
}
<?xml version="1.0" encoding="UTF-8"?>
<!-- MODS record for the EMNLP 2018 paper "LemmaTag".
     The publication date spans October to November 2018, so it is recorded as a
     start/end pair of W3CDTF year-month values rather than as one free-text string. -->
<modsCollection xmlns="http://www.loc.gov/mods/v3">
  <mods ID="kondratyuk-etal-2018-lemmatag">
    <titleInfo>
      <title>LemmaTag: Jointly Tagging and Lemmatizing for Morphologically Rich Languages with BRNNs</title>
    </titleInfo>
    <!-- Authors, in publication order. -->
    <name type="personal">
      <namePart type="given">Daniel</namePart>
      <namePart type="family">Kondratyuk</namePart>
      <role>
        <roleTerm authority="marcrelator" type="text">author</roleTerm>
      </role>
    </name>
    <name type="personal">
      <namePart type="given">Tomáš</namePart>
      <namePart type="family">Gavenčiak</namePart>
      <role>
        <roleTerm authority="marcrelator" type="text">author</roleTerm>
      </role>
    </name>
    <name type="personal">
      <namePart type="given">Milan</namePart>
      <namePart type="family">Straka</namePart>
      <role>
        <roleTerm authority="marcrelator" type="text">author</roleTerm>
      </role>
    </name>
    <name type="personal">
      <namePart type="given">Jan</namePart>
      <namePart type="family">Hajič</namePart>
      <role>
        <roleTerm authority="marcrelator" type="text">author</roleTerm>
      </role>
    </name>
    <originInfo>
      <dateIssued encoding="w3cdtf" point="start">2018-10</dateIssued>
      <dateIssued encoding="w3cdtf" point="end">2018-11</dateIssued>
    </originInfo>
    <typeOfResource>text</typeOfResource>
    <!-- Host item: the proceedings volume that contains the paper. -->
    <relatedItem type="host">
      <titleInfo>
        <title>Proceedings of the 2018 Conference on Empirical Methods in Natural Language Processing</title>
      </titleInfo>
      <originInfo>
        <publisher>Association for Computational Linguistics</publisher>
        <place>
          <placeTerm type="text">Brussels, Belgium</placeTerm>
        </place>
      </originInfo>
      <genre authority="marcgt">conference publication</genre>
    </relatedItem>
    <abstract>We present LemmaTag, a featureless neural network architecture that jointly generates part-of-speech tags and lemmas for sentences by using bidirectional RNNs with character-level and word-level embeddings. We demonstrate that both tasks benefit from sharing the encoding part of the network, predicting tag subcategories, and using the tagger output as an input to the lemmatizer. We evaluate our model across several languages with complex morphology, which surpasses state-of-the-art accuracy in both part-of-speech tagging and lemmatization in Czech, German, and Arabic.</abstract>
    <identifier type="citekey">kondratyuk-etal-2018-lemmatag</identifier>
    <identifier type="doi">10.18653/v1/D18-1532</identifier>
    <location>
      <url>https://aclanthology.org/D18-1532</url>
    </location>
    <part>
      <date encoding="w3cdtf" point="start">2018-10</date>
      <date encoding="w3cdtf" point="end">2018-11</date>
      <extent unit="page">
        <start>4921</start>
        <end>4928</end>
      </extent>
    </part>
  </mods>
</modsCollection>
%0 Conference Proceedings
%T LemmaTag: Jointly Tagging and Lemmatizing for Morphologically Rich Languages with BRNNs
%A Kondratyuk, Daniel
%A Gavenčiak, Tomáš
%A Straka, Milan
%A Hajič, Jan
%S Proceedings of the 2018 Conference on Empirical Methods in Natural Language Processing
%D 2018
%8 October-November
%I Association for Computational Linguistics
%C Brussels, Belgium
%F kondratyuk-etal-2018-lemmatag
%X We present LemmaTag, a featureless neural network architecture that jointly generates part-of-speech tags and lemmas for sentences by using bidirectional RNNs with character-level and word-level embeddings. We demonstrate that both tasks benefit from sharing the encoding part of the network, predicting tag subcategories, and using the tagger output as an input to the lemmatizer. We evaluate our model across several languages with complex morphology, which surpasses state-of-the-art accuracy in both part-of-speech tagging and lemmatization in Czech, German, and Arabic.
%R 10.18653/v1/D18-1532
%U https://aclanthology.org/D18-1532
%U https://doi.org/10.18653/v1/D18-1532
%P 4921-4928
Markdown (Informal)
[LemmaTag: Jointly Tagging and Lemmatizing for Morphologically Rich Languages with BRNNs](https://aclanthology.org/D18-1532) (Kondratyuk et al., EMNLP 2018)
ACL