@inproceedings{anees-etal-2020-developing,
title = "Developing a Monolingual Sentence Simplification Corpus for {U}rdu",
author = "Anees, Yusra and
Abdul Rauf, Sadaf and
Iqbal, Nauman and
Siddiqi, Abdul Basit",
booktitle = "Proceedings of the Fourth Widening Natural Language Processing Workshop",
month = jul,
year = "2020",
address = "Seattle, USA",
publisher = "Association for Computational Linguistics",
url = "https://aclanthology.org/2020.winlp-1.23",
doi = "10.18653/v1/2020.winlp-1.23",
pages = "92--95",
abstract = "Complex sentences are a hurdle in the learning process of language learners. Sentence simplification aims to convert a complex sentence into its simpler form such that it is easily comprehensible. To build such automated simplification systems, corpora of complex sentences and their simplified versions is the first step to understand sentence complexity and enable the development of automatic text simplification systems. No such corpus has yet been developed for Urdu and we fill this gap by developing one such corpus to help start readability and automatic sentence simplification research. We present a lexical and syntactically simplified Urdu simplification corpus and a detailed analysis of the various simplification operations. We further analyze our corpora using text readability measures and present a comparison of the original, lexical simplified, and syntactically simplified corpora.",
}
<?xml version="1.0" encoding="UTF-8"?>
<modsCollection xmlns="http://www.loc.gov/mods/v3">
<mods ID="anees-etal-2020-developing">
<titleInfo>
<title>Developing a Monolingual Sentence Simplification Corpus for Urdu</title>
</titleInfo>
<name type="personal">
<namePart type="given">Yusra</namePart>
<namePart type="family">Anees</namePart>
<role>
<roleTerm authority="marcrelator" type="text">author</roleTerm>
</role>
</name>
<name type="personal">
<namePart type="given">Sadaf</namePart>
<namePart type="family">Abdul Rauf</namePart>
<role>
<roleTerm authority="marcrelator" type="text">author</roleTerm>
</role>
</name>
<name type="personal">
<namePart type="given">Nauman</namePart>
<namePart type="family">Iqbal</namePart>
<role>
<roleTerm authority="marcrelator" type="text">author</roleTerm>
</role>
</name>
<name type="personal">
<namePart type="given">Abdul</namePart>
<namePart type="given">Basit</namePart>
<namePart type="family">Siddiqi</namePart>
<role>
<roleTerm authority="marcrelator" type="text">author</roleTerm>
</role>
</name>
<originInfo>
<dateIssued>2020-jul</dateIssued>
</originInfo>
<typeOfResource>text</typeOfResource>
<relatedItem type="host">
<titleInfo>
<title>Proceedings of the Fourth Widening Natural Language Processing Workshop</title>
</titleInfo>
<originInfo>
<publisher>Association for Computational Linguistics</publisher>
<place>
<placeTerm type="text">Seattle, USA</placeTerm>
</place>
</originInfo>
<genre authority="marcgt">conference publication</genre>
</relatedItem>
<abstract>Complex sentences are a hurdle in the learning process of language learners. Sentence simplification aims to convert a complex sentence into its simpler form such that it is easily comprehensible. To build such automated simplification systems, corpora of complex sentences and their simplified versions is the first step to understand sentence complexity and enable the development of automatic text simplification systems. No such corpus has yet been developed for Urdu and we fill this gap by developing one such corpus to help start readability and automatic sentence simplification research. We present a lexical and syntactically simplified Urdu simplification corpus and a detailed analysis of the various simplification operations. We further analyze our corpora using text readability measures and present a comparison of the original, lexical simplified, and syntactically simplified corpora.</abstract>
<identifier type="citekey">anees-etal-2020-developing</identifier>
<identifier type="doi">10.18653/v1/2020.winlp-1.23</identifier>
<location>
<url>https://aclanthology.org/2020.winlp-1.23</url>
</location>
<part>
<date>2020-jul</date>
<extent unit="page">
<start>92</start>
<end>95</end>
</extent>
</part>
</mods>
</modsCollection>
%0 Conference Proceedings
%T Developing a Monolingual Sentence Simplification Corpus for Urdu
%A Anees, Yusra
%A Abdul Rauf, Sadaf
%A Iqbal, Nauman
%A Siddiqi, Abdul Basit
%S Proceedings of the Fourth Widening Natural Language Processing Workshop
%D 2020
%8 jul
%I Association for Computational Linguistics
%C Seattle, USA
%F anees-etal-2020-developing
%X Complex sentences are a hurdle in the learning process of language learners. Sentence simplification aims to convert a complex sentence into its simpler form such that it is easily comprehensible. To build such automated simplification systems, corpora of complex sentences and their simplified versions is the first step to understand sentence complexity and enable the development of automatic text simplification systems. No such corpus has yet been developed for Urdu and we fill this gap by developing one such corpus to help start readability and automatic sentence simplification research. We present a lexical and syntactically simplified Urdu simplification corpus and a detailed analysis of the various simplification operations. We further analyze our corpora using text readability measures and present a comparison of the original, lexical simplified, and syntactically simplified corpora.
%R 10.18653/v1/2020.winlp-1.23
%U https://aclanthology.org/2020.winlp-1.23
%U https://doi.org/10.18653/v1/2020.winlp-1.23
%P 92-95
Markdown (Informal)
[Developing a Monolingual Sentence Simplification Corpus for Urdu](https://aclanthology.org/2020.winlp-1.23) (Anees et al., WiNLP 2020)
ACL