% Holmer and Rennes (2023): conference paper in the NoDaLiDa 2023 proceedings,
% ACL Anthology ID 2023.nodalida-1.13 (taken from the record's URL path).
% The url field uses the canonical aclanthology.org address rather than a
% temporary preview-branch link, which is not a stable citation target.
@inproceedings{holmer-rennes-2023-constructing,
  title     = {Constructing Pseudo-parallel {Swedish} Sentence Corpora for Automatic Text Simplification},
  author    = {Holmer, Daniel and Rennes, Evelina},
  editor    = {Alum{\"a}e, Tanel and Fishel, Mark},
  booktitle = {Proceedings of the 24th Nordic Conference on Computational Linguistics (NoDaLiDa)},
  month     = may,
  year      = {2023},
  address   = {T{\'o}rshavn, Faroe Islands},
  publisher = {University of Tartu Library},
  url       = {https://aclanthology.org/2023.nodalida-1.13/},
  pages     = {113--123},
  abstract  = {Automatic text simplification (ATS) describes the automatic transformation of a text from a complex form to a less complex form. Many modern ATS techniques need large parallel corpora of standard and simplified text, but such data does not exist for many languages. One way to overcome this issue is to create pseudo-parallel corpora by dividing existing corpora into standard and simple parts. In this work, we explore the creation of Swedish pseudo-parallel monolingual corpora by the application of different feature representation methods, sentence alignment algorithms, and indexing approaches, on a large monolingual corpus. The different corpora are used to fine-tune a sentence simplification system based on BART, which is evaluated with standard evaluation metrics for automatic text simplification.},
}
Markdown (Informal)
[Constructing Pseudo-parallel Swedish Sentence Corpora for Automatic Text Simplification](https://aclanthology.org/2023.nodalida-1.13/) (Holmer & Rennes, NoDaLiDa 2023)
ACL