% Kalpakchi and Boye, NoDaLiDa 2023: conference paper on Quasi, a synthetic
% dataset of Swedish multiple-choice questions generated with GPT-3.
% The url field holds the canonical ACL Anthology address for paper 2023.nodalida-1.48.
% Braced words in the title keep their capitalisation under sentence-casing styles.
@inproceedings{kalpakchi-boye-2023-quasi,
  title     = {{Quasi}: a synthetic Question-Answering dataset in {Swedish} using {GPT-3} and zero-shot learning},
  author    = {Kalpakchi, Dmytro and
               Boye, Johan},
  editor    = {Alum{\"a}e, Tanel and
               Fishel, Mark},
  booktitle = {Proceedings of the 24th Nordic Conference on Computational Linguistics (NoDaLiDa)},
  month     = may,
  year      = {2023},
  address   = {T{\'o}rshavn, Faroe Islands},
  publisher = {University of Tartu Library},
  url       = {https://aclanthology.org/2023.nodalida-1.48/},
  pages     = {477--491},
  abstract  = {This paper describes the creation and evaluation of a synthetic dataset of Swedish multiple-choice questions (MCQs) for reading comprehension using GPT-3. Although GPT-3 is trained mostly on English data, with only 0.11{\%} of Swedish texts in its training material, the model still managed to generate MCQs in Swedish. About 44{\%} of the generated MCQs turned out to be of sufficient quality, i.e. they were grammatically correct and relevant, with exactly one answer alternative being correct and the others being plausible but wrong. We provide a detailed analysis of the errors and shortcomings of the rejected MCQs, as well an analysis of the level of difficulty of the accepted MCQs. In addition to giving insights into GPT-3, the synthetic dataset could be used for training and evaluation of special-purpose MCQ-generating models.},
}
Markdown (Informal)
[Quasi: a synthetic Question-Answering dataset in Swedish using GPT-3 and zero-shot learning](https://aclanthology.org/2023.nodalida-1.48/) (Kalpakchi & Boye, NoDaLiDa 2023)
ACL