@inproceedings{farahani-johansson-2023-empirical,
title = "An Empirical Study of Multitask Learning to Improve Open Domain Dialogue Systems",
author = "Farahani, Mehrdad and
Johansson, Richard",
editor = {Alum{\"a}e, Tanel and
Fishel, Mark},
booktitle = "Proceedings of the 24th Nordic Conference on Computational Linguistics (NoDaLiDa)",
month = may,
year = "2023",
address = "T{\'o}rshavn, Faroe Islands",
publisher = "University of Tartu Library",
url = "https://preview.aclanthology.org/fix-sig-urls/2023.nodalida-1.36/",
pages = "347--357",
abstract = "Autoregressive models used to generate responses in open-domain dialogue systems often struggle to take long-term context into account and to maintain consistency over a dialogue. Previous research in open-domain dialogue generation has shown that the use of \textit{auxiliary tasks} can introduce inductive biases that encourage the model to improve these qualities. However, most previous research has focused on encoder-only or encoder/decoder models, while the use of auxiliary tasks in \textit{encoder-only} autoregressive models is under-explored. This paper describes an investigation where four different auxiliary tasks are added to small and medium-sized GPT-2 models fine-tuned on the PersonaChat and DailyDialog datasets. The results show that the introduction of the new auxiliary tasks leads to small but consistent improvement in evaluations of the investigated models."
}
Markdown (Informal)
[An Empirical Study of Multitask Learning to Improve Open Domain Dialogue Systems](https://preview.aclanthology.org/fix-sig-urls/2023.nodalida-1.36/) (Farahani & Johansson, NoDaLiDa 2023)
ACL