@inproceedings{wen-etal-2022-empirical,
title = "An Empirical Study on the Overlapping Problem of Open-Domain Dialogue Datasets",
author = "Wen, Yuqiao and
Luo, Guoqing and
Mou, Lili",
editor = "Calzolari, Nicoletta and
B{\'e}chet, Fr{\'e}d{\'e}ric and
Blache, Philippe and
Choukri, Khalid and
Cieri, Christopher and
Declerck, Thierry and
Goggi, Sara and
Isahara, Hitoshi and
Maegaard, Bente and
Mariani, Joseph and
Mazo, H{\'e}l{\`e}ne and
Odijk, Jan and
Piperidis, Stelios",
booktitle = "Proceedings of the Thirteenth Language Resources and Evaluation Conference",
month = jun,
year = "2022",
address = "Marseille, France",
publisher = "European Language Resources Association",
url = "https://preview.aclanthology.org/add-emnlp-2024-awards/2022.lrec-1.16/",
pages = "146--153",
abstract = "Open-domain dialogue systems aim to converse with humans through text, and dialogue research has heavily relied on benchmark datasets. In this work, we observe the overlapping problem in DailyDialog and OpenSubtitles, two popular open-domain dialogue benchmark datasets. Our systematic analysis then shows that such overlapping can be exploited to obtain fake state-of-the-art performance. Finally, we address this issue by cleaning these datasets and setting up a proper data processing procedure for future research."
}
Markdown (Informal)
[An Empirical Study on the Overlapping Problem of Open-Domain Dialogue Datasets](https://preview.aclanthology.org/add-emnlp-2024-awards/2022.lrec-1.16/) (Wen et al., LREC 2022)
ACL