@inproceedings{khosla-gangadharaiah-2022-benchmarking,
title = "Benchmarking the Covariate Shift Robustness of Open-world Intent Classification Approaches",
author = "Khosla, Sopan and
Gangadharaiah, Rashmi",
editor = "He, Yulan and
Ji, Heng and
Li, Sujian and
Liu, Yang and
Chang, Chua-Hui",
booktitle = "Proceedings of the 2nd Conference of the Asia-Pacific Chapter of the Association for Computational Linguistics and the 12th International Joint Conference on Natural Language Processing (Volume 2: Short Papers)",
month = nov,
year = "2022",
address = "Online only",
publisher = "Association for Computational Linguistics",
url = "https://preview.aclanthology.org/fix-sig-urls/2022.aacl-short.3/",
doi = "10.18653/v1/2022.aacl-short.3",
pages = "14--23",
abstract = "Task-oriented dialog systems deployed in real-world applications are often challenged by out-of-distribution queries. These systems should not only reliably detect utterances with unsupported intents (\textit{semantic shift}), but also generalize to \textit{covariate shift} (supported intents from unseen distributions). However, none of the existing benchmarks for open-world intent classification focus on the second aspect, thus only performing a partial evaluation of intent detection techniques. In this work, we propose two new datasets ( and ) that include utterances useful for evaluating the robustness of open-world models to covariate shift. Along with the i.i.d. test set, both datasets contain a new cov-test set that, along with out-of-scope utterances, contains in-scope utterances sampled from different distributions not seen during training. This setting better mimics the challenges faced in real-world applications. Evaluating several open-world classifiers on the new datasets reveals that models that perform well on the test set struggle to generalize to the cov-test. Our datasets fill an important gap in the field, offering a more realistic evaluation scenario for intent classification in task-oriented dialog systems."
}
Markdown (Informal)
[Benchmarking the Covariate Shift Robustness of Open-world Intent Classification Approaches](https://preview.aclanthology.org/fix-sig-urls/2022.aacl-short.3/) (Khosla & Gangadharaiah, AACL-IJCNLP 2022)
ACL