% Zhang, Naradowsky and Miyao (2023): "Ask an Expert", Findings of ACL 2023, pp. 6665--6694.
% The url field uses the canonical ACL Anthology address (same Anthology ID as the DOI suffix).
@inproceedings{zhang-etal-2023-ask,
  title     = {Ask an Expert: Leveraging Language Models to Improve Strategic Reasoning in Goal-Oriented Dialogue Models},
  author    = {Zhang, Qiang and
               Naradowsky, Jason and
               Miyao, Yusuke},
  editor    = {Rogers, Anna and
               Boyd-Graber, Jordan and
               Okazaki, Naoaki},
  booktitle = {Findings of the Association for Computational Linguistics: {ACL} 2023},
  month     = jul,
  year      = {2023},
  address   = {Toronto, Canada},
  publisher = {Association for Computational Linguistics},
  url       = {https://aclanthology.org/2023.findings-acl.417/},
  doi       = {10.18653/v1/2023.findings-acl.417},
  pages     = {6665--6694},
  abstract  = {Existing dialogue models may encounter scenarios which are not well-represented in the training data, and as a result generate responses that are unnatural, inappropriate, or unhelpful. We propose the {\textquotedblleft}Ask an Expert{\textquotedblright} framework in which the model is trained with access to an {\textquotedblleft}expert{\textquotedblright} which it can consult at each turn. Advice is solicited via a structured dialogue with the expert, and the model is optimized to selectively utilize (or ignore) it given the context and dialogue history. In this work the expert takes the form of an LLM. We evaluate this framework in a mental health support domain, where the structure of the expert conversation is outlined by pre-specified prompts which reflect a reasoning strategy taught to practitioners in the field. Blenderbot models utilizing {\textquotedblleft}Ask an Expert{\textquotedblright} show quality improvements across all expert sizes, including those with fewer parameters than the dialogue model itself. Our best model provides a {\textasciitilde}10{\%} improvement over baselines, approaching human-level scores on {\textquotedblleft}engagingness{\textquotedblright} and {\textquotedblleft}helpfulness{\textquotedblright} metrics.},
}
Markdown (Informal)
[Ask an Expert: Leveraging Language Models to Improve Strategic Reasoning in Goal-Oriented Dialogue Models](https://aclanthology.org/2023.findings-acl.417/) (Zhang et al., Findings 2023)
ACL