@inproceedings{he-glass-2020-negative,
title = "Negative Training for Neural Dialogue Response Generation",
author = "He, Tianxing and
Glass, James",
editor = "Jurafsky, Dan and
Chai, Joyce and
Schluter, Natalie and
Tetreault, Joel",
booktitle = "Proceedings of the 58th Annual Meeting of the Association for Computational Linguistics",
month = jul,
year = "2020",
address = "Online",
publisher = "Association for Computational Linguistics",
url = "https://preview.aclanthology.org/fix-sig-urls/2020.acl-main.185/",
doi = "10.18653/v1/2020.acl-main.185",
pages = "2044--2058",
abstract = "Although deep learning models have brought tremendous advancements to the field of open-domain dialogue response generation, recent research results have revealed that the trained models have undesirable generation behaviors, such as malicious responses and generic (boring) responses. In this work, we propose a framework named ``Negative Training'' to minimize such behaviors. Given a trained model, the framework will first find generated samples that exhibit the undesirable behavior, and then use them to feed negative training signals for fine-tuning the model. Our experiments show that negative training can significantly reduce the hit rate of malicious responses, or discourage frequent responses and improve response diversity."
}
Markdown (Informal)
[Negative Training for Neural Dialogue Response Generation](https://preview.aclanthology.org/fix-sig-urls/2020.acl-main.185/) (He & Glass, ACL 2020)
ACL