% KNN-Instruct (Kou et al.), EMNLP 2024 main conference paper, ACL Anthology ID 2024.emnlp-main.577.
% The url field uses the canonical Anthology permalink; braces in the title protect the method name from style recasing.
@inproceedings{kou-etal-2024-knn,
    title     = {{KNN-Instruct}: Automatic Instruction Construction with {K} Nearest Neighbor Deduction},
    author    = {Kou, Jianshang and
                 Xu, Benfeng and
                 Zhu, Chiwei and
                 Mao, Zhendong},
    editor    = {Al-Onaizan, Yaser and
                 Bansal, Mohit and
                 Chen, Yun-Nung},
    booktitle = {Proceedings of the 2024 Conference on Empirical Methods in Natural Language Processing},
    month     = nov,
    year      = {2024},
    address   = {Miami, Florida, USA},
    publisher = {Association for Computational Linguistics},
    url       = {https://aclanthology.org/2024.emnlp-main.577/},
    doi       = {10.18653/v1/2024.emnlp-main.577},
    pages     = {10337--10350},
    abstract  = {Supervised fine-tuning (SFT) is a critical procedure for aligning large language models. Despite its efficiency, the construction of SFT data often struggles with issues of quality, diversity, and scalability. Many existing methods, inspired by the Self-Instruct framework, typically generate synthetic instructions by prompting aligned proprietary models like ChatGPT. However, such process suffers from stale distribution, resulting in instructions that are merely trivial variations of existing ones. In this paper, we introduce a novel bootstrapping approach termed KNN-Instruct, which incorporates KNN deduction to produce meaningful new instructions by effectively summarizing and learning from similar existing ones. We conduct an economical controlled experiment to preliminarily validate its effectiveness. In the further experiment, we construct a high-quality SFT dataset named KNN-Inst-12k*. Applying the dataset to Qwen-2-7B, we get a MT-Bench score of 7.64, which outperforms all 7B models on the LMSYS leaderboard, including Starling-LM-7B (7.48), OpenChat-3.5 (7.06) and Zephyr-7B-beta (6.53). Our code and data are available at https://github.com/CrossmodalGroup/KNN-Instruct/.},
}
Markdown (Informal)
[KNN-Instruct: Automatic Instruction Construction with K Nearest Neighbor Deduction](https://aclanthology.org/2024.emnlp-main.577/) (Kou et al., EMNLP 2024)
ACL