@inproceedings{sinha-etal-2024-survival,
title = "Survival of the Safest: Towards Secure Prompt Optimization through Interleaved Multi-Objective Evolution",
author = "Sinha, Ankita and
Cui, Wendi and
Das, Kamalika and
Zhang, Jiaxin",
editor = "Dernoncourt, Franck and
Preo{\c{t}}iuc-Pietro, Daniel and
Shimorina, Anastasia",
booktitle = "Proceedings of the 2024 Conference on Empirical Methods in Natural Language Processing: Industry Track",
month = nov,
year = "2024",
address = "Miami, Florida, US",
publisher = "Association for Computational Linguistics",
url = "https://preview.aclanthology.org/fix-sig-urls/2024.emnlp-industry.76/",
doi = "10.18653/v1/2024.emnlp-industry.76",
pages = "1016--1027",
abstract = "Large language models (LLMs) have demonstrated remarkable capabilities; however, the optimization of their prompts has historically prioritized performance metrics at the expense of crucial safety and security considerations. To overcome this shortcoming, we introduce ``Survival of the Safest'' (), an innovative multi-objective prompt optimization framework that enhances both performance and security in LLMs simultaneously. utilizes an interleaved multi-objective evolution strategy, integrating semantic, feedback, and crossover mutations to effectively traverse the prompt landscape. Differing from the computationally demanding Pareto front methods, provides a scalable solution that expedites optimization in complex, high-dimensional discrete search spaces while keeping computational demands low. Our approach accommodates flexible weighting of objectives and generates a pool of optimized candidates, empowering users to select prompts that optimally meet their specific performance and security needs. Experimental evaluations across diverse benchmark datasets affirm `s efficacy in delivering high performance and notably enhancing safety and security compared to single-objective methods. This advancement marks a significant stride towards the deployment of LLM systems that are both high-performing and secure across varied industrial applications"
}
Markdown (Informal)
[Survival of the Safest: Towards Secure Prompt Optimization through Interleaved Multi-Objective Evolution](https://preview.aclanthology.org/fix-sig-urls/2024.emnlp-industry.76/) (Sinha et al., EMNLP 2024)
ACL