% Hasan, Rugina, and Wang (2024): paper in the Proceedings of the 7th
% BlackboxNLP Workshop, pages 417--430.
% The url field uses the canonical ACL Anthology address (not a temporary
% preview build); its paper ID matches the suffix of the doi field.
@inproceedings{hasan-etal-2024-pruning,
  title     = {Pruning for Protection: Increasing Jailbreak Resistance in Aligned {LLMs} Without Fine-Tuning},
  author    = {Hasan, Adib and Rugina, Ileana and Wang, Alex},
  editor    = {Belinkov, Yonatan and Kim, Najoung and Jumelet, Jaap and Mohebbi, Hosein and Mueller, Aaron and Chen, Hanjie},
  booktitle = {Proceedings of the 7th {BlackboxNLP} Workshop: Analyzing and Interpreting Neural Networks for {NLP}},
  month     = nov,
  year      = {2024},
  address   = {Miami, Florida, US},
  publisher = {Association for Computational Linguistics},
  url       = {https://aclanthology.org/2024.blackboxnlp-1.26/},
  doi       = {10.18653/v1/2024.blackboxnlp-1.26},
  pages     = {417--430},
}