% Wichers, Denison, Beirami: "Gradient-Based Language Model Red Teaming",
% EACL 2024 long papers, ACL Anthology ID 2024.eacl-long.175.
% The url field uses the canonical aclanthology.org host; the earlier value
% pointed at a preview.aclanthology.org branch build ("fix-sig-urls").
% The address field holds the conference location as given in the original record.
@inproceedings{wichers-etal-2024-gradient,
  author    = {Wichers, Nevan and Denison, Carson and Beirami, Ahmad},
  title     = {Gradient-Based Language Model Red Teaming},
  editor    = {Graham, Yvette and Purver, Matthew},
  booktitle = {Proceedings of the 18th Conference of the European Chapter of the Association for Computational Linguistics (Volume 1: Long Papers)},
  publisher = {Association for Computational Linguistics},
  address   = {St. Julian{'}s, Malta},
  month     = mar,
  year      = {2024},
  pages     = {2862--2881},
  url       = {https://aclanthology.org/2024.eacl-long.175/},
}