% Workshop paper from the TrustNLP 2026 proceedings (ACL Anthology record
% 2026.trustnlp-main.51). Field values follow the Anthology export: address
% carries the location string from that record, and month uses the bare
% three-letter macro so the bibliography style can localise it.
% NOTE(review): editor surname is given as Galstyan (the exported record had
% the letters transposed) - confirm against the proceedings front matter.
% NOTE(review): url uses the canonical Anthology host instead of the preview
% staging host from the ingestion branch - confirm it resolves once the
% volume is live.
@inproceedings{ratnakar-vats-2026-geometry,
  author    = {Ratnakar, Shivam and Vats, Kartikeya},
  title     = {The Geometry of Refusal: Linear Instability in Safety-Aligned {LLMs}},
  editor    = {Chang, Kai-Wei and
               Mehrabi, Ninareh and
               Krishna, Satyapriya and
               Das, Anubrata and
               Dhamala, Jwala and
               Cao, Yang Trista and
               Kumarage, Tharindu and
               Ramakrishna, Anil and
               Christodoulopoulos, Christos and
               Wan, Yixin and
               Galstyan, Aram and
               Kumar, Anoop and
               Gupta, Rahul},
  booktitle = {Proceedings of the 6th Workshop on Trustworthy {NLP} ({TrustNLP} 2026)},
  month     = jul,
  year      = {2026},
  address   = {San Diego, California},
  publisher = {Association for Computational Linguistics},
  pages     = {653--662},
  isbn      = {979-8-89176-418-7},
  url       = {https://aclanthology.org/2026.trustnlp-main.51/},
}