% PKU-SafeRLHF paper, ACL 2025 main conference proceedings (Volume 1: Long Papers).
% The url field uses the canonical ACL Anthology address rather than the
% temporary "preview ... ingestion" staging address, which is not a stable link.
% Title acronyms are protected as whole words so sentence-casing styles keep them intact.
@inproceedings{ji-etal-2025-pku,
    title     = {{PKU-SafeRLHF}: Towards Multi-Level Safety Alignment for {LLMs} with Human Preference},
    author    = {Ji, Jiaming and
                 Hong, Donghai and
                 Zhang, Borong and
                 Chen, Boyuan and
                 Dai, Josef and
                 Zheng, Boren and
                 Qiu, Tianyi Alex and
                 Zhou, Jiayi and
                 Wang, Kaile and
                 Li, Boxun and
                 Han, Sirui and
                 Guo, Yike and
                 Yang, Yaodong},
    editor    = {Che, Wanxiang and
                 Nabende, Joyce and
                 Shutova, Ekaterina and
                 Pilehvar, Mohammad Taher},
    booktitle = {Proceedings of the 63rd Annual Meeting of the Association for Computational Linguistics (Volume 1: Long Papers)},
    month     = jul,
    year      = {2025},
    address   = {Vienna, Austria},
    publisher = {Association for Computational Linguistics},
    pages     = {31983--32016},
    isbn      = {979-8-89176-251-0},
    doi       = {10.18653/v1/2025.acl-long.1544},
    url       = {https://aclanthology.org/2025.acl-long.1544/},
}