% Journal article in TACL, volume 14 (2026), pages 656--688.
% The url field uses the canonical ACL Anthology address for Anthology ID
% 2026.tacl-1.30 instead of a preview-build link, which is not a stable
% location. The doi field remains the preferred persistent identifier.
@article{mu-etal-2026-cross,
  author    = {Mu, Yongyu and Wu, Yuzhang and Fan, Yuchun and Wang, Chenglong and Li, Hengyu and Zeng, Jiali and He, Qiaozhi and Yang, Murun and Meng, Fandong and Zhou, Jie and Xiao, Tong and Zhu, Jingbo},
  title     = {Cross-layer Attention Sharing for Pre-trained Large Language Models},
  journal   = {Transactions of the Association for Computational Linguistics},
  volume    = {14},
  pages     = {656--688},
  year      = {2026},
  publisher = {MIT Press},
  address   = {Cambridge, MA},
  doi       = {10.1162/tacl.a.616},
  url       = {https://aclanthology.org/2026.tacl-1.30/},
}