% Conference paper from the EMNLP 2024 proceedings
% (ACL Anthology ID 2024.emnlp-main.987, as encoded in the DOI).
% The url field uses the canonical aclanthology.org address rather than a
% preview/staging host, which is tied to a temporary ingestion branch.
% NOTE(review): the address field carries the conference location as exported
% by the Anthology, not a publisher city -- confirm this is what the target
% style expects.
@inproceedings{liu-etal-2024-pruning,
  author    = {Liu, Deyuan and Qin, Zhanyue and Wang, Hairu and Yang, Zhao and
               Wang, Zecheng and Rong, Fangying and Liu, Qingbin and
               Hao, Yanchao and Li, Bo and Chen, Xi and Fan, Cunhang and
               Lv, Zhao and Chu, Dianhui and Tu, Zhiying and Sui, Dianbo},
  title     = {Pruning via Merging: Compressing {LLMs} via Manifold Alignment Based Layer Merging},
  editor    = {Al-Onaizan, Yaser and Bansal, Mohit and Chen, Yun-Nung},
  booktitle = {Proceedings of the 2024 Conference on Empirical Methods in Natural Language Processing},
  month     = nov,
  year      = {2024},
  address   = {Miami, Florida, USA},
  publisher = {Association for Computational Linguistics},
  pages     = {17817--17829},
  doi       = {10.18653/v1/2024.emnlp-main.987},
  url       = {https://aclanthology.org/2024.emnlp-main.987/},
}