% EMNLP 2022 main-conference paper (ACL Anthology ID 2022.emnlp-main.279).
% The url field uses the stable aclanthology.org landing page; preview-branch
% hosts are temporary build previews and should not be cited.
@inproceedings{kurtic-etal-2022-optimal,
  author    = {Kurtic, Eldar and Campos, Daniel and Nguyen, Tuan and Frantar, Elias and Kurtz, Mark and Fineran, Benjamin and Goin, Michael and Alistarh, Dan},
  title     = {The Optimal {BERT} Surgeon: Scalable and Accurate Second-Order Pruning for Large Language Models},
  editor    = {Goldberg, Yoav and Kozareva, Zornitsa and Zhang, Yue},
  booktitle = {Proceedings of the 2022 Conference on Empirical Methods in Natural Language Processing},
  month     = dec,
  year      = {2022},
  address   = {Abu Dhabi, United Arab Emirates},
  publisher = {Association for Computational Linguistics},
  pages     = {4163--4181},
  doi       = {10.18653/v1/2022.emnlp-main.279},
  url       = {https://aclanthology.org/2022.emnlp-main.279/},
}