% Xiao et al., "Variator" -- Findings of ACL: EMNLP 2023 (ACL Anthology ID 2023.findings-emnlp.666).
@inproceedings{xiao-etal-2023-variator,
  title     = {{Variator}: Accelerating Pre-trained Models with Plug-and-Play Compression Modules},
  author    = {Xiao, Chaojun and
               Luo, Yuqi and
               Zhang, Wenbin and
               Zhang, Pengle and
               Han, Xu and
               Lin, Yankai and
               Zhang, Zhengyan and
               Xie, Ruobing and
               Liu, Zhiyuan and
               Sun, Maosong and
               Zhou, Jie},
  editor    = {Bouamor, Houda and
               Pino, Juan and
               Bali, Kalika},
  booktitle = {Findings of the Association for Computational Linguistics: {EMNLP} 2023},
  month     = dec,
  year      = {2023},
  address   = {Singapore},
  publisher = {Association for Computational Linguistics},
  url       = {https://aclanthology.org/2023.findings-emnlp.666/},
  doi       = {10.18653/v1/2023.findings-emnlp.666},
  pages     = {9947--9959},
}