% EMNLP 2021 main-conference paper (ACL Anthology ID 2021.emnlp-main.603).
% The url field uses the canonical aclanthology.org address, not a preview build.
@inproceedings{wu-etal-2021-universal,
  title     = {Universal-{KD}: Attention-based Output-Grounded Intermediate Layer Knowledge Distillation},
  author    = {Wu, Yimeng and Rezagholizadeh, Mehdi and Ghaddar, Abbas and Haidar, Md Akmal and Ghodsi, Ali},
  editor    = {Moens, Marie-Francine and Huang, Xuanjing and Specia, Lucia and Yih, Scott Wen-tau},
  booktitle = {Proceedings of the 2021 Conference on Empirical Methods in Natural Language Processing},
  month     = nov,
  year      = {2021},
  address   = {Online and Punta Cana, Dominican Republic},
  publisher = {Association for Computational Linguistics},
  url       = {https://aclanthology.org/2021.emnlp-main.603/},
  doi       = {10.18653/v1/2021.emnlp-main.603},
  pages     = {7649--7661},
}