% Devlin (2017), EMNLP 2017 proceedings paper on fast CPU decoding for NMT.
% The url is the canonical ACL Anthology landing page (Anthology ID D17-1300,
% matching the DOI suffix), not a temporary preview/staging build.
@inproceedings{devlin-2017-sharp,
  title     = {Sharp Models on Dull Hardware: Fast and Accurate Neural Machine Translation Decoding on the {CPU}},
  author    = {Devlin, Jacob},
  editor    = {Palmer, Martha and Hwa, Rebecca and Riedel, Sebastian},
  booktitle = {Proceedings of the 2017 Conference on Empirical Methods in Natural Language Processing},
  month     = sep,
  year      = {2017},
  address   = {Copenhagen, Denmark},
  publisher = {Association for Computational Linguistics},
  url       = {https://aclanthology.org/D17-1300/},
  doi       = {10.18653/v1/D17-1300},
  pages     = {2820--2825},
}