% Demo-track paper from the NAACL 2018 proceedings (ACL Anthology ID N18-5002).
% The url field uses the canonical Anthology permalink, not a preview/staging build.
@inproceedings{tu-etal-2018-pay,
  author    = {Tu, Zhucheng and Li, Mengping and Lin, Jimmy},
  title     = {Pay-Per-Request Deployment of Neural Network Models Using Serverless Architectures},
  editor    = {Liu, Yang and Paek, Tim and Patwardhan, Manasi},
  booktitle = {Proceedings of the 2018 Conference of the North {American} Chapter of the Association for Computational Linguistics: Demonstrations},
  month     = jun,
  year      = {2018},
  address   = {New Orleans, Louisiana},
  publisher = {Association for Computational Linguistics},
  pages     = {6--10},
  doi       = {10.18653/v1/N18-5002},
  url       = {https://aclanthology.org/N18-5002/},
}