% Zhao et al., EACL 2021 (main volume): small BERT models via mixed-vocabulary training.
@inproceedings{zhao-etal-2021-extremely,
  title     = {Extremely Small {BERT} Models from Mixed-Vocabulary Training},
  author    = {Zhao, Sanqiang and Gupta, Raghav and Song, Yang and Zhou, Denny},
  editor    = {Merlo, Paola and Tiedemann, Jorg and Tsarfaty, Reut},
  booktitle = {Proceedings of the 16th Conference of the European Chapter of the Association for Computational Linguistics: Main Volume},
  month     = apr,
  year      = {2021},
  address   = {Online},
  publisher = {Association for Computational Linguistics},
  url       = {https://aclanthology.org/2021.eacl-main.238/},
  doi       = {10.18653/v1/2021.eacl-main.238},
  pages     = {2753--2759},
}