% Zhu et al., ACL 2020 (58th Annual Meeting) conference paper.
% The url field uses the canonical ACL Anthology host; the doi field holds the bare DOI.
@inproceedings{zhu-etal-2020-batch,
  author    = {Zhu, Qile and Bi, Wei and Liu, Xiaojiang and Ma, Xiyao and Li, Xiaolin and Wu, Dapeng},
  title     = {A Batch Normalized Inference Network Keeps the {KL} Vanishing Away},
  editor    = {Jurafsky, Dan and Chai, Joyce and Schluter, Natalie and Tetreault, Joel},
  booktitle = {Proceedings of the 58th Annual Meeting of the Association for Computational Linguistics},
  month     = jul,
  year      = {2020},
  address   = {Online},
  publisher = {Association for Computational Linguistics},
  pages     = {2636--2649},
  doi       = {10.18653/v1/2020.acl-main.235},
  url       = {https://aclanthology.org/2020.acl-main.235/},
}