% "The Vault" dataset paper, NLP-OSS 2023 workshop proceedings (ACL Anthology record 2023.nlposs-1.25).
% The url field is the canonical Anthology address, not a temporary preview/staging build.
% Braces in title/booktitle keep the dataset name and the workshop acronym capitalised under recasing styles.
@inproceedings{manh-etal-2023-vault,
  title     = {The {Vault}: A Comprehensive Multilingual Dataset for Advancing Code Understanding and Generation},
  author    = {Manh, Dung Nguyen and Hai, Nam Le and Dau, Anh T. V. and Nguyen, Anh Minh and Nghiem, Khanh and Guo, Jin and Bui, Nghi D. Q.},
  editor    = {Tan, Liling and Milajevs, Dmitrijs and Chauhan, Geeticka and Gwinnup, Jeremy and Rippeth, Elijah},
  booktitle = {Proceedings of the 3rd Workshop for Natural Language Processing Open Source Software ({NLP-OSS} 2023)},
  month     = dec,
  year      = {2023},
  address   = {Singapore},
  publisher = {Association for Computational Linguistics},
  url       = {https://aclanthology.org/2023.nlposs-1.25/},
  doi       = {10.18653/v1/2023.nlposs-1.25},
  pages     = {219--244},
}