% Goriely et al. (2024): paper in the 2nd BabyLM Challenge proceedings,
% ACL Anthology ID 2024.conll-babylm.4, pages 37--53.
% The url field uses the canonical aclanthology.org address rather than a
% preview.aclanthology.org staging-branch link, which is not a stable target.
@inproceedings{goriely-etal-2024-babble,
  title     = {From Babble to Words: Pre-Training Language Models on Continuous Streams of Phonemes},
  author    = {Goriely, Z{\'e}bulon and
               Diehl Martinez, Richard and
               Caines, Andrew and
               Buttery, Paula and
               Beinborn, Lisa},
  editor    = {Hu, Michael Y. and
               Mueller, Aaron and
               Ross, Candace and
               Williams, Adina and
               Linzen, Tal and
               Zhuang, Chengxu and
               Choshen, Leshem and
               Cotterell, Ryan and
               Warstadt, Alex and
               Wilcox, Ethan Gotlieb},
  booktitle = {The 2nd {BabyLM} Challenge at the 28th Conference on Computational Natural Language Learning},
  month     = nov,
  year      = {2024},
  address   = {Miami, FL, USA},
  publisher = {Association for Computational Linguistics},
  url       = {https://aclanthology.org/2024.conll-babylm.4/},
  pages     = {37--53},
}