% Workshop paper from the Proceedings of the First BabyLM Workshop (pp. 288--300).
% The third author's particle is entered as a lowercase "von" part so that
% BibTeX parses it as part of the surname rather than as given names.
% NOTE(review): the url field points at a preview/ingest host; confirm whether
% a canonical link should replace it once the volume is published.
@inproceedings{guven-etal-2025-syntactic,
  title         = {Do Syntactic Categories Help in Developmentally Motivated Curriculum Learning for Language Models?},
  author        = {G{\"u}ven, Arzu Burcu and
                   Rogers, Anna and
                   van der Goot, Rob},
  editor        = {Charpentier, Lucas and
                   Choshen, Leshem and
                   Cotterell, Ryan and
                   Gul, Mustafa Omer and
                   Hu, Michael Y. and
                   Liu, Jing and
                   Jumelet, Jaap and
                   Linzen, Tal and
                   Mueller, Aaron and
                   Ross, Candace and
                   Shah, Raj Sanjay and
                   Warstadt, Alex and
                   Wilcox, Ethan Gotlieb and
                   Williams, Adina},
  booktitle     = {Proceedings of the First {BabyLM} Workshop},
  month         = nov,
  year          = {2025},
  address       = {Suzhou, China},
  publisher     = {Association for Computational Linguistics},
  url           = {https://preview.aclanthology.org/ingest-emnlp/2025.babylm-main.22/},
  pages         = {288--300},
  internal-note = {The exported ISBN field held only the placeholder TODO; add a real isbn field once the number is known.},
  abstract      = {We examine the syntactic properties of BabyLM corpus, and age-groups within CHILDES. While we find that CHILDES does not exhibit strong syntactic differentiation by age, we show that the syntactic knowledge about the training data can be helpful in interpreting model performance on linguistic tasks. For curriculum learning, we explore developmental and several alternative cognitively inspired curriculum approaches. We find that some curricula help with reading tasks, but the main performance improvement come from using the subset of syntactically categorizable data, rather than the full noisy corpus.},
}
Markdown (Informal)
[Do Syntactic Categories Help in Developmentally Motivated Curriculum Learning for Language Models?](https://preview.aclanthology.org/ingest-emnlp/2025.babylm-main.22/) (Güven et al., BabyLM 2025)
ACL