@comment{
  Findings of ACL 2026 paper on the learnability of wanna contraction by BabyLMs.
  NOTE(review): the url field below points at a preview.aclanthology.org ingest
  path, which looks like a staging address -- confirm the canonical URL (or add
  a doi) before relying on this entry.
}
@inproceedings{noh-song-2026-babylms,
  title     = {Do {BabyLMs} Wanna Learn Wanna Contraction? On the Learnability without Language-Specific Bias},
  author    = {Noh, Kangsan and
               Song, Sanghoun},
  editor    = {Liakata, Maria and
               Moreira, Viviane P. and
               Zhang, Jiajun and
               Jurgens, David},
  booktitle = {Findings of the {Association} for {Computational} {Linguistics}: {ACL} 2026},
  month     = jul,
  year      = {2026},
  address   = {San Diego, California, United States},
  publisher = {Association for Computational Linguistics},
  url       = {https://preview.aclanthology.org/ingest-acl/2026.findings-acl.552/},
  pages     = {11361--11372},
  isbn      = {979-8-89176-395-1},
  abstract  = {This study investigates whether the grammatical constraints on wanna contraction{---}a phenomenon traditionally cited as evidence for innate linguistic knowledge{---}can be learned via BabyLMs, which are designed to reflect cognitively plausible learning conditions. Two datasets were constructed from the CHILDES corpus, varying in embedded verb frequency (high vs. low) and grammaticality, and contrasting grammatical instances (object extraction contexts) with ungrammatical ones (subject extraction contexts) of wanna contractions. Using surprisal as a metric, we evaluated 24 BabyLMs from the 2024 BabyLM Challenge alongside four standard models, including BERT and GPT-2. While the standard models performed with near-perfect consistency, the BabyLMs showed modest but meaningful sensitivity, particularly those trained on larger datasets and tested on high-frequency wanna instances. In particular, only encoder-based BabyLMs captured the grammatical constraint, with babylm24{\_}MLSM exhibiting consistent performance. Nonetheless, our findings provide evidence for limited and conditional learnability of wanna contraction by artificial learners under cognitively realistic input conditions.},
}
Markdown (Informal)
[Do BabyLMs Wanna Learn Wanna Contraction? On the Learnability without Language-Specific Bias](https://preview.aclanthology.org/ingest-acl/2026.findings-acl.552/) (Noh & Song, Findings 2026)
ACL