@proceedings{babylm-2025-main,
    title = "Proceedings of the First BabyLM Workshop",
    editor = "Charpentier, Lucas  and
      Choshen, Leshem  and
      Cotterell, Ryan  and
      Gul, Mustafa Omer  and
      Hu, Michael Y.  and
      Liu, Jing  and
      Jumelet, Jaap  and
      Linzen, Tal  and
      Mueller, Aaron  and
      Ross, Candace  and
      Shah, Raj Sanjay  and
      Warstadt, Alex  and
      Wilcox, Ethan Gotlieb  and
      Williams, Adina",
    month = nov,
    year = "2025",
    address = "Suzhou, China",
    publisher = "Association for Computational Linguistics",
    url = "https://aclanthology.org/2025.babylm-main.0/",
    doi = "10.18653/v1/2025.babylm-main.0"
}
@inproceedings{velasco-roque-2025-rethinking,
    title = "Rethinking the Role of Text Complexity in Language Model Pretraining",
    author = "Velasco, Dan John  and
      Roque, Matthew Theodore",
    editor = "Charpentier, Lucas  and
      Choshen, Leshem  and
      Cotterell, Ryan  and
      Gul, Mustafa Omer  and
      Hu, Michael Y.  and
      Liu, Jing  and
      Jumelet, Jaap  and
      Linzen, Tal  and
      Mueller, Aaron  and
      Ross, Candace  and
      Shah, Raj Sanjay  and
      Warstadt, Alex  and
      Wilcox, Ethan Gotlieb  and
      Williams, Adina",
    booktitle = "Proceedings of the First BabyLM Workshop",
    month = nov,
    year = "2025",
    address = "Suzhou, China",
    publisher = "Association for Computational Linguistics",
    url = "https://aclanthology.org/2025.babylm-main.1/",
    doi = "10.18653/v1/2025.babylm-main.1",
    pages = "1--28"
}
@inproceedings{ulm-etal-2025-contrastive,
    title = "Contrastive Decoding for Synthetic Data Generation in Low-Resource Language Modeling",
    author = "Ulm, Jannek  and
      Du, Kevin  and
      Sn{\ae}bjarnarson, V{\'e}steinn",
    editor = "Charpentier, Lucas  and
      Choshen, Leshem  and
      Cotterell, Ryan  and
      Gul, Mustafa Omer  and
      Hu, Michael Y.  and
      Liu, Jing  and
      Jumelet, Jaap  and
      Linzen, Tal  and
      Mueller, Aaron  and
      Ross, Candace  and
      Shah, Raj Sanjay  and
      Warstadt, Alex  and
      Wilcox, Ethan Gotlieb  and
      Williams, Adina",
    booktitle = "Proceedings of the First BabyLM Workshop",
    month = nov,
    year = "2025",
    address = "Suzhou, China",
    publisher = "Association for Computational Linguistics",
    url = "https://aclanthology.org/2025.babylm-main.2/",
    doi = "10.18653/v1/2025.babylm-main.2",
    pages = "29--41"
}
@inproceedings{mehta-etal-2025-unifying,
    title = "Unifying Mixture of Experts and Multi-Head Latent Attention for Efficient Language Models",
    author = "Mehta, Sushant  and
      Dandekar, Raj  and
      Dandekar, Rajat  and
      Panat, Sreedath",
    editor = "Charpentier, Lucas  and
      Choshen, Leshem  and
      Cotterell, Ryan  and
      Gul, Mustafa Omer  and
      Hu, Michael Y.  and
      Liu, Jing  and
      Jumelet, Jaap  and
      Linzen, Tal  and
      Mueller, Aaron  and
      Ross, Candace  and
      Shah, Raj Sanjay  and
      Warstadt, Alex  and
      Wilcox, Ethan Gotlieb  and
      Williams, Adina",
    booktitle = "Proceedings of the First BabyLM Workshop",
    month = nov,
    year = "2025",
    address = "Suzhou, China",
    publisher = "Association for Computational Linguistics",
    url = "https://aclanthology.org/2025.babylm-main.3/",
    doi = "10.18653/v1/2025.babylm-main.3",
    pages = "42--51"
}
@inproceedings{askari-etal-2025-babylms,
    title = "Are {B}aby{LM}s Deaf to {G}ricean Maxims? A Pragmatic Evaluation of Sample-efficient Language Models",
    author = {Askari, Raha  and
      Zarrie{\ss}, Sina  and
      Alacam, {\"O}zge  and
      Sieker, Judith},
    editor = "Charpentier, Lucas  and
      Choshen, Leshem  and
      Cotterell, Ryan  and
      Gul, Mustafa Omer  and
      Hu, Michael Y.  and
      Liu, Jing  and
      Jumelet, Jaap  and
      Linzen, Tal  and
      Mueller, Aaron  and
      Ross, Candace  and
      Shah, Raj Sanjay  and
      Warstadt, Alex  and
      Wilcox, Ethan Gotlieb  and
      Williams, Adina",
    booktitle = "Proceedings of the First BabyLM Workshop",
    month = nov,
    year = "2025",
    address = "Suzhou, China",
    publisher = "Association for Computational Linguistics",
    url = "https://aclanthology.org/2025.babylm-main.4/",
    doi = "10.18653/v1/2025.babylm-main.4",
    pages = "52--65"
}
@inproceedings{takmaz-etal-2025-model,
    title = "Model Merging to Maintain Language-Only Performance in Developmentally Plausible Multimodal Models",
    author = "Takmaz, Ece  and
      Bylinina, Lisa  and
      Dotlacil, Jakub",
    editor = "Charpentier, Lucas  and
      Choshen, Leshem  and
      Cotterell, Ryan  and
      Gul, Mustafa Omer  and
      Hu, Michael Y.  and
      Liu, Jing  and
      Jumelet, Jaap  and
      Linzen, Tal  and
      Mueller, Aaron  and
      Ross, Candace  and
      Shah, Raj Sanjay  and
      Warstadt, Alex  and
      Wilcox, Ethan Gotlieb  and
      Williams, Adina",
    booktitle = "Proceedings of the First BabyLM Workshop",
    month = nov,
    year = "2025",
    address = "Suzhou, China",
    publisher = "Association for Computational Linguistics",
    url = "https://aclanthology.org/2025.babylm-main.5/",
    doi = "10.18653/v1/2025.babylm-main.5",
    pages = "66--75"
}
@inproceedings{gelboim-sulem-2025-tafberta,
    title = "{T}af{BERT}a: Learning Grammatical Rules from Small-Scale Language Acquisition Data in {H}ebrew",
    author = "Gelboim, Anita  and
      Sulem, Elior",
    editor = "Charpentier, Lucas  and
      Choshen, Leshem  and
      Cotterell, Ryan  and
      Gul, Mustafa Omer  and
      Hu, Michael Y.  and
      Liu, Jing  and
      Jumelet, Jaap  and
      Linzen, Tal  and
      Mueller, Aaron  and
      Ross, Candace  and
      Shah, Raj Sanjay  and
      Warstadt, Alex  and
      Wilcox, Ethan Gotlieb  and
      Williams, Adina",
    booktitle = "Proceedings of the First BabyLM Workshop",
    month = nov,
    year = "2025",
    address = "Suzhou, China",
    publisher = "Association for Computational Linguistics",
    url = "https://aclanthology.org/2025.babylm-main.6/",
    doi = "10.18653/v1/2025.babylm-main.6",
    pages = "76--90"
}
% NOTE(review): "overtfitting" in the title looks like a typo for "overfitting",
% and the first author "Rui, Yamamoto" may have family/given names swapped.
% Both are left as-is here; confirm against the published paper before changing.
@inproceedings{rui-miura-2025-forgetter,
    title = "{FORGETTER} with forgetful hyperparameters and recurring sleeps can continue to learn beyond normal overtfitting limits",
    author = "Rui, Yamamoto  and
      Miura, Keiji",
    editor = "Charpentier, Lucas  and
      Choshen, Leshem  and
      Cotterell, Ryan  and
      Gul, Mustafa Omer  and
      Hu, Michael Y.  and
      Liu, Jing  and
      Jumelet, Jaap  and
      Linzen, Tal  and
      Mueller, Aaron  and
      Ross, Candace  and
      Shah, Raj Sanjay  and
      Warstadt, Alex  and
      Wilcox, Ethan Gotlieb  and
      Williams, Adina",
    booktitle = "Proceedings of the First BabyLM Workshop",
    month = nov,
    year = "2025",
    address = "Suzhou, China",
    publisher = "Association for Computational Linguistics",
    url = "https://aclanthology.org/2025.babylm-main.7/",
    doi = "10.18653/v1/2025.babylm-main.7",
    pages = "91--99"
}
% The first author's family name is the compound "La Fiandra"; the citation key
% is kept unchanged so existing \cite commands continue to resolve.
@inproceedings{fiandra-etal-2025-large,
    title = "Large Language Models and Children Have Different Learning Trajectories in Determiner Acquisition",
    author = "La Fiandra, Olivia  and
      Fernandez Echeverri, Nathalie  and
      Shafto, Patrick  and
      Feldman, Naomi H.",
    editor = "Charpentier, Lucas  and
      Choshen, Leshem  and
      Cotterell, Ryan  and
      Gul, Mustafa Omer  and
      Hu, Michael Y.  and
      Liu, Jing  and
      Jumelet, Jaap  and
      Linzen, Tal  and
      Mueller, Aaron  and
      Ross, Candace  and
      Shah, Raj Sanjay  and
      Warstadt, Alex  and
      Wilcox, Ethan Gotlieb  and
      Williams, Adina",
    booktitle = "Proceedings of the First BabyLM Workshop",
    month = nov,
    year = "2025",
    address = "Suzhou, China",
    publisher = "Association for Computational Linguistics",
    url = "https://aclanthology.org/2025.babylm-main.8/",
    doi = "10.18653/v1/2025.babylm-main.8",
    pages = "100--108"
}
@inproceedings{hsiao-dutta-2025-design,
    title = "Design and Analysis of few Million Parameter Transformer-based Language Models trained over a few Million Tokens Dataset",
    author = "Hsiao, Yen-Che  and
      Dutta, Abhishek",
    editor = "Charpentier, Lucas  and
      Choshen, Leshem  and
      Cotterell, Ryan  and
      Gul, Mustafa Omer  and
      Hu, Michael Y.  and
      Liu, Jing  and
      Jumelet, Jaap  and
      Linzen, Tal  and
      Mueller, Aaron  and
      Ross, Candace  and
      Shah, Raj Sanjay  and
      Warstadt, Alex  and
      Wilcox, Ethan Gotlieb  and
      Williams, Adina",
    booktitle = "Proceedings of the First BabyLM Workshop",
    month = nov,
    year = "2025",
    address = "Suzhou, China",
    publisher = "Association for Computational Linguistics",
    url = "https://aclanthology.org/2025.babylm-main.9/",
    doi = "10.18653/v1/2025.babylm-main.9",
    pages = "109--129"
}
@inproceedings{salhan-etal-2025-best,
    title = "What is the Best Sequence Length for {B}aby{LM}?",
    author = "Salhan, Suchir  and
      Diehl Martinez, Richard  and
      Goriely, Z{\'e}bulon  and
      Buttery, Paula",
    editor = "Charpentier, Lucas  and
      Choshen, Leshem  and
      Cotterell, Ryan  and
      Gul, Mustafa Omer  and
      Hu, Michael Y.  and
      Liu, Jing  and
      Jumelet, Jaap  and
      Linzen, Tal  and
      Mueller, Aaron  and
      Ross, Candace  and
      Shah, Raj Sanjay  and
      Warstadt, Alex  and
      Wilcox, Ethan Gotlieb  and
      Williams, Adina",
    booktitle = "Proceedings of the First BabyLM Workshop",
    month = nov,
    year = "2025",
    address = "Suzhou, China",
    publisher = "Association for Computational Linguistics",
    url = "https://aclanthology.org/2025.babylm-main.10/",
    doi = "10.18653/v1/2025.babylm-main.10",
    pages = "130--146"
}
@inproceedings{aman-etal-2025-bitmar,
    title = "{B}it{M}ar: Low-Bit Multimodal Fusion with Episodic Memory for Edge Devices",
    author = "Aman, Euhid  and
      Carlin, Esteban  and
      Pao, Hsing-Kuo Kenneth  and
      Beltrame, Giovanni  and
      Sari, Ghaluh Indah Permata  and
      Chen, Yie-Tarng",
    editor = "Charpentier, Lucas  and
      Choshen, Leshem  and
      Cotterell, Ryan  and
      Gul, Mustafa Omer  and
      Hu, Michael Y.  and
      Liu, Jing  and
      Jumelet, Jaap  and
      Linzen, Tal  and
      Mueller, Aaron  and
      Ross, Candace  and
      Shah, Raj Sanjay  and
      Warstadt, Alex  and
      Wilcox, Ethan Gotlieb  and
      Williams, Adina",
    booktitle = "Proceedings of the First BabyLM Workshop",
    month = nov,
    year = "2025",
    address = "Suzhou, China",
    publisher = "Association for Computational Linguistics",
    url = "https://aclanthology.org/2025.babylm-main.11/",
    doi = "10.18653/v1/2025.babylm-main.11",
    pages = "147--154"
}
@inproceedings{loaiciga-etal-2025-exploring,
    title = "Exploring smaller batch sizes for a high-performing {B}aby{LM} model architecture",
    author = "Lo{\'a}iciga, Sharid  and
      Fysikoudi, Eleni  and
      Sayeed, Asad B.",
    editor = "Charpentier, Lucas  and
      Choshen, Leshem  and
      Cotterell, Ryan  and
      Gul, Mustafa Omer  and
      Hu, Michael Y.  and
      Liu, Jing  and
      Jumelet, Jaap  and
      Linzen, Tal  and
      Mueller, Aaron  and
      Ross, Candace  and
      Shah, Raj Sanjay  and
      Warstadt, Alex  and
      Wilcox, Ethan Gotlieb  and
      Williams, Adina",
    booktitle = "Proceedings of the First BabyLM Workshop",
    month = nov,
    year = "2025",
    address = "Suzhou, China",
    publisher = "Association for Computational Linguistics",
    url = "https://aclanthology.org/2025.babylm-main.12/",
    doi = "10.18653/v1/2025.babylm-main.12",
    pages = "155--159"
}
@inproceedings{gao-etal-2025-bliss,
    title = "{BL}i{SS}: Evaluating Bilingual Learner Competence in Second Language Small Language Models",
    author = "Gao, Yuan  and
      Salhan, Suchir  and
      Caines, Andrew  and
      Buttery, Paula  and
      Sun, Weiwei",
    editor = "Charpentier, Lucas  and
      Choshen, Leshem  and
      Cotterell, Ryan  and
      Gul, Mustafa Omer  and
      Hu, Michael Y.  and
      Liu, Jing  and
      Jumelet, Jaap  and
      Linzen, Tal  and
      Mueller, Aaron  and
      Ross, Candace  and
      Shah, Raj Sanjay  and
      Warstadt, Alex  and
      Wilcox, Ethan Gotlieb  and
      Williams, Adina",
    booktitle = "Proceedings of the First BabyLM Workshop",
    month = nov,
    year = "2025",
    address = "Suzhou, China",
    publisher = "Association for Computational Linguistics",
    url = "https://aclanthology.org/2025.babylm-main.13/",
    doi = "10.18653/v1/2025.babylm-main.13",
    pages = "160--174"
}
@inproceedings{haller-etal-2025-sample,
    title = "Sample-Efficient Language Modeling with Linear Attention and Lightweight Enhancements",
    author = "Haller, Patrick  and
      Golde, Jonas  and
      Akbik, Alan",
    editor = "Charpentier, Lucas  and
      Choshen, Leshem  and
      Cotterell, Ryan  and
      Gul, Mustafa Omer  and
      Hu, Michael Y.  and
      Liu, Jing  and
      Jumelet, Jaap  and
      Linzen, Tal  and
      Mueller, Aaron  and
      Ross, Candace  and
      Shah, Raj Sanjay  and
      Warstadt, Alex  and
      Wilcox, Ethan Gotlieb  and
      Williams, Adina",
    booktitle = "Proceedings of the First BabyLM Workshop",
    month = nov,
    year = "2025",
    address = "Suzhou, China",
    publisher = "Association for Computational Linguistics",
    url = "https://aclanthology.org/2025.babylm-main.14/",
    doi = "10.18653/v1/2025.babylm-main.14",
    pages = "175--191"
}
@inproceedings{ganescu-etal-2025-looking,
    title = "Looking to Learn: Token-wise Dynamic Gating for Low-Resource Vision-Language Modelling",
    author = "Ganescu, Bianca-Mihaela  and
      Salhan, Suchir  and
      Caines, Andrew  and
      Buttery, Paula",
    editor = "Charpentier, Lucas  and
      Choshen, Leshem  and
      Cotterell, Ryan  and
      Gul, Mustafa Omer  and
      Hu, Michael Y.  and
      Liu, Jing  and
      Jumelet, Jaap  and
      Linzen, Tal  and
      Mueller, Aaron  and
      Ross, Candace  and
      Shah, Raj Sanjay  and
      Warstadt, Alex  and
      Wilcox, Ethan Gotlieb  and
      Williams, Adina",
    booktitle = "Proceedings of the First BabyLM Workshop",
    month = nov,
    year = "2025",
    address = "Suzhou, China",
    publisher = "Association for Computational Linguistics",
    url = "https://aclanthology.org/2025.babylm-main.15/",
    doi = "10.18653/v1/2025.babylm-main.15",
    pages = "192--217"
}
% NOTE(review): the first author's name mixes a LaTeX accent escape with raw
% UTF-8 letters (s with comma below). This needs a UTF-8-aware toolchain
% (e.g. Biber); classic 8-bit BibTeX may mis-sort or garble it. Left unchanged
% because no standard escape reproduces the comma-below glyph exactly.
@inproceedings{papusoi-nisioi-2025-comparison,
    title = "A Comparison of Elementary Baselines for {B}aby{LM}",
    author = "P{\u{a}}pușoi, Rareș  and
      Nisioi, Sergiu",
    editor = "Charpentier, Lucas  and
      Choshen, Leshem  and
      Cotterell, Ryan  and
      Gul, Mustafa Omer  and
      Hu, Michael Y.  and
      Liu, Jing  and
      Jumelet, Jaap  and
      Linzen, Tal  and
      Mueller, Aaron  and
      Ross, Candace  and
      Shah, Raj Sanjay  and
      Warstadt, Alex  and
      Wilcox, Ethan Gotlieb  and
      Williams, Adina",
    booktitle = "Proceedings of the First BabyLM Workshop",
    month = nov,
    year = "2025",
    address = "Suzhou, China",
    publisher = "Association for Computational Linguistics",
    url = "https://aclanthology.org/2025.babylm-main.16/",
    doi = "10.18653/v1/2025.babylm-main.16",
    pages = "218--225"
}
@inproceedings{mccurdy-etal-2025-two,
    title = "Two ways into the hall of mirrors: Language exposure and lossy memory drive cross-linguistic grammaticality illusions in language models",
    author = "McCurdy, Kate  and
      Christian, Katharina  and
      Seyfried, Amelie  and
      Sonkin, Mikhail",
    editor = "Charpentier, Lucas  and
      Choshen, Leshem  and
      Cotterell, Ryan  and
      Gul, Mustafa Omer  and
      Hu, Michael Y.  and
      Liu, Jing  and
      Jumelet, Jaap  and
      Linzen, Tal  and
      Mueller, Aaron  and
      Ross, Candace  and
      Shah, Raj Sanjay  and
      Warstadt, Alex  and
      Wilcox, Ethan Gotlieb  and
      Williams, Adina",
    booktitle = "Proceedings of the First BabyLM Workshop",
    month = nov,
    year = "2025",
    address = "Suzhou, China",
    publisher = "Association for Computational Linguistics",
    url = "https://aclanthology.org/2025.babylm-main.17/",
    doi = "10.18653/v1/2025.babylm-main.17",
    pages = "226--236"
}
@inproceedings{poh-etal-2025-say,
    title = "What did you say? Generating Child-Directed Speech Questions to Train {LLM}s",
    author = "Poh, Whitney  and
      Tombolini, Michael  and
      Barak, Libby",
    editor = "Charpentier, Lucas  and
      Choshen, Leshem  and
      Cotterell, Ryan  and
      Gul, Mustafa Omer  and
      Hu, Michael Y.  and
      Liu, Jing  and
      Jumelet, Jaap  and
      Linzen, Tal  and
      Mueller, Aaron  and
      Ross, Candace  and
      Shah, Raj Sanjay  and
      Warstadt, Alex  and
      Wilcox, Ethan Gotlieb  and
      Williams, Adina",
    booktitle = "Proceedings of the First BabyLM Workshop",
    month = nov,
    year = "2025",
    address = "Suzhou, China",
    publisher = "Association for Computational Linguistics",
    url = "https://aclanthology.org/2025.babylm-main.18/",
    doi = "10.18653/v1/2025.babylm-main.18",
    pages = "237--245"
}
@inproceedings{roque-velasco-2025-beyond,
    title = "Beyond Repetition: Text Simplification and Curriculum Learning for Data-Constrained Pretraining",
    author = "Roque, Matthew Theodore  and
      Velasco, Dan John",
    editor = "Charpentier, Lucas  and
      Choshen, Leshem  and
      Cotterell, Ryan  and
      Gul, Mustafa Omer  and
      Hu, Michael Y.  and
      Liu, Jing  and
      Jumelet, Jaap  and
      Linzen, Tal  and
      Mueller, Aaron  and
      Ross, Candace  and
      Shah, Raj Sanjay  and
      Warstadt, Alex  and
      Wilcox, Ethan Gotlieb  and
      Williams, Adina",
    booktitle = "Proceedings of the First BabyLM Workshop",
    month = nov,
    year = "2025",
    address = "Suzhou, China",
    publisher = "Association for Computational Linguistics",
    url = "https://aclanthology.org/2025.babylm-main.19/",
    doi = "10.18653/v1/2025.babylm-main.19",
    pages = "246--255"
}
@inproceedings{tankala-etal-2025-curll,
    title = "{C}ur{LL}: A Developmental Framework to Evaluate Continual Learning in Language Models",
    author = "Tankala, Pavan Kalyan  and
      Mishra, Shubhra  and
      Lokam, Satya  and
      Goyal, Navin",
    editor = "Charpentier, Lucas  and
      Choshen, Leshem  and
      Cotterell, Ryan  and
      Gul, Mustafa Omer  and
      Hu, Michael Y.  and
      Liu, Jing  and
      Jumelet, Jaap  and
      Linzen, Tal  and
      Mueller, Aaron  and
      Ross, Candace  and
      Shah, Raj Sanjay  and
      Warstadt, Alex  and
      Wilcox, Ethan Gotlieb  and
      Williams, Adina",
    booktitle = "Proceedings of the First BabyLM Workshop",
    month = nov,
    year = "2025",
    address = "Suzhou, China",
    publisher = "Association for Computational Linguistics",
    url = "https://aclanthology.org/2025.babylm-main.20/",
    doi = "10.18653/v1/2025.babylm-main.20",
    pages = "256--278"
}
@inproceedings{bolucu-can-2025-morpheme,
    title = "A Morpheme-Aware Child-Inspired Language Model",
    author = {B{\"o}l{\"u}c{\"u}, Necva  and
      Can, Burcu},
    editor = "Charpentier, Lucas  and
      Choshen, Leshem  and
      Cotterell, Ryan  and
      Gul, Mustafa Omer  and
      Hu, Michael Y.  and
      Liu, Jing  and
      Jumelet, Jaap  and
      Linzen, Tal  and
      Mueller, Aaron  and
      Ross, Candace  and
      Shah, Raj Sanjay  and
      Warstadt, Alex  and
      Wilcox, Ethan Gotlieb  and
      Williams, Adina",
    booktitle = "Proceedings of the First BabyLM Workshop",
    month = nov,
    year = "2025",
    address = "Suzhou, China",
    publisher = "Association for Computational Linguistics",
    url = "https://aclanthology.org/2025.babylm-main.21/",
    doi = "10.18653/v1/2025.babylm-main.21",
    pages = "279--287"
}
% The third author's surname carries the lowercase particle "van der"; writing
% it in "von Last, First" form lets BibTeX parse the particle as the von part.
@inproceedings{guven-etal-2025-syntactic,
    title = "Do Syntactic Categories Help in Developmentally Motivated Curriculum Learning for Language Models?",
    author = {G{\"u}ven, Arzu Burcu  and
      Rogers, Anna  and
      van der Goot, Rob},
    editor = "Charpentier, Lucas  and
      Choshen, Leshem  and
      Cotterell, Ryan  and
      Gul, Mustafa Omer  and
      Hu, Michael Y.  and
      Liu, Jing  and
      Jumelet, Jaap  and
      Linzen, Tal  and
      Mueller, Aaron  and
      Ross, Candace  and
      Shah, Raj Sanjay  and
      Warstadt, Alex  and
      Wilcox, Ethan Gotlieb  and
      Williams, Adina",
    booktitle = "Proceedings of the First BabyLM Workshop",
    month = nov,
    year = "2025",
    address = "Suzhou, China",
    publisher = "Association for Computational Linguistics",
    url = "https://aclanthology.org/2025.babylm-main.22/",
    doi = "10.18653/v1/2025.babylm-main.22",
    pages = "288--300"
}
@inproceedings{kris-suppa-2025-slovakbabylm,
    title = "{S}lovak{B}aby{LM}: Replication of the {B}aby{LM} and Sample-efficient Pretraining for a Low-Resource Language",
    author = "Kri{\v{s}}, {\v{L}}ubo{\v{s}}  and
      Suppa, Marek",
    editor = "Charpentier, Lucas  and
      Choshen, Leshem  and
      Cotterell, Ryan  and
      Gul, Mustafa Omer  and
      Hu, Michael Y.  and
      Liu, Jing  and
      Jumelet, Jaap  and
      Linzen, Tal  and
      Mueller, Aaron  and
      Ross, Candace  and
      Shah, Raj Sanjay  and
      Warstadt, Alex  and
      Wilcox, Ethan Gotlieb  and
      Williams, Adina",
    booktitle = "Proceedings of the First BabyLM Workshop",
    month = nov,
    year = "2025",
    address = "Suzhou, China",
    publisher = "Association for Computational Linguistics",
    url = "https://aclanthology.org/2025.babylm-main.23/",
    doi = "10.18653/v1/2025.babylm-main.23",
    pages = "301--312"
}
@inproceedings{zain-etal-2025-single,
    title = "Single layer tiny Co4 outpaces {GPT}-2 and {GPT}-{BERT}",
    author = "Zain, Noor Ul  and
      Naseem, Mohsin Raza  and
      Adeel, Ahsan",
    editor = "Charpentier, Lucas  and
      Choshen, Leshem  and
      Cotterell, Ryan  and
      Gul, Mustafa Omer  and
      Hu, Michael Y.  and
      Liu, Jing  and
      Jumelet, Jaap  and
      Linzen, Tal  and
      Mueller, Aaron  and
      Ross, Candace  and
      Shah, Raj Sanjay  and
      Warstadt, Alex  and
      Wilcox, Ethan Gotlieb  and
      Williams, Adina",
    booktitle = "Proceedings of the First BabyLM Workshop",
    month = nov,
    year = "2025",
    address = "Suzhou, China",
    publisher = "Association for Computational Linguistics",
    url = "https://aclanthology.org/2025.babylm-main.24/",
    doi = "10.18653/v1/2025.babylm-main.24",
    pages = "313--322"
}
@inproceedings{salhan-etal-2025-teacher,
    title = "Teacher Demonstrations in a {B}aby{LM}{'}s Zone of Proximal Development for Contingent Multi-Turn Interaction",
    author = "Salhan, Suchir  and
      Gu, Hongyi  and
      Rooein, Donya  and
      Galvan-Sosa, Diana  and
      Gaudeau, Gabrielle  and
      Caines, Andrew  and
      Yuan, Zheng  and
      Buttery, Paula",
    editor = "Charpentier, Lucas  and
      Choshen, Leshem  and
      Cotterell, Ryan  and
      Gul, Mustafa Omer  and
      Hu, Michael Y.  and
      Liu, Jing  and
      Jumelet, Jaap  and
      Linzen, Tal  and
      Mueller, Aaron  and
      Ross, Candace  and
      Shah, Raj Sanjay  and
      Warstadt, Alex  and
      Wilcox, Ethan Gotlieb  and
      Williams, Adina",
    booktitle = "Proceedings of the First BabyLM Workshop",
    month = nov,
    year = "2025",
    address = "Suzhou, China",
    publisher = "Association for Computational Linguistics",
    url = "https://aclanthology.org/2025.babylm-main.25/",
    doi = "10.18653/v1/2025.babylm-main.25",
    pages = "323--355"
}
@inproceedings{schoenegger-etal-2025-influence,
    title = "Influence-driven Curriculum Learning for Pre-training on Limited Data",
    author = "Schoenegger, Loris  and
      Thoma, Lukas  and
      Blevins, Terra  and
      Roth, Benjamin",
    editor = "Charpentier, Lucas  and
      Choshen, Leshem  and
      Cotterell, Ryan  and
      Gul, Mustafa Omer  and
      Hu, Michael Y.  and
      Liu, Jing  and
      Jumelet, Jaap  and
      Linzen, Tal  and
      Mueller, Aaron  and
      Ross, Candace  and
      Shah, Raj Sanjay  and
      Warstadt, Alex  and
      Wilcox, Ethan Gotlieb  and
      Williams, Adina",
    booktitle = "Proceedings of the First BabyLM Workshop",
    month = nov,
    year = "2025",
    address = "Suzhou, China",
    publisher = "Association for Computational Linguistics",
    url = "https://aclanthology.org/2025.babylm-main.26/",
    doi = "10.18653/v1/2025.babylm-main.26",
    pages = "356--379"
}
@inproceedings{lee-etal-2025-understanding,
    title = "Understanding and Enhancing Mamba-Transformer Hybrids for Memory Recall and Language Modeling",
    author = "Lee, Hyunji  and
      Yu, Wenhao  and
      Zhang, Hongming  and
      Ma, Kaixin  and
      Kim, Jiyeon  and
      Yu, Dong  and
      Seo, Minjoon",
    editor = "Charpentier, Lucas  and
      Choshen, Leshem  and
      Cotterell, Ryan  and
      Gul, Mustafa Omer  and
      Hu, Michael Y.  and
      Liu, Jing  and
      Jumelet, Jaap  and
      Linzen, Tal  and
      Mueller, Aaron  and
      Ross, Candace  and
      Shah, Raj Sanjay  and
      Warstadt, Alex  and
      Wilcox, Ethan Gotlieb  and
      Williams, Adina",
    booktitle = "Proceedings of the First BabyLM Workshop",
    month = nov,
    year = "2025",
    address = "Suzhou, China",
    publisher = "Association for Computational Linguistics",
    url = "https://aclanthology.org/2025.babylm-main.27/",
    doi = "10.18653/v1/2025.babylm-main.27",
    pages = "380--398"
}
@inproceedings{charpentier-etal-2025-findings,
    title = "Findings of the Third {B}aby{LM} Challenge: Accelerating Language Modeling Research with Cognitively Plausible Data",
    author = "Charpentier, Lucas  and
      Choshen, Leshem  and
      Cotterell, Ryan  and
      Gul, Mustafa Omer  and
      Hu, Michael Y.  and
      Liu, Jing  and
      Jumelet, Jaap  and
      Linzen, Tal  and
      Mueller, Aaron  and
      Ross, Candace  and
      Shah, Raj Sanjay  and
      Warstadt, Alex  and
      Wilcox, Ethan Gotlieb  and
      Williams, Adina",
    editor = "Charpentier, Lucas  and
      Choshen, Leshem  and
      Cotterell, Ryan  and
      Gul, Mustafa Omer  and
      Hu, Michael Y.  and
      Liu, Jing  and
      Jumelet, Jaap  and
      Linzen, Tal  and
      Mueller, Aaron  and
      Ross, Candace  and
      Shah, Raj Sanjay  and
      Warstadt, Alex  and
      Wilcox, Ethan Gotlieb  and
      Williams, Adina",
    booktitle = "Proceedings of the First BabyLM Workshop",
    month = nov,
    year = "2025",
    address = "Suzhou, China",
    publisher = "Association for Computational Linguistics",
    url = "https://aclanthology.org/2025.babylm-main.28/",
    doi = "10.18653/v1/2025.babylm-main.28",
    pages = "399--420"
}
@inproceedings{padovani-etal-2025-dialogue,
    title = "Dialogue Is Not Enough to Make a Communicative {B}aby{LM} (But Neither Is Developmentally Inspired Reinforcement Learning)",
    author = "Padovani, Francesca  and
      Bunzeck, Bastian  and
      Ali, Manar  and
      Momen, Omar  and
      Bisazza, Arianna  and
      Buschmeier, Hendrik  and
      Zarrie{\ss}, Sina",
    editor = "Charpentier, Lucas  and
      Choshen, Leshem  and
      Cotterell, Ryan  and
      Gul, Mustafa Omer  and
      Hu, Michael Y.  and
      Liu, Jing  and
      Jumelet, Jaap  and
      Linzen, Tal  and
      Mueller, Aaron  and
      Ross, Candace  and
      Shah, Raj Sanjay  and
      Warstadt, Alex  and
      Wilcox, Ethan Gotlieb  and
      Williams, Adina",
    booktitle = "Proceedings of the First BabyLM Workshop",
    month = nov,
    year = "2025",
    address = "Suzhou, China",
    publisher = "Association for Computational Linguistics",
    url = "https://aclanthology.org/2025.babylm-main.29/",
    doi = "10.18653/v1/2025.babylm-main.29",
    pages = "421--435"
}
@inproceedings{capone-etal-2025-class,
    title = "{CLASS}-{IT}: Conversational and Lecture-Aligned Small-Scale Instruction Tuning for {B}aby{LM}s",
    author = "Capone, Luca  and
      Bondielli, Alessandro  and
      Lenci, Alessandro",
    editor = "Charpentier, Lucas  and
      Choshen, Leshem  and
      Cotterell, Ryan  and
      Gul, Mustafa Omer  and
      Hu, Michael Y.  and
      Liu, Jing  and
      Jumelet, Jaap  and
      Linzen, Tal  and
      Mueller, Aaron  and
      Ross, Candace  and
      Shah, Raj Sanjay  and
      Warstadt, Alex  and
      Wilcox, Ethan Gotlieb  and
      Williams, Adina",
    booktitle = "Proceedings of the First BabyLM Workshop",
    month = nov,
    year = "2025",
    address = "Suzhou, China",
    publisher = "Association for Computational Linguistics",
    url = "https://aclanthology.org/2025.babylm-main.30/",
    doi = "10.18653/v1/2025.babylm-main.30",
    pages = "436--444"
}
@inproceedings{edman-fraser-2025-mask,
    title = "Mask and You Shall Receive: Optimizing Masked Language Modeling For Pretraining {B}aby{LM}s",
    author = "Edman, Lukas  and
      Fraser, Alexander",
    editor = "Charpentier, Lucas  and
      Choshen, Leshem  and
      Cotterell, Ryan  and
      Gul, Mustafa Omer  and
      Hu, Michael Y.  and
      Liu, Jing  and
      Jumelet, Jaap  and
      Linzen, Tal  and
      Mueller, Aaron  and
      Ross, Candace  and
      Shah, Raj Sanjay  and
      Warstadt, Alex  and
      Wilcox, Ethan Gotlieb  and
      Williams, Adina",
    booktitle = "Proceedings of the First BabyLM Workshop",
    month = nov,
    year = "2025",
    address = "Suzhou, China",
    publisher = "Association for Computational Linguistics",
    url = "https://aclanthology.org/2025.babylm-main.31/",
    doi = "10.18653/v1/2025.babylm-main.31",
    pages = "445--453"
}
@inproceedings{martins-etal-2025-upon,
    title = "Once Upon a Time: Interactive Learning for Storytelling with Small Language Models",
    author = "Mayer Martins, Jonas  and
      Bashir, Ali Hamza  and
      Khalid, Muhammad Rehan  and
      Beinborn, Lisa",
    editor = "Charpentier, Lucas  and
      Choshen, Leshem  and
      Cotterell, Ryan  and
      Gul, Mustafa Omer  and
      Hu, Michael Y.  and
      Liu, Jing  and
      Jumelet, Jaap  and
      Linzen, Tal  and
      Mueller, Aaron  and
      Ross, Candace  and
      Shah, Raj Sanjay  and
      Warstadt, Alex  and
      Wilcox, Ethan Gotlieb  and
      Williams, Adina",
    booktitle = "Proceedings of the First BabyLM Workshop",
    month = nov,
    year = "2025",
    address = "Suzhou, China",
    publisher = "Association for Computational Linguistics",
    url = "https://aclanthology.org/2025.babylm-main.32/",
    doi = "10.18653/v1/2025.babylm-main.32",
    pages = "454--468"
}
@inproceedings{kamzela-etal-2025-llm,
    title = "You are an {LLM} teaching a smaller model everything you know: Multi-task pretraining of language models with {LLM}-designed study plans",
    author = "Kamzela, Wiktor  and
      Lango, Mateusz  and
      Du{\v{s}}ek, Ond{\v{r}}ej",
    editor = "Charpentier, Lucas  and
      Choshen, Leshem  and
      Cotterell, Ryan  and
      Gul, Mustafa Omer  and
      Hu, Michael Y.  and
      Liu, Jing  and
      Jumelet, Jaap  and
      Linzen, Tal  and
      Mueller, Aaron  and
      Ross, Candace  and
      Shah, Raj Sanjay  and
      Warstadt, Alex  and
      Wilcox, Ethan Gotlieb  and
      Williams, Adina",
    booktitle = "Proceedings of the First BabyLM Workshop",
    month = nov,
    year = "2025",
    address = "Suzhou, China",
    publisher = "Association for Computational Linguistics",
    url = "https://aclanthology.org/2025.babylm-main.33/",
    doi = "10.18653/v1/2025.babylm-main.33",
    pages = "469--487"
}
@inproceedings{fysikoudi-etal-2025-active,
    title = "Active Curriculum Language Modeling over a Hybrid Pre-training Method",
    author = "Fysikoudi, Eleni  and
      Lo{\'a}iciga, Sharid  and
      Sayeed, Asad B.",
    editor = "Charpentier, Lucas  and
      Choshen, Leshem  and
      Cotterell, Ryan  and
      Gul, Mustafa Omer  and
      Hu, Michael Y.  and
      Liu, Jing  and
      Jumelet, Jaap  and
      Linzen, Tal  and
      Mueller, Aaron  and
      Ross, Candace  and
      Shah, Raj Sanjay  and
      Warstadt, Alex  and
      Wilcox, Ethan Gotlieb  and
      Williams, Adina",
    booktitle = "Proceedings of the First BabyLM Workshop",
    month = nov,
    year = "2025",
    address = "Suzhou, China",
    publisher = "Association for Computational Linguistics",
    url = "https://aclanthology.org/2025.babylm-main.34/",
    doi = "10.18653/v1/2025.babylm-main.34",
    pages = "488--495"
}
@inproceedings{fusco-etal-2025-linguistic,
    title = "Linguistic Units as Tokens: Intrinsic and Extrinsic Evaluation with {B}aby{LM}",
    author = "Fusco, Achille  and
      Bianchessi, Maria Letizia Piccini  and
      Sgrizzi, Tommaso  and
      Zanollo, Asya  and
      Chesi, Cristiano",
    editor = "Charpentier, Lucas  and
      Choshen, Leshem  and
      Cotterell, Ryan  and
      Gul, Mustafa Omer  and
      Hu, Michael Y.  and
      Liu, Jing  and
      Jumelet, Jaap  and
      Linzen, Tal  and
      Mueller, Aaron  and
      Ross, Candace  and
      Shah, Raj Sanjay  and
      Warstadt, Alex  and
      Wilcox, Ethan Gotlieb  and
      Williams, Adina",
    booktitle = "Proceedings of the First BabyLM Workshop",
    month = nov,
    year = "2025",
    address = "Suzhou, China",
    publisher = "Association for Computational Linguistics",
    url = "https://aclanthology.org/2025.babylm-main.35/",
    doi = "10.18653/v1/2025.babylm-main.35",
    pages = "496--507"
}
@inproceedings{yoshida-etal-2025-batch,
    title = "Batch-wise Convergent Pre-training: Step-by-Step Learning Inspired by Child Language Development",
    author = "Yoshida, Ko  and
      Shiono, Daiki  and
      Sato, Kai  and
      Miura, Toko  and
      Furuhashi, Momoka  and
      Suzuki, Jun",
    editor = "Charpentier, Lucas  and
      Choshen, Leshem  and
      Cotterell, Ryan  and
      Gul, Mustafa Omer  and
      Hu, Michael Y.  and
      Liu, Jing  and
      Jumelet, Jaap  and
      Linzen, Tal  and
      Mueller, Aaron  and
      Ross, Candace  and
      Shah, Raj Sanjay  and
      Warstadt, Alex  and
      Wilcox, Ethan Gotlieb  and
      Williams, Adina",
    booktitle = "Proceedings of the First BabyLM Workshop",
    month = nov,
    year = "2025",
    address = "Suzhou, China",
    publisher = "Association for Computational Linguistics",
    url = "https://aclanthology.org/2025.babylm-main.36/",
    doi = "10.18653/v1/2025.babylm-main.36",
    pages = "508--524"
}
@inproceedings{kumar-etal-2025-pretraining,
    title = "Pretraining Language Models with {L}o{RA} and Artificial Languages",
    author = "Kumar, Nalin  and
      Lango, Mateusz  and
      Du{\v{s}}ek, Ond{\v{r}}ej",
    editor = "Charpentier, Lucas  and
      Choshen, Leshem  and
      Cotterell, Ryan  and
      Gul, Mustafa Omer  and
      Hu, Michael Y.  and
      Liu, Jing  and
      Jumelet, Jaap  and
      Linzen, Tal  and
      Mueller, Aaron  and
      Ross, Candace  and
      Shah, Raj Sanjay  and
      Warstadt, Alex  and
      Wilcox, Ethan Gotlieb  and
      Williams, Adina",
    booktitle = "Proceedings of the First BabyLM Workshop",
    month = nov,
    year = "2025",
    address = "Suzhou, China",
    publisher = "Association for Computational Linguistics",
    url = "https://aclanthology.org/2025.babylm-main.37/",
    doi = "10.18653/v1/2025.babylm-main.37",
    pages = "525--530"
}
@inproceedings{kosmopoulou-etal-2025-masked,
    title = "Masked Diffusion Language Models with Frequency-Informed Training",
    author = "Kosmopoulou, Despoina  and
      Georgiou, Efthymios  and
      Dorovatas, Vaggelis  and
      Paraskevopoulos, Georgios  and
      Potamianos, Alexandros",
    editor = "Charpentier, Lucas  and
      Choshen, Leshem  and
      Cotterell, Ryan  and
      Gul, Mustafa Omer  and
      Hu, Michael Y.  and
      Liu, Jing  and
      Jumelet, Jaap  and
      Linzen, Tal  and
      Mueller, Aaron  and
      Ross, Candace  and
      Shah, Raj Sanjay  and
      Warstadt, Alex  and
      Wilcox, Ethan Gotlieb  and
      Williams, Adina",
    booktitle = "Proceedings of the First BabyLM Workshop",
    month = nov,
    year = "2025",
    address = "Suzhou, China",
    publisher = "Association for Computational Linguistics",
    url = "https://aclanthology.org/2025.babylm-main.38/",
    doi = "10.18653/v1/2025.babylm-main.38",
    pages = "531--539"
}
@inproceedings{tapaninaho-2025-moep,
    title = "{M}o{EP}: Modular Expert Paths for Sample-Efficient Language Modeling",
    author = "Tapaninaho, Joonas",
    editor = "Charpentier, Lucas  and
      Choshen, Leshem  and
      Cotterell, Ryan  and
      Gul, Mustafa Omer  and
      Hu, Michael Y.  and
      Liu, Jing  and
      Jumelet, Jaap  and
      Linzen, Tal  and
      Mueller, Aaron  and
      Ross, Candace  and
      Shah, Raj Sanjay  and
      Warstadt, Alex  and
      Wilcox, Ethan Gotlieb  and
      Williams, Adina",
    booktitle = "Proceedings of the First BabyLM Workshop",
    month = nov,
    year = "2025",
    address = "Suzhou, China",
    publisher = "Association for Computational Linguistics",
    url = "https://aclanthology.org/2025.babylm-main.39/",
    doi = "10.18653/v1/2025.babylm-main.39",
    pages = "540--547"
}
@inproceedings{tampier-etal-2025-recombitext,
    title = "{R}ecombi{T}ext: Compositional Data Augmentation for Enhancing {LLM} Pre-Training Datasets in Low-Resource Scenarios",
    author = "Tampier, Alexander  and
      Thoma, Lukas  and
      Schoenegger, Loris  and
      Roth, Benjamin",
    editor = "Charpentier, Lucas  and
      Choshen, Leshem  and
      Cotterell, Ryan  and
      Gul, Mustafa Omer  and
      Hu, Michael Y.  and
      Liu, Jing  and
      Jumelet, Jaap  and
      Linzen, Tal  and
      Mueller, Aaron  and
      Ross, Candace  and
      Shah, Raj Sanjay  and
      Warstadt, Alex  and
      Wilcox, Ethan Gotlieb  and
      Williams, Adina",
    booktitle = "Proceedings of the First BabyLM Workshop",
    month = nov,
    year = "2025",
    address = "Suzhou, China",
    publisher = "Association for Computational Linguistics",
    url = "https://aclanthology.org/2025.babylm-main.40/",
    doi = "10.18653/v1/2025.babylm-main.40",
    pages = "548--565"
}
% NOTE(review): the doi below was added to match the 10.18653/v1/<anthology-id>
% pattern used by the sibling entries of this volume; confirm that it resolves.
@inproceedings{aynetdinov-akbik-2025-babies,
    title = "Babies Learn to Look Ahead: Multi-Token Prediction in Small {LM}s",
    author = "Aynetdinov, Ansar  and
      Akbik, Alan",
    editor = "Charpentier, Lucas  and
      Choshen, Leshem  and
      Cotterell, Ryan  and
      Gul, Mustafa Omer  and
      Hu, Michael Y.  and
      Liu, Jing  and
      Jumelet, Jaap  and
      Linzen, Tal  and
      Mueller, Aaron  and
      Ross, Candace  and
      Shah, Raj Sanjay  and
      Warstadt, Alex  and
      Wilcox, Ethan Gotlieb  and
      Williams, Adina",
    booktitle = "Proceedings of the First BabyLM Workshop",
    month = nov,
    year = "2025",
    address = "Suzhou, China",
    publisher = "Association for Computational Linguistics",
    url = "https://aclanthology.org/2025.babylm-main.41/",
    doi = "10.18653/v1/2025.babylm-main.41",
    pages = "566--577"
}
