% ACL 2023 long paper. The url field uses the canonical ACL Anthology address (not a temporary preview build).
@inproceedings{xia-etal-2023-training,
  title     = {Training Trajectories of Language Models Across Scales},
  author    = {Xia, Mengzhou and
               Artetxe, Mikel and
               Zhou, Chunting and
               Lin, Xi Victoria and
               Pasunuru, Ramakanth and
               Chen, Danqi and
               Zettlemoyer, Luke and
               Stoyanov, Veselin},
  editor    = {Rogers, Anna and
               Boyd-Graber, Jordan and
               Okazaki, Naoaki},
  booktitle = {Proceedings of the 61st Annual Meeting of the Association for Computational Linguistics (Volume 1: Long Papers)},
  month     = jul,
  year      = {2023},
  address   = {Toronto, Canada},
  publisher = {Association for Computational Linguistics},
  url       = {https://aclanthology.org/2023.acl-long.767/},
  doi       = {10.18653/v1/2023.acl-long.767},
  pages     = {13711--13738},
}