% Conference paper entry; fields are laid out one per line and brace-delimited.
% NOTE(review): the url field targets the preview.aclanthology.org ingest host --
% confirm whether the canonical aclanthology.org address should be used instead.
@inproceedings{chen-etal-2026-sparse,
  title     = {Sparse Growing Transformer: Training-Time Sparse Depth Allocation via Progressive Attention Looping},
  author    = {Chen, Yao and Chen, Yilong and Yang, Yinqi and Shang, Junyuan and Zhang, Zhenyu and Zhang, Zefeng and Nie, Shuaiyi and Wang, Shuohuan and Sun, Yu and Wu, Hua and Wang, Haifeng and Liu, Tingwen},
  editor    = {Liakata, Maria and Moreira, Viviane P. and Zhang, Jiajun and Jurgens, David},
  booktitle = {Findings of the {A}ssociation for {C}omputational {L}inguistics: {ACL} 2026},
  month     = jul,
  year      = {2026},
  address   = {San Diego, California, United States},
  publisher = {Association for Computational Linguistics},
  url       = {https://preview.aclanthology.org/ingest-acl/2026.findings-acl.307/},
  pages     = {6168--6193},
  isbn      = {979-8-89176-395-1},
}