% Conference paper: Findings of the ACL, EACL 2026 (pages 3137--3150).
% NOTE(review): the url field points at a preview.aclanthology.org "ingest-eacl"
% host, which looks like a staging location -- confirm the canonical URL (or add
% a DOI) before relying on this link.
% NOTE(review): address presumably records the conference venue rather than the
% publisher's city -- verify against the bibliography style in use.
@inproceedings{wu-etal-2026-imbalanced,
  author    = {Wu, Runzhe and Samanta, Ankur and Jain, Ayush and Fujimoto, Scott and Kwon, Jeongyeol and Kretzu, Ben and Yu, Youliang and Hassani, Kaveh and Vidolov, Boris and Efroni, Yonathan},
  title     = {Imbalanced Gradients in {RL} Post-Training of Multi-Task {LLM}s},
  editor    = {Demberg, Vera and Inui, Kentaro and Marquez, Llu{\'i}s},
  booktitle = {Findings of the {A}ssociation for {C}omputational {L}inguistics: {EACL} 2026},
  month     = mar,
  year      = {2026},
  address   = {Rabat, Morocco},
  publisher = {Association for Computational Linguistics},
  pages     = {3137--3150},
  isbn      = {979-8-89176-386-9},
  url       = {https://preview.aclanthology.org/ingest-eacl/2026.findings-eacl.164/},
}