@comment{
  Findings of ACL 2026 paper introducing CLewR (curriculum learning with restarts).
  NOTE(review): the url field points at a preview/ingest host
  (preview.aclanthology.org/ingest-acl); confirm whether a canonical Anthology URL
  should replace it before relying on this entry long-term.
  Case-sensitive words are protected with whole-word braces so sentence-casing
  styles keep them intact.
}
@inproceedings{dragomir-etal-2026-clewr,
  title     = {{CLewR}: Curriculum Learning with Restarts for Machine Translation Preference Learning},
  author    = {Dragomir, Alexandra and
               Brad, Florin and
               Ionescu, Radu Tudor},
  editor    = {Liakata, Maria and
               Moreira, Viviane P. and
               Zhang, Jiajun and
               Jurgens, David},
  booktitle = {Findings of the {Association} for {Computational} {Linguistics}: {ACL} 2026},
  month     = jul,
  year      = {2026},
  address   = {San Diego, California, United States},
  publisher = {Association for Computational Linguistics},
  url       = {https://preview.aclanthology.org/ingest-acl/2026.findings-acl.1024/},
  pages     = {20485--20496},
  isbn      = {979-8-89176-395-1},
  abstract  = {Large language models (LLMs) have demonstrated competitive performance in zero-shot multilingual machine translation (MT). Some follow-up works further improved MT performance via preference optimization, but they leave a key aspect largely underexplored: the order in which data samples are given during training. We address this topic by integrating curriculum learning into various state-of-the-art preference optimization algorithms to boost MT performance. We introduce a novel curriculum learning strategy with restarts (CLewR), which reiterates easy-to-hard curriculum multiple times during training to effectively mitigate the catastrophic forgetting of easy examples. We demonstrate consistent gains across several model families (Gemma2, Qwen2.5, Llama3.1) and preference optimization techniques. We publicly release our code at https://github.com/alexandra-dragomir/CLewR.},
}
Markdown (Informal)
[CLewR: Curriculum Learning with Restarts for Machine Translation Preference Learning](https://preview.aclanthology.org/ingest-acl/2026.findings-acl.1024/) (Dragomir et al., Findings 2026)
ACL