@inproceedings{ranaldi-etal-2023-modeling,
title = "Modeling Easiness for Training Transformers with Curriculum Learning",
author = "Ranaldi, Leonardo and
Pucci, Giulia and
Zanzotto, Fabio Massimo",
editor = "Mitkov, Ruslan and
Angelova, Galia",
booktitle = "Proceedings of the 14th International Conference on Recent Advances in Natural Language Processing",
month = sep,
year = "2023",
address = "Varna, Bulgaria",
publisher = "INCOMA Ltd., Shoumen, Bulgaria",
url = "https://preview.aclanthology.org/add-emnlp-2024-awards/2023.ranlp-1.101/",
pages = "937--948",
abstract = "Directly learning from complex examples is generally problematic for humans and machines. Indeed, a better strategy is exposing learners to examples in a reasonable, pedagogically-motivated order. Curriculum Learning (CL) has been proposed to import this strategy when training machine learning models. In this paper, building on Curriculum Learning, we propose a novel, linguistically motivated measure to determine example complexity for organizing examples during learning. Our complexity measure - LRC- is based on length, rarity, and comprehensibility. Our resulting learning model is CL-LRC, that is, CL with LRC. Experiments on downstream tasks show that CL-LRC outperforms existing CL and non-CL methods for training BERT and RoBERTa from scratch. Furthermore, we analyzed different measures, including perplexity, loss, and learning curve of different models pre-trained from scratch, showing that CL-LRC performs better than the state-of-the-art."
}
Markdown (Informal)
[Modeling Easiness for Training Transformers with Curriculum Learning](https://preview.aclanthology.org/add-emnlp-2024-awards/2023.ranlp-1.101/) (Ranaldi et al., RANLP 2023)
ACL