@inproceedings{liu-etal-2025-r,
title = "{R}-{L}o{RA}: Randomized Multi-Head {L}o{RA} for Efficient Multi-task Learning",
author = "Liu, Jinda and
Chang, Yi and
Wu, Yuan",
editor = "Christodoulopoulos, Christos and
Chakraborty, Tanmoy and
Rose, Carolyn and
Peng, Violet",
booktitle = "Findings of the Association for Computational Linguistics: EMNLP 2025",
month = nov,
year = "2025",
address = "Suzhou, China",
publisher = "Association for Computational Linguistics",
url = "https://preview.aclanthology.org/author-page-yu-wang-polytechnic/2025.findings-emnlp.35/",
doi = "10.18653/v1/2025.findings-emnlp.35",
pages = "660--674",
ISBN = "979-8-89176-335-7",
abstract = "Fine-tuning large language models (LLMs) is computationally expensive, and Low-Rank Adaptation (LoRA) provides a cost-effective solution by approximating weight updates through low-rank matrices. In real-world scenarios, LLMs are fine-tuned on data from multiple domains to perform tasks across various fields, embodying multi-task learning (MTL). LoRA often underperforms in such complex scenarios. To enhance LoRA{'}s capability in multi-task learning, we propose R-LoRA, which incorporates Multi-Head Randomization. Multi-Head Randomization diversifies the head matrices through Multi-Head Dropout and Multi-Head Random Initialization, enabling more efficient learning of task-specific features while maintaining shared knowledge representation. Our approach not only improves performance in MTL but also reduces GPU memory usage and training time. Experiments show that R-LoRA{'}s gains stem from increased diversity in the head matrices, demonstrating its effectiveness for multi-task learning. The code is open-sourced."
}
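The abstract describes Multi-Head Randomization only at a high level. The sketch below is a minimal, hypothetical illustration of what a multi-head LoRA adapter with a shared down-projection, per-head dropout, and non-identical random head initialization could look like; it is not the authors' released implementation, and the class and parameter names (`MultiHeadLoRALayer`, `num_heads`, `head_dropout`) are invented for this example.

```python
# Minimal sketch of the idea in the abstract: a LoRA-style adapter with a
# shared down-projection A and several "head" up-projections B_k, where the
# heads are diversified via per-head dropout and differing random inits.
# This is an illustrative assumption, not the paper's actual code.
import torch
import torch.nn as nn


class MultiHeadLoRALayer(nn.Module):
    def __init__(self, in_features, out_features, rank=8, num_heads=4,
                 head_dropout=0.1, alpha=16.0):
        super().__init__()
        # Frozen base weight (stand-in for the pretrained linear layer).
        self.base = nn.Linear(in_features, out_features, bias=False)
        self.base.weight.requires_grad_(False)

        # Shared low-rank down-projection A.
        self.lora_A = nn.Parameter(torch.empty(rank, in_features))
        nn.init.kaiming_uniform_(self.lora_A, a=5 ** 0.5)

        # Multiple head matrices B_k, each with its own random initialization
        # (rather than one zero-initialized B) so the heads start out diverse.
        self.lora_B = nn.ParameterList()
        for _ in range(num_heads):
            head = nn.Parameter(torch.empty(out_features, rank))
            nn.init.normal_(head, mean=0.0, std=0.02)
            self.lora_B.append(head)

        # Independent dropout per head further decorrelates what each head sees.
        self.head_dropouts = nn.ModuleList(
            nn.Dropout(head_dropout) for _ in range(num_heads)
        )
        self.scaling = alpha / rank

    def forward(self, x):
        # Frozen base path.
        result = self.base(x)
        # Shared low-rank projection.
        z = x @ self.lora_A.t()
        # Average the head outputs; each head gets its own dropout mask.
        head_out = sum(
            drop(z) @ B.t() for drop, B in zip(self.head_dropouts, self.lora_B)
        ) / len(self.lora_B)
        return result + self.scaling * head_out


# Quick shape check.
layer = MultiHeadLoRALayer(in_features=64, out_features=64)
print(layer(torch.randn(2, 64)).shape)  # torch.Size([2, 64])
```

How the heads are combined, initialized, and regularized in the actual R-LoRA method is specified in the paper and its open-sourced code; the averaging and normal initialization above are simplifying assumptions for illustration only.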