@inproceedings{lei-etal-2024-fast,
title = "Fast Randomized Low-Rank Adaptation of Pre-trained Language Models with {PAC} Regularization",
author = "Lei, Zijian and
Qian, Dong and
Cheung, William",
editor = "Ku, Lun-Wei and
Martins, Andre and
Srikumar, Vivek",
booktitle = "Findings of the Association for Computational Linguistics: ACL 2024",
month = aug,
year = "2024",
address = "Bangkok, Thailand",
publisher = "Association for Computational Linguistics",
url = "https://preview.aclanthology.org/fix-sig-urls/2024.findings-acl.310/",
doi = "10.18653/v1/2024.findings-acl.310",
pages = "5236--5249",
abstract = "Low-rank adaptation (LoRA) achieves parameter efficient fine-tuning for large language models (LLMs) by decomposing the model weight update into a pair of low-rank projection matrices. Yet, the memory overhead restricts it to scale up when the model size increases. We propose Randomized LoRA (RLoRA) which adopts Randomized Walsh-Hadamard Transform to achieve significant reduction in the size of trainable parameters compared to LoRA. At the same time, it allows a PAC-Bayes regularizer to be efficiently incorporated to improve generalization. We evaluate the effectiveness of RLoRA on LLMs RoBERTa, GPT-2 and LLaMA-7B using GLUE, E2E and math reasoning benchmarks. With a much lower memory requirement, RLoRA can give similar performance as the SOTA low-rank adaptation methods for these three tasks and significantly better performance under few-shot settings."
}
Markdown (Informal)
[Fast Randomized Low-Rank Adaptation of Pre-trained Language Models with PAC Regularization](https://preview.aclanthology.org/fix-sig-urls/2024.findings-acl.310/) (Lei et al., Findings 2024)
ACL