@inproceedings{huang-etal-2026-gmfl,
title = "{GMFL}: Efficient Global Masking for Federated {LLM} Fine-tuning",
author = "Huang, Xin and
Hu, Yan and
Gong, Yue-Jiao and
Zhang, Xinglin",
editor = "Liakata, Maria and
Moreira, Viviane P. and
Zhang, Jiajun and
Jurgens, David",
booktitle = "Proceedings of the 64th Annual Meeting of the {A}ssociation for {C}omputational {L}inguistics (Volume 1: Long Papers)",
month = jul,
year = "2026",
address = "San Diego, California, United States",
publisher = "Association for Computational Linguistics",
url = "https://preview.aclanthology.org/ingest-acl/2026.acl-long.1160/",
pages = "25293--25312",
ISBN = "979-8-89176-390-6",
abstract = "Low-Rank Adaptation (LoRA) has emerged as a prominent solution to mitigate the communication and computation costs in federated fine-tuning of Large Language Models (LLMs). However, we observe that even within low-rank adapters, a substantial portion of parameters manifest negligible updates during federated training, leading to redundant communication and wasted local computation. To address this, we propose \textbf{GMFL}, a \textbf{plug-and-play} layer freezing mechanism designed to \textbf{seamlessly integrate} with existing federated fine-tuning frameworks. Specifically, the server monitors the global update magnitude of each LoRA layer to dynamically generate freezing masks. These masks are updated periodically with a fixed freezing rate, ensuring stable convergence by robustly identifying ``saturated'' layers. Theoretical analysis confirms the convergence of GMFL, where the freezing mechanism yields a bounded error that scales with client heterogeneity. Extensive experiments across multiple tasks (GLUE, Commonsense Reasoning, Math Reasoning and General Generation) demonstrate that GMFL reduces communication overhead and lowers computational costs while preserving the performance of the underlying federated fine-tuning methods. Our work provides a practical, versatile solution for deploying large-scale federated LLM fine-tuning in resource-constrained environments. Our code is available at: \url{https://github.com/tunx-cyber/GMFL}."
}Markdown (Informal)
[GMFL: Efficient Global Masking for Federated LLM Fine-tuning](https://preview.aclanthology.org/ingest-acl/2026.acl-long.1160/) (Huang et al., ACL 2026)
ACL
- Xin Huang, Yan Hu, Yue-Jiao Gong, and Xinglin Zhang. 2026. GMFL: Efficient Global Masking for Federated LLM Fine-tuning. In Proceedings of the 64th Annual Meeting of the Association for Computational Linguistics (Volume 1: Long Papers), pages 25293–25312, San Diego, California, United States. Association for Computational Linguistics.