@inproceedings{yan-etal-2026-text,
title = "Text-Guided Multi-Scale Frequency Representation Adaptation",
author = "Yan, Weicai and
Ma, Xinhua and
Lin, Wang and
Jin, Tao",
editor = "Liakata, Maria and
Moreira, Viviane P. and
Zhang, Jiajun and
Jurgens, David",
booktitle = "Proceedings of the 64th Annual Meeting of the {A}ssociation for {C}omputational {L}inguistics (Volume 1: Long Papers)",
month = jul,
year = "2026",
address = "San Diego, California, United States",
publisher = "Association for Computational Linguistics",
url = "https://preview.aclanthology.org/ingest-acl/2026.acl-long.1108/",
pages = "24169--24187",
ISBN = "979-8-89176-390-6",
abstract = "Parameter-efficient fine-tuning methods introduce a small number of training parameters, enabling pre-trained models to adapt rapidly to new data distributions. While these methods have shown promising results, they exhibit notable limitations. First, most existing methods operate in the signal space domain, which results in substantial information redundancy. Second, most existing methods utilize fixed prompts or adaptation layers, failing to fully account for the multi-scale characteristics of signals. To address these challenges, we propose the Multi-Scale \textbf{Freq}uency \textbf{Adapter} (FreqAdapter), which integrates textual information and performs multi-scale fine-tuning of visual signal in the frequency domain. Additionally, we introduce a multi-scale adaptation strategy to optimize receptive fields across different frequency ranges, further enhancing the model{'}s representational capacity. Extensive experiments on multimodal models, including CLIP and LLaVA, demonstrate that FreqAdapter significantly improves both performance and efficiency. FreqAdapter improves performance with minimal cost and fast convergence within one epoch."
}Markdown (Informal)
[Text-Guided Multi-Scale Frequency Representation Adaptation](https://preview.aclanthology.org/ingest-acl/2026.acl-long.1108/) (Yan et al., ACL 2026)
ACL
- Weicai Yan, Xinhua Ma, Wang Lin, and Tao Jin. 2026. Text-Guided Multi-Scale Frequency Representation Adaptation. In Proceedings of the 64th Annual Meeting of the Association for Computational Linguistics (Volume 1: Long Papers), pages 24169–24187, San Diego, California, United States. Association for Computational Linguistics.