@inproceedings{kubik-etal-2025-enhancing,
title = "Enhancing {BERT} Fine-Tuning for Sentiment Analysis in Lower-Resourced Languages",
author = "Kub{\'i}k, Jozef and
Suppa, Marek and
Takac, Martin",
editor = "Inui, Kentaro and
Sakti, Sakriani and
Wang, Haofen and
Wong, Derek F. and
Bhattacharyya, Pushpak and
Banerjee, Biplab and
Ekbal, Asif and
Chakraborty, Tanmoy and
Singh, Dhirendra Pratap",
booktitle = "Proceedings of the 14th International Joint Conference on Natural Language Processing and the 4th Conference of the Asia-Pacific Chapter of the Association for Computational Linguistics",
month = dec,
year = "2025",
address = "Mumbai, India",
publisher = "The Asian Federation of Natural Language Processing and The Association for Computational Linguistics",
url = "https://preview.aclanthology.org/ingest-ijcnlp-aacl/2025.ijcnlp-short.23/",
pages = "260--272",
ISBN = "979-8-89176-299-2",
abstract = "Limited data for low-resource languages typically yields weaker language models (LMs). Since pre-training is compute-intensive, it is more pragmatic to target improvements during fine-tuning. In this work, we examine the use of Active Learning (AL) methods augmented by structured data selection strategies across epochs, which we term `Active Learning schedulers,' to boost the fine-tuning process with a limited amount of training data. We connect the AL process to data clustering and propose an integrated fine-tuning pipeline that systematically combines AL, data clustering, and dynamic data selection schedulers to enhance models' performance. Several experiments on the Slovak, Maltese, Icelandic, and Turkish languages show that the use of clustering during the fine-tuning phase together with novel AL scheduling can for models simultaneously yield annotation savings up to 30{\%} and performance improvements up to four F1 score points, while also providing better fine-tuning stability."
}Markdown (Informal)
[Enhancing BERT Fine-Tuning for Sentiment Analysis in Lower-Resourced Languages](https://preview.aclanthology.org/ingest-ijcnlp-aacl/2025.ijcnlp-short.23/) (Kubík et al., IJCNLP-AACL 2025)
ACL
- Jozef Kubík, Marek Suppa, and Martin Takac. 2025. Enhancing BERT Fine-Tuning for Sentiment Analysis in Lower-Resourced Languages. In Proceedings of the 14th International Joint Conference on Natural Language Processing and the 4th Conference of the Asia-Pacific Chapter of the Association for Computational Linguistics, pages 260–272, Mumbai, India. The Asian Federation of Natural Language Processing and The Association for Computational Linguistics.