@inproceedings{loerakker-etal-2024-fine,
title = "Fine-Tuning Language Models on {D}utch Protest Event Tweets",
author = {Loerakker, Meagan and
M{\"u}ter, Laurens and
Schraagen, Marijn},
editor = {H{\"u}rriyeto{\u{g}}lu, Ali and
Tanev, Hristo and
Thapa, Surendrabikram and
Uludo{\u{g}}an, G{\"o}k{\c{c}}e},
booktitle = "Proceedings of the 7th Workshop on Challenges and Applications of Automated Extraction of Socio-political Events from Text (CASE 2024)",
month = mar,
year = "2024",
address = "St. Julians, Malta",
publisher = "Association for Computational Linguistics",
url = "https://aclanthology.org/2024.case-1.2",
pages = "6--23",
abstract = "Being able to obtain timely information about an event, like a protest, becomes increasingly more relevant with the rise of affective polarisation and social unrest over the world. Nowadays, large-scale protests tend to be organised and broadcast through social media. Analysing social media platforms like X has proven to be an effective method to follow events during a protest. Thus, we trained several language models on Dutch tweets to analyse their ability to classify if a tweet expresses discontent, considering these tweets may contain practical information about a protest. Our results show that models pre-trained on Twitter data, including Bernice and TwHIN-BERT, outperform models that are not. Additionally, the results showed that Sentence Transformers is a promising model. The added value of oversampling is greater for models that were not trained on Twitter data. In line with previous work, pre-processing the data did not help a transformer language model to make better predictions.",
}
Markdown (Informal)
[Fine-Tuning Language Models on Dutch Protest Event Tweets](https://aclanthology.org/2024.case-1.2) (Loerakker et al., CASE-WS 2024)
ACL
- Meagan Loerakker, Laurens Müter, and Marijn Schraagen. 2024. Fine-Tuning Language Models on Dutch Protest Event Tweets. In Proceedings of the 7th Workshop on Challenges and Applications of Automated Extraction of Socio-political Events from Text (CASE 2024), pages 6–23, St. Julians, Malta. Association for Computational Linguistics.