@inproceedings{fillies-etal-2025-comprehensive,
title = "A Comprehensive Taxonomy of Bias Mitigation Methods for Hate Speech Detection",
author = "Fillies, Jan and
Wawerek, Marius and
Paschke, Adrian",
editor = "Calabrese, Agostina and
de Kock, Christine and
Nozza, Debora and
Plaza-del-Arco, Flor Miriam and
Talat, Zeerak and
Vargas, Francielle",
booktitle = "Proceedings of the The 9th Workshop on Online Abuse and Harms (WOAH)",
month = aug,
year = "2025",
address = "Vienna, Austria",
publisher = "Association for Computational Linguistics",
url = "https://preview.aclanthology.org/landing_page/2025.woah-1.1/",
pages = "1--16",
ISBN = "979-8-89176-105-6",
abstract = "Algorithmic hate speech detection is widely used today. However, biases within these systems can lead to discrimination. This research presents an overview of bias mitigation strategies in the field of hate speech detection. The identified principles are grouped into four categories, based on their operation principles. A novel taxonomy of bias mitigation methods is proposed. The mitigation strategies are characterized based on their key concepts and analyzed in terms of their application stage and their need for knowledge of protected attributes. Additionally, the paper discusses potential combinations of these strategies. This research shifts the focus from identifying present biases to examining the similarities and differences between mitigation strategies, thereby facilitating the exchange, stacking, and ensembling of these strategies in future research."
}
Markdown (Informal)
[A Comprehensive Taxonomy of Bias Mitigation Methods for Hate Speech Detection](https://preview.aclanthology.org/landing_page/2025.woah-1.1/) (Fillies et al., WOAH 2025)
ACL