% Workshop paper in the WOAH 2023 proceedings (ACL Anthology ID 2023.woah-1.13).
% Accented letters use BibTeX special-character form, e.g. {\"o}, so they sort and typeset correctly.
@inproceedings{sood-dandapat-2023-problematic,
    title = "Problematic Webpage Identification: A Trilogy of Hatespeech, Search Engines and {GPT}",
    author = "Sood, Ojasvin and
      Dandapat, Sandipan",
    editor = {Chung, Yi-ling and
      R{\"o}ttger, Paul and
      Nozza, Debora and
      Talat, Zeerak and
      Mostafazadeh Davani, Aida},
    booktitle = "The 7th Workshop on Online Abuse and Harms (WOAH)",
    month = jul,
    year = "2023",
    address = "Toronto, Canada",
    publisher = "Association for Computational Linguistics",
    url = "https://aclanthology.org/2023.woah-1.13/",
    doi = "10.18653/v1/2023.woah-1.13",
    pages = "126--137",
    abstract = "In this paper, we introduce a fine-tuned transformer-based model focused on problematic webpage classification to identify webpages promoting hate and violence of various forms. Due to the unavailability of labelled problematic webpage data, first we propose a novel webpage data collection strategy which leverages well-studied short-text hate speech datasets. We have introduced a custom GPT-4 few-shot prompt annotation scheme taking various webpage features to label the prohibitively expensive webpage annotation task. The resulting annotated data is used to build our problematic webpage classification model. We report the accuracy (87.6{\%} F1-score) of our webpage classification model and conduct a detailed comparison of it against other state-of-the-art hate speech classification model on problematic webpage identification task. Finally, we have showcased the importance of various webpage features in identifying a problematic webpage."
}
Markdown (Informal)
[Problematic Webpage Identification: A Trilogy of Hatespeech, Search Engines and GPT](https://aclanthology.org/2023.woah-1.13/) (Sood & Dandapat, WOAH 2023)
ACL