@inproceedings{brooks-etal-2024-rise,
title = "The Rise of {AI}-Generated Content in {W}ikipedia",
author = "Brooks, Creston and
Eggert, Samuel and
Peskoff, Denis",
editor = "Lucie-Aim{\'e}e, Lucie and
Fan, Angela and
Gwadabe, Tajuddeen and
Johnson, Isaac and
Petroni, Fabio and
van Strien, Daniel",
booktitle = "Proceedings of the First Workshop on Advancing Natural Language Processing for Wikipedia",
month = nov,
year = "2024",
address = "Miami, Florida, USA",
publisher = "Association for Computational Linguistics",
url = "https://preview.aclanthology.org/fix-sig-urls/2024.wikinlp-1.12/",
doi = "10.18653/v1/2024.wikinlp-1.12",
pages = "67--79",
abstract = "The rise of AI-generated content in popular information sources raises significant concerns about accountability, accuracy, and bias amplification. Beyond directly impacting consumers, the widespread presence of this content poses questions for the long-term viability of training language models on vast internet sweeps. We use GPTZero, a proprietary AI detector, and Binoculars, an open-source alternative, to establish lower bounds on the presence of AI-generated content in recently created Wikipedia pages. Both detectors reveal a marked increase in AI-generated content in recent pages compared to those from before the release of GPT-3.5. With thresholds calibrated to achieve a 1{\%} false positive rate on pre-GPT-3.5 articles, detectors flag over 5{\%} of newly created English Wikipedia articles as AI-generated, with lower percentages for German, French, and Italian articles. Flagged Wikipedia articles are typically of lower quality and are often self-promotional or partial towards a specific viewpoint on controversial topics."
}
Markdown (Informal)
[The Rise of AI-Generated Content in Wikipedia](https://preview.aclanthology.org/fix-sig-urls/2024.wikinlp-1.12/) (Brooks et al., WikiNLP 2024)
ACL
- Creston Brooks, Samuel Eggert, and Denis Peskoff. 2024. The Rise of AI-Generated Content in Wikipedia. In Proceedings of the First Workshop on Advancing Natural Language Processing for Wikipedia, pages 67–79, Miami, Florida, USA. Association for Computational Linguistics.