@inproceedings{fan-chen-2026-reprohum,
title = "{R}epro{H}um {\#}0866-04: Variability in Human Judgments of Sociopolitical Acceptability Across Studies",
author = "Fan, Rui and
Chen, Guanyi",
editor = "Mille, Simon and
Gehrmann, Sebastian and
Schmidtov{\'a}, Patr{\'i}cia and
Du{\v{s}}ek, Ond{\v{r}}ej and
Fadaee, Marzieh and
Lo, Kyle and
Santus, Enrico and
Stanovsky, Gabriel",
booktitle = "Proceedings of the Fifth Workshop on Generation, Evaluation and Metrics ({GEM})",
month = jul,
year = "2026",
address = "San Diego, California, USA",
publisher = "Association for Computational Linguistics",
url = "https://preview.aclanthology.org/ingest-acl-workshops/2026.gem-main.87/",
pages = "1104--1110",
ISBN = "979-8-89176-423-1",
abstract = "Human evaluations are essential for assessing NLP systems, but their reproducibility can be limited when judgments involve socially sensitive constructs. This paper reproduces the perceived sociopolitical acceptability evaluation in (CITATION), where annotators judged whether model-generated writer-intent implications reflected mainstream or fringe viewpoints. Using the same 600 headline{--}belief pairs, we collected new annotations on Prolific and compared our results with both the original study and a prior reproduction. Our scores are lower than the original results. Under a 70{\%} threshold, these findings do not support the original conclusion that most generations were socially acceptable. Overall, our results align more closely with the prior reproduction, while also showing substantial variability, especially for GPT2-large. We argue that this variability may arise from a combination of platform differences, task framing, topic effects, and changes in social context over time. These findings highlight the importance of reporting not only annotation results, but also the evaluation setting in which subjective social judgments are collected."
}Markdown (Informal)
[ReproHum #0866-04: Variability in Human Judgments of Sociopolitical Acceptability Across Studies](https://preview.aclanthology.org/ingest-acl-workshops/2026.gem-main.87/) (Fan & Chen, GEM 2026)
ACL