% Conference paper from the Findings of ACL 2026 volume.
% NOTE(review): `url` points at a preview.aclanthology.org/ingest-acl address,
% which looks like a staging path -- confirm, and switch to the permanent URL
% (or add a `doi`) once one is available.
@inproceedings{jiang-etal-2026-leveraging,
  title     = {Leveraging Human and Machine Preferences for Zero-shot Detection of {AI}-Generated Text},
  author    = {Jiang, Lei and
               Wu, Desheng and
               Zheng, Xiaolong and
               Luo, Cuicui},
  editor    = {Liakata, Maria and
               Moreira, Viviane P. and
               Zhang, Jiajun and
               Jurgens, David},
  booktitle = {Findings of the {Association} for {Computational} {Linguistics}: {ACL} 2026},
  month     = jul,
  year      = {2026},
  address   = {San Diego, California, United States},
  publisher = {Association for Computational Linguistics},
  url       = {https://preview.aclanthology.org/ingest-acl/2026.findings-acl.671/},
  pages     = {13732--13750},
  isbn      = {979-8-89176-395-1},
  abstract  = {In recent years, the rapid advancement of large language models (LLMs) has enabled generated texts to closely mimic human writing, posing significant challenges to the detection of AI-generated content. Current mainstream zero-shot detection methods largely adopt a machine-centric perspective, relying on proxy models to compute token-level AI-likelihood scores and treating all tokens equally during overall detection. However, such approaches overlook the prediction discrepancies that arise when humans and large language models interpret the same text. We argue that tokens exhibiting greater divergence between human and machine predictions can provide stronger clues for determining the authorship of a text. To address this limitation, we propose HAPDA{---}a human-machine prediction discrepancy adapter for AI-generated text detection (AGTD). The framework consists of two core components: (1) a joint fine-tuning strategy for training paired human-preference and machine-preference models, and (2) a discrepancy-aware reweighting mechanism designed to calibrate token-level detection scores in downstream detectors. Extensive experiments demonstrate that HAPDA consistently and significantly enhances the detection performance of five representative baseline models under various evaluation scenarios.},
}
Markdown (Informal)
[Leveraging Human and Machine Preferences for Zero-shot Detection of AI-Generated Text](https://preview.aclanthology.org/ingest-acl/2026.findings-acl.671/) (Jiang et al., Findings 2026)
ACL