@inproceedings{hao-etal-2025-learning,
title = "Learning to Rewrite: Generalized {LLM}-Generated Text Detection",
author = "Hao, Wei and
Li, Ran and
Zhao, Weiliang and
Yang, Junfeng and
Mao, Chengzhi",
editor = "Che, Wanxiang and
Nabende, Joyce and
Shutova, Ekaterina and
Pilehvar, Mohammad Taher",
booktitle = "Proceedings of the 63rd Annual Meeting of the Association for Computational Linguistics (Volume 1: Long Papers)",
month = jul,
year = "2025",
address = "Vienna, Austria",
publisher = "Association for Computational Linguistics",
url = "https://preview.aclanthology.org/ingestion-acl-25/2025.acl-long.322/",
pages = "6421--6434",
ISBN = "979-8-89176-251-0",
abstract = "Detecting text generated by Large Language Models (LLMs) is crucial, yet current detectors often struggle to generalize in open-world settings. We introduce Learning2Rewrite, a novel framework to detect LLM-generated text with exceptional generalization to unseen domains. Capitalized on the finding that LLMs inherently modify LLM-generated content less than human-written text when rewriting, we train an LLM to amplify this disparity, yielding a more distinguishable and generalizable edit distance across diverse text distributions. Extensive experiments on data from 21 independent domains and four major LLMs (GPT-3.5, GPT-4, Gemini, and Llama-3) demonstrate that our detector outperforms state-of-the-art detection methods by up to 23.04{\%} in AUROC for in-distribution tests, 35.10{\%} for out-of-distribution tests, and 48.66{\%} under adversarial attacks. Our unique training objective ensures better generalizability compared to directly training for classification, even when leveraging the same amount of tunable parameters. Our findings suggest that reinforcing LLMs' inherent rewriting tendencies offers a robust and scalable solution for detecting LLM-generated text."
}
Markdown (Informal)
[Learning to Rewrite: Generalized LLM-Generated Text Detection](https://preview.aclanthology.org/ingestion-acl-25/2025.acl-long.322/) (Hao et al., ACL 2025)
ACL
- Wei Hao, Ran Li, Weiliang Zhao, Junfeng Yang, and Chengzhi Mao. 2025. Learning to Rewrite: Generalized LLM-Generated Text Detection. In Proceedings of the 63rd Annual Meeting of the Association for Computational Linguistics (Volume 1: Long Papers), pages 6421–6434, Vienna, Austria. Association for Computational Linguistics.