@inproceedings{kim-etal-2026-marking,
title = "Marking Code Without Breaking It: Code Watermarking for Detecting {LLM}-Generated Code",
author = "Kim, Jungin and
Park, Shinwoo and
Han, Yo-Sub",
editor = "Demberg, Vera and
Inui, Kentaro and
Marquez, Llu{\'i}s",
booktitle = "Findings of the {A}ssociation for {C}omputational {L}inguistics: {EACL} 2026",
month = mar,
year = "2026",
address = "Rabat, Morocco",
publisher = "Association for Computational Linguistics",
url = "https://preview.aclanthology.org/manual-author-scripts/2026.findings-eacl.207/",
pages = "3990--4002",
ISBN = "979-8-89176-386-9",
abstract = "Identifying LLM-generated code through watermarking poses a challenge in preserving functional correctness. Previous methods rely on the assumption that watermarking high-entropy tokens effectively maintains output quality. Our analysis reveals a fundamental limitation of this assumption: syntax-critical tokens such as keywords often exhibit the highest entropy, making existing approaches vulnerable to logic corruption. We present STONE, a syntax-aware watermarking method that embeds watermarks only in non-syntactic tokens and preserves code integrity. For rigorous evaluation, we also introduce STEM, a comprehensive metric that balances three critical dimensions: correctness, detectability, and imperceptibility. Across Python, C++, and Java, STONE preserves correctness, sustains strong detectability, and achieves balanced performance with minimal computational overhead. Our implementation is available at https://github.com/inistory/STONE-watermarking."
}Markdown (Informal)
[Marking Code Without Breaking It: Code Watermarking for Detecting LLM-Generated Code](https://preview.aclanthology.org/manual-author-scripts/2026.findings-eacl.207/) (Kim et al., Findings 2026)
ACL