@inproceedings{meisenbacher-etal-2025-impact,
title = "On the Impact of Noise in Differentially Private Text Rewriting",
author = "Meisenbacher, Stephen and
Chevli, Maulik and
Matthes, Florian",
editor = "Chiruzzo, Luis and
Ritter, Alan and
Wang, Lu",
booktitle = "Findings of the Association for Computational Linguistics: NAACL 2025",
month = apr,
year = "2025",
address = "Albuquerque, New Mexico",
publisher = "Association for Computational Linguistics",
url = "https://preview.aclanthology.org/Ingest-2025-COMPUTEL/2025.findings-naacl.32/",
pages = "514--532",
ISBN = "979-8-89176-195-7",
abstract = "The field of text privatization often leverages the notion of *Differential Privacy* (DP) to provide formal guarantees in the rewriting or obfuscation of sensitive textual data. A common and nearly ubiquitous form of DP application necessitates the addition of calibrated noise to vector representations of text, either at the data- or model-level, which is governed by the privacy parameter $\varepsilon$. However, noise addition almost undoubtedly leads to considerable utility loss, thereby highlighting one major drawback of DP in NLP. In this work, we introduce a new sentence infilling privatization technique, and we use this method to explore the effect of noise in DP text rewriting. We empirically demonstrate that non-DP privatization techniques excel in utility preservation and can find an acceptable empirical privacy-utility trade-off, yet cannot outperform DP methods in empirical privacy protections. Our results highlight the significant impact of noise in current DP rewriting mechanisms, leading to a discussion of the merits and challenges of DP in NLP as well as the opportunities that non-DP methods present."
}
Markdown (Informal)
[On the Impact of Noise in Differentially Private Text Rewriting](https://preview.aclanthology.org/Ingest-2025-COMPUTEL/2025.findings-naacl.32/) (Meisenbacher et al., Findings 2025)
ACL