% Zhang et al., "Random Smooth-based Certified Defense against Text Adversarial Attack",
% Findings of the ACL: EACL 2024, pp. 1251--1265 (Anthology ID 2024.findings-eacl.83).
% The url field uses the canonical aclanthology.org landing page rather than a
% preview.aclanthology.org branch build.
@inproceedings{zhang-etal-2024-random,
  title     = {Random Smooth-based Certified Defense against Text Adversarial Attack},
  author    = {Zhang, Zeliang and
               Yao, Wei and
               Liang, Susan and
               Xu, Chenliang},
  editor    = {Graham, Yvette and
               Purver, Matthew},
  booktitle = {Findings of the Association for Computational Linguistics: EACL 2024},
  month     = mar,
  year      = {2024},
  address   = {St. Julian{'}s, Malta},
  publisher = {Association for Computational Linguistics},
  url       = {https://aclanthology.org/2024.findings-eacl.83/},
  pages     = {1251--1265},
  abstract  = {Certified defense methods have identified their effectiveness against textual adversarial examples, which train models on the worst-case text generated by substituting words in original texts with synonyms. However, due to the discrete word embedding representations, the large search space hinders the robust training efficiency, resulting in significant time consumption. To overcome this challenge, motivated by the observation that synonym embedding has a small distance, we propose to treat the word substitution as a continuous perturbation on the word embedding representation. The proposed method Text-RS applies random smooth techniques to approximate the word substitution operation, offering a computationally efficient solution that outperforms conventional discrete methods and improves the robustness in training. The evaluation results demonstrate its effectiveness in defending against multiple textual adversarial attacks.},
}
Markdown (Informal)
[Random Smooth-based Certified Defense against Text Adversarial Attack](https://aclanthology.org/2024.findings-eacl.83/) (Zhang et al., Findings 2024)
ACL