% Conference paper: SEMSTAMP, NAACL 2024 (Long Papers volume).
% Names are stored in "Last, First" form; the event name and dates live in
% eventtitle/eventdate (read by biblatex, ignored by classic BibTeX styles).
@inproceedings{ebb1d1af215a4109a881c3f9b8fb382b,
  author     = {Hou, Abe Bohan and Zhang, Jingyu and He, Tianxing and Wang, Yichen and Chuang, Yung Sung and Wang, Hongwei and Shen, Lingfeng and Van Durme, Benjamin and Khashabi, Daniel and Tsvetkov, Yulia},
  title      = {{SEMSTAMP}: A Semantic Watermark with Paraphrastic Robustness for Text Generation},
  booktitle  = {Proceedings of the 2024 Conference of the North American Chapter of the Association for Computational Linguistics: Human Language Technologies, {NAACL} 2024: Long Papers},
  editor     = {Duh, Kevin and Gomez, Helena and Bethard, Steven},
  publisher  = {Association for Computational Linguistics (ACL)},
  year       = {2024},
  pages      = {4067--4082},
  doi        = {10.18653/v1/2024.naacl-long.226},
  language   = {English},
  eventtitle = {2024 Conference of the North American Chapter of the Association for Computational Linguistics: Human Language Technologies, {NAACL} 2024},
  eventdate  = {2024-06-16/2024-06-21},
  note       = {Publisher Copyright: {\textcopyright} 2024 Association for Computational Linguistics.},
  abstract   = {Existing watermarked generation algorithms employ token-level designs and therefore, are vulnerable to paraphrase attacks. To address this issue, we introduce watermarking on the semantic representation of sentences. We propose SEMSTAMP, a robust sentence-level semantic watermarking algorithm that uses locality-sensitive hashing (LSH) to partition the semantic space of sentences. The algorithm encodes and LSH-hashes a candidate sentence generated by a language model, and conducts rejection sampling until the sampled sentence falls in watermarked partitions in the semantic embedding space. To test the paraphrastic robustness of watermarking algorithms, we propose a ``bigram paraphrase'' attack that produces paraphrases with small bigram overlap with the original sentence. This attack is shown to be effective against existing token-level watermark algorithms, while posing only minor degradations to SEMSTAMP. Experimental results show that our novel semantic watermark algorithm is not only more robust than the previous state-of-the-art method on various paraphrasers and domains, but also better at preserving the quality of generation.},
}