% Conference paper from Findings of the ACL: EACL 2024 (pages 896--911).
% Braces in the title keep the hyphenated name Do-Not-Answer and the
% acronym LLMs from being lowercased by sentence-casing bibliography styles.
@inproceedings{wang-etal-2024-answer,
  author    = {Wang, Yuxia and Li, Haonan and Han, Xudong and Nakov, Preslav and Baldwin, Timothy},
  title     = {{Do-Not-Answer}: Evaluating Safeguards in {LLMs}},
  editor    = {Graham, Yvette and Purver, Matthew},
  booktitle = {Findings of the Association for Computational Linguistics: EACL 2024},
  month     = mar,
  year      = {2024},
  address   = {St. Julian{'}s, Malta},
  publisher = {Association for Computational Linguistics},
  pages     = {896--911},
  url       = {https://aclanthology.org/2024.findings-eacl.61/},
}