SafeDecoding: Defending against Jailbreak Attacks via Safety-Aware Decoding. Xu, Z., Jiang, F., Niu, L., Jia, J., Lin, B. Y., & Poovendran, R. In 62nd Annual Meeting of the Association for Computational Linguistics (ACL), 2024.
bibtex
@inproceedings{xu2024safedecoding,
title={SafeDecoding: Defending against Jailbreak Attacks via Safety-Aware Decoding},
author={Xu, Zhangchen and Jiang, Fengqing and Niu, Luyao and Jia, Jinyuan and Lin, Bill Yuchen and Poovendran, Radha},
booktitle={62nd Annual Meeting of the Association for Computational Linguistics (ACL)},
year={2024},
addendum = {\textcolor{blue}{Oral}}
}
Downloads: 0
{"_id":"jmFTB3HbpBhGmjzBS","bibbaseid":"xu-jiang-niu-jia-lin-poovendran-safedecodingdefendingagainstjailbreakattacksviasafetyawaredecoding-2024","author_short":["Xu, Z.","Jiang, F.","Niu, L.","Jia, J.","Lin, B. Y.","Poovendran, R."],"bibdata":{"bibtype":"inproceedings","type":"inproceedings","title":"SafeDecoding: Defending against Jailbreak Attacks via Safety-Aware Decoding","author":[{"propositions":[],"lastnames":["Xu"],"firstnames":["Zhangchen"],"suffixes":[]},{"propositions":[],"lastnames":["Jiang"],"firstnames":["Fengqing"],"suffixes":[]},{"propositions":[],"lastnames":["Niu"],"firstnames":["Luyao"],"suffixes":[]},{"propositions":[],"lastnames":["Jia"],"firstnames":["Jinyuan"],"suffixes":[]},{"propositions":[],"lastnames":["Lin"],"firstnames":["Bill","Yuchen"],"suffixes":[]},{"propositions":[],"lastnames":["Poovendran"],"firstnames":["Radha"],"suffixes":[]}],"booktitle":"62nd Annual Meeting of the Association for Computational Linguistics (ACL)","year":"2024","addendum":"\\textcolorblueOral","bibtex":"@inproceedings{xu2024safedecoding,\n\ttitle={SafeDecoding: Defending against Jailbreak Attacks via Safety-Aware Decoding},\n\tauthor={Xu, Zhangchen and Jiang, Fengqing and Niu, Luyao and Jia, Jinyuan and Lin, Bill Yuchen and Poovendran, Radha},\n\tbooktitle={62nd Annual Meeting of the Association for Computational Linguistics (ACL)},\n\tyear={2024},\n\taddendum = {\\textcolor{blue}{Oral}}\n}\n\n\n","author_short":["Xu, Z.","Jiang, F.","Niu, L.","Jia, J.","Lin, B. Y.","Poovendran, R."],"key":"xu2024safedecoding","id":"xu2024safedecoding","bibbaseid":"xu-jiang-niu-jia-lin-poovendran-safedecodingdefendingagainstjailbreakattacksviasafetyawaredecoding-2024","role":"author","urls":{},"metadata":{"authorlinks":{}}},"bibtype":"inproceedings","biburl":"https://raw.githubusercontent.com/luyaoniu/luyaoniu.github.io/master/mybib.bib","dataSources":["YcYEQEQwKynzxML7W"],"keywords":[],"search_terms":["safedecoding","defending","against","jailbreak","attacks","via","safety","aware","decoding","xu","jiang","niu","jia","lin","poovendran"],"title":"SafeDecoding: Defending against Jailbreak Attacks via Safety-Aware Decoding","year":2024}