Flirt: Feedback loop in-context red teaming. Mehrabi, N., Goyal, P., Dupuy, C., Hu, Q., Ghosh, S., Zemel, R., Chang, K., Galstyan, A., & Gupta, R. arXiv preprint arXiv:2308.04265, 2023.
bibtex
@article{mehrabi2023flirt,
title={Flirt: Feedback loop in-context red teaming},
author={Mehrabi, Ninareh and Goyal, Palash and Dupuy, Christophe and Hu, Qian and Ghosh, Shalini and Zemel, Richard and Chang, Kai-Wei and Galstyan, Aram and Gupta, Rahul},
journal={arXiv preprint arXiv:2308.04265},
year={2023}
}
Downloads: 0
{"_id":"xi3R8asZNcBsKHPL6","bibbaseid":"mehrabi-goyal-dupuy-hu-ghosh-zemel-chang-galstyan-etal-flirtfeedbackloopincontextredteaming-2023","author_short":["Mehrabi, N.","Goyal, P.","Dupuy, C.","Hu, Q.","Ghosh, S.","Zemel, R.","Chang, K.","Galstyan, A.","Gupta, R."],"bibdata":{"bibtype":"article","type":"article","title":"Flirt: Feedback loop in-context red teaming","author":[{"propositions":[],"lastnames":["Mehrabi"],"firstnames":["Ninareh"],"suffixes":[]},{"propositions":[],"lastnames":["Goyal"],"firstnames":["Palash"],"suffixes":[]},{"propositions":[],"lastnames":["Dupuy"],"firstnames":["Christophe"],"suffixes":[]},{"propositions":[],"lastnames":["Hu"],"firstnames":["Qian"],"suffixes":[]},{"propositions":[],"lastnames":["Ghosh"],"firstnames":["Shalini"],"suffixes":[]},{"propositions":[],"lastnames":["Zemel"],"firstnames":["Richard"],"suffixes":[]},{"propositions":[],"lastnames":["Chang"],"firstnames":["Kai-Wei"],"suffixes":[]},{"propositions":[],"lastnames":["Galstyan"],"firstnames":["Aram"],"suffixes":[]},{"propositions":[],"lastnames":["Gupta"],"firstnames":["Rahul"],"suffixes":[]}],"journal":"arXiv preprint arXiv:2308.04265","year":"2023","bibtex":"@article{mehrabi2023flirt,\n title={Flirt: Feedback loop in-context red teaming},\n author={Mehrabi, Ninareh and Goyal, Palash and Dupuy, Christophe and Hu, Qian and Ghosh, Shalini and Zemel, Richard and Chang, Kai-Wei and Galstyan, Aram and Gupta, Rahul},\n journal={arXiv preprint arXiv:2308.04265},\n year={2023}\n}\n\n","author_short":["Mehrabi, N.","Goyal, P.","Dupuy, C.","Hu, Q.","Ghosh, S.","Zemel, R.","Chang, K.","Galstyan, A.","Gupta, R."],"key":"mehrabi2023flirt","id":"mehrabi2023flirt","bibbaseid":"mehrabi-goyal-dupuy-hu-ghosh-zemel-chang-galstyan-etal-flirtfeedbackloopincontextredteaming-2023","role":"author","urls":{},"metadata":{"authorlinks":{}}},"bibtype":"article","biburl":"https://bibbase.org/network/files/KAtewiFRTiuZwNvKT","dataSources":["X4cHbJwHZ9KiGTWTP","i7b6z6sWxSs3LXqnn","Su9MZR8Mrb2xFN4Rv"],"keywords":[],"search_terms":["flirt","feedback","loop","context","red","teaming","mehrabi","goyal","dupuy","hu","ghosh","zemel","chang","galstyan","gupta"],"title":"Flirt: Feedback loop in-context red teaming","year":2023}