STEER-BENCH: A Benchmark for Evaluating the Steerability of Large Language Models. Chen, K., He, Z., Shi, T., & Lerman, K. CoRR, 2025.
Paper doi bibtex
@article{DBLP:journals/corr/abs-2505-20645,
author = {Kai Chen and
Zihao He and
Taiwei Shi and
Kristina Lerman},
title = {{STEER-BENCH:} {A} Benchmark for Evaluating the Steerability of Large
Language Models},
journal = {CoRR},
volume = {abs/2505.20645},
year = {2025},
url = {https://doi.org/10.48550/arXiv.2505.20645},
doi = {10.48550/ARXIV.2505.20645},
eprinttype = {arXiv},
eprint = {2505.20645},
timestamp = {Fri, 27 Jun 2025 01:00:00 +0200},
biburl = {https://dblp.org/rec/journals/corr/abs-2505-20645.bib},
bibsource = {dblp computer science bibliography, https://dblp.org}
}
Downloads: 0
{"_id":"aFeG5narC3oybEMXv","bibbaseid":"chen-he-shi-lerman-steerbenchabenchmarkforevaluatingthesteerabilityoflargelanguagemodels-2025","author_short":["Chen, K.","He, Z.","Shi, T.","Lerman, K."],"bibdata":{"bibtype":"article","type":"article","author":[{"firstnames":["Kai"],"propositions":[],"lastnames":["Chen"],"suffixes":[]},{"firstnames":["Zihao"],"propositions":[],"lastnames":["He"],"suffixes":[]},{"firstnames":["Taiwei"],"propositions":[],"lastnames":["Shi"],"suffixes":[]},{"firstnames":["Kristina"],"propositions":[],"lastnames":["Lerman"],"suffixes":[]}],"title":"STEER-BENCH: A Benchmark for Evaluating the Steerability of Large Language Models","journal":"CoRR","volume":"abs/2505.20645","year":"2025","url":"https://doi.org/10.48550/arXiv.2505.20645","doi":"10.48550/ARXIV.2505.20645","eprinttype":"arXiv","eprint":"2505.20645","timestamp":"Fri, 27 Jun 2025 01:00:00 +0200","biburl":"https://dblp.org/rec/journals/corr/abs-2505-20645.bib","bibsource":"dblp computer science bibliography, https://dblp.org","bibtex":"@article{DBLP:journals/corr/abs-2505-20645,\n author = {Kai Chen and\n Zihao He and\n Taiwei Shi and\n Kristina Lerman},\n title = {{STEER-BENCH:} {A} Benchmark for Evaluating the Steerability of Large\n Language Models},\n journal = {CoRR},\n volume = {abs/2505.20645},\n year = {2025},\n url = {https://doi.org/10.48550/arXiv.2505.20645},\n doi = {10.48550/ARXIV.2505.20645},\n eprinttype = {arXiv},\n eprint = {2505.20645},\n timestamp = {Fri, 27 Jun 2025 01:00:00 +0200},\n biburl = {https://dblp.org/rec/journals/corr/abs-2505-20645.bib},\n bibsource = {dblp computer science bibliography, https://dblp.org}\n}\n\n","author_short":["Chen, K.","He, Z.","Shi, T.","Lerman, K."],"key":"DBLP:journals/corr/abs-2505-20645","id":"DBLP:journals/corr/abs-2505-20645","bibbaseid":"chen-he-shi-lerman-steerbenchabenchmarkforevaluatingthesteerabilityoflargelanguagemodels-2025","role":"author","urls":{"Paper":"https://doi.org/10.48550/arXiv.2505.20645"},"metadata":{"authorlinks":{}}},"bibtype":"article","biburl":"https://dblp.org/pid/99/433.bib","dataSources":["kxTAWhAJ5AEaGtDRP"],"keywords":[],"search_terms":["steer","bench","benchmark","evaluating","steerability","large","language","models","chen","he","shi","lerman"],"title":"STEER-BENCH: A Benchmark for Evaluating the Steerability of Large Language Models","year":2025}