STEER-BENCH: A Benchmark for Evaluating the Steerability of Large Language Models. Chen, K., He, Z., Shi, T., & Lerman, K. CoRR, 2025.
STEER-BENCH: A Benchmark for Evaluating the Steerability of Large Language Models [link] Paper  doi  bibtex
@comment{arXiv preprint record; metadata as provided by dblp (see the biburl and bibsource fields). Citation key kept unchanged so existing cite commands still resolve.}
@article{DBLP:journals/corr/abs-2505-20645,
  author       = {Chen, Kai and
                  He, Zihao and
                  Shi, Taiwei and
                  Lerman, Kristina},
  title        = {{STEER-BENCH}: {A} Benchmark for Evaluating the Steerability of Large
                  Language Models},
  journal      = {CoRR},
  volume       = {abs/2505.20645},
  year         = {2025},
  url          = {https://doi.org/10.48550/arXiv.2505.20645},
  doi          = {10.48550/ARXIV.2505.20645},
  eprinttype   = {arXiv},
  eprint       = {2505.20645},
  timestamp    = {Fri, 27 Jun 2025 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/corr/abs-2505-20645.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}

Downloads: 0