clembench-2024: A Challenging, Dynamic, Complementary, Multilingual Benchmark and Underlying Flexible Framework for LLMs as Multi-Action Agents. Beyer, A., Chalamalasetti, K., Hakimov, S., Madureira, B., Sadler, P., & Schlangen, D. 2024.
bibtex   
% arXiv preprint. Braced words in the title keep their exact case under styles that recase titles.
@misc{Beyer-2024,
  author        = {Beyer, Anne and Chalamalasetti, Kranti and Hakimov, Sherzod and Madureira, Brielen and Sadler, Philipp and Schlangen, David},
  title         = {{clembench-2024}: A Challenging, Dynamic, Complementary, Multilingual Benchmark and Underlying Flexible Framework for {LLMs} as Multi-Action Agents},
  year          = {2024},
  eprint        = {2405.20859},
  archiveprefix = {arXiv},
  primaryclass  = {cs.CL},
}

Downloads: 0