clembench-2024: A Challenging, Dynamic, Complementary, Multilingual Benchmark and Underlying Flexible Framework for LLMs as Multi-Action Agents. Beyer, A., Chalamalasetti, K., Hakimov, S., Madureira, B., Sadler, P., & Schlangen, D. 2024. bibtex @misc{Beyer-2024,
title = {clembench-2024: A Challenging, Dynamic, Complementary, Multilingual Benchmark and Underlying Flexible Framework for LLMs as Multi-Action Agents},
author = {Beyer, Anne and Chalamalasetti, Kranti and Hakimov, Sherzod and Madureira, Brielen and Sadler, Philipp and Schlangen, David},
year = {2024},
eprint = {2405.20859},
archiveprefix = {arXiv},
primaryclass = {cs.CL}
}
Downloads: 0
{"_id":"oiE7Ly6jKfXzggQMA","bibbaseid":"beyer-chalamalasetti-hakimov-madureira-sadler-schlangen-clembench2024achallengingdynamiccomplementarymultilingualbenchmarkandunderlyingflexibleframeworkforllmsasmultiactionagents-2024","author_short":["Beyer, A.","Chalamalasetti, K.","Hakimov, S.","Madureira, B.","Sadler, P.","Schlangen, D."],"bibdata":{"bibtype":"misc","type":"misc","title":"clembench-2024: A Challenging, Dynamic, Complementary, Multilingual Benchmark and Underlying Flexible Framework for LLMs as Multi-Action Agents","author":[{"propositions":[],"lastnames":["Beyer"],"firstnames":["Anne"],"suffixes":[]},{"propositions":[],"lastnames":["Chalamalasetti"],"firstnames":["Kranti"],"suffixes":[]},{"propositions":[],"lastnames":["Hakimov"],"firstnames":["Sherzod"],"suffixes":[]},{"propositions":[],"lastnames":["Madureira"],"firstnames":["Brielen"],"suffixes":[]},{"propositions":[],"lastnames":["Sadler"],"firstnames":["Philipp"],"suffixes":[]},{"propositions":[],"lastnames":["Schlangen"],"firstnames":["David"],"suffixes":[]}],"year":"2024","eprint":"2405.20859","archiveprefix":"arXiv","primaryclass":"cs.CL","bibtex":"@misc{Beyer-2024,\n title = {clembench-2024: A Challenging, Dynamic, Complementary, Multilingual Benchmark and Underlying Flexible Framework for LLMs as Multi-Action Agents},\n author = {Beyer, Anne and Chalamalasetti, Kranti and Hakimov, Sherzod and Madureira, Brielen and Sadler, Philipp and Schlangen, David},\n year = {2024},\n eprint = {2405.20859},\n archiveprefix = {arXiv},\n primaryclass = {cs.CL}\n}\n","author_short":["Beyer, A.","Chalamalasetti, K.","Hakimov, S.","Madureira, B.","Sadler, P.","Schlangen, D."],"key":"Beyer-2024","id":"Beyer-2024","bibbaseid":"beyer-chalamalasetti-hakimov-madureira-sadler-schlangen-clembench2024achallengingdynamiccomplementarymultilingualbenchmarkandunderlyingflexibleframeworkforllmsasmultiactionagents-2024","role":"author","urls":{},"metadata":{"authorlinks":{}}},"bibtype":"misc","biburl":"AnneBeyer.github.io/assets/bib/mine.bib","dataSources":["vJAkHsXDgEhvMakMj"],"keywords":[],"search_terms":["clembench","2024","challenging","dynamic","complementary","multilingual","benchmark","underlying","flexible","framework","llms","multi","action","agents","beyer","chalamalasetti","hakimov","madureira","sadler","schlangen"],"title":"clembench-2024: A Challenging, Dynamic, Complementary, Multilingual Benchmark and Underlying Flexible Framework for LLMs as Multi-Action Agents","year":2024}