GTBench: Uncovering the Strategic Reasoning Limitations of LLMs via Game-Theoretic Evaluations. Duan, J., Zhang, R., Diffenderfer, J., Kailkhura, B., Sun, L., Stengel-Eskin, E., Bansal, M., Chen, T., & Xu, K. CoRR, 2024.
GTBench: Uncovering the Strategic Reasoning Limitations of LLMs via Game-Theoretic Evaluations. [link]Link  GTBench: Uncovering the Strategic Reasoning Limitations of LLMs via Game-Theoretic Evaluations. [link]Paper  bibtex   
@comment{arXiv preprint (CoRR) record exported via BibSonomy from DBLP.
  The doi/eprint fields carry the machine-readable identifiers; journal/volume
  are retained so classic styles that require a journal for article entries still work.
  The fields from ee down to timestamp are exporter metadata that standard styles ignore.}
@article{journals/corr/abs-2402-12348,
  author     = {Duan, Jinhao and Zhang, Renming and Diffenderfer, James and Kailkhura, Bhavya and Sun, Lichao and Stengel-Eskin, Elias and Bansal, Mohit and Chen, Tianlong and Xu, Kaidi},
  title      = {{GTBench}: Uncovering the Strategic Reasoning Limitations of {LLMs} via Game-Theoretic Evaluations},
  journal    = {CoRR},
  volume     = {abs/2402.12348},
  year       = {2024},
  doi        = {10.48550/arXiv.2402.12348},
  eprint     = {2402.12348},
  eprinttype = {arXiv},
  url        = {http://dblp.uni-trier.de/db/journals/corr/corr2402.html#abs-2402-12348},
  ee         = {https://doi.org/10.48550/arXiv.2402.12348},
  biburl     = {https://www.bibsonomy.org/bibtex/237eeb10fc103e0cabffc23e26b9750ab/dblp},
  interhash  = {2684bb150f0c3efcd24f5fdb074b23cc},
  intrahash  = {37eeb10fc103e0cabffc23e26b9750ab},
  keywords   = {dblp},
  added-at   = {2025-09-06T00:00:00.000+0200},
  timestamp  = {2025-09-15T07:28:47.000+0200},
}

Downloads: 0