CRUXEval: A Benchmark for Code Reasoning, Understanding and Execution

CRUXEval: A Benchmark for Code Reasoning, Understanding and Execution. Gu, A., Rozière, B., Leather, H. J., Solar-Lezama, A., Synnaeve, G., & Wang, S. In Forty-first International Conference on Machine Learning, ICML 2024, Vienna, Austria, July 21-27, 2024, pages 16568–16621, 2024.

Paper bibtex

@inproceedings{DBLP:conf/icml/GuRLSS024,
  author       = {Alex Gu and
                  Baptiste Rozi{\`{e}}re and
                  Hugh James Leather and
                  Armando Solar{-}Lezama and
                  Gabriel Synnaeve and
                  Sida Wang},
  title        = {CRUXEval: {A} Benchmark for Code Reasoning, Understanding and Execution},
  booktitle    = {Forty-first International Conference on Machine Learning, {ICML} 2024,
                  Vienna, Austria, July 21-27, 2024},
  pages        = {16568--16621},
  year         = {2024},
  crossref     = {DBLP:conf/icml/2024},
  url          = {https://proceedings.mlr.press/v235/gu24c.html},
  timestamp    = {Mon, 09 Feb 2026 15:35:36 +0100},
  biburl       = {https://dblp.org/rec/conf/icml/GuRLSS024.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}

Downloads: 0

{"_id":"MML2BDyCyyL6gbRoq","bibbaseid":"gu-rozire-leather-solarlezama-synnaeve-wang-cruxevalabenchmarkforcodereasoningunderstandingandexecution-2024","author_short":["Gu, A.","Rozière, B.","Leather, H. J.","Solar-Lezama, A.","Synnaeve, G.","Wang, S."],"bibdata":{"bibtype":"inproceedings","type":"inproceedings","author":[{"firstnames":["Alex"],"propositions":[],"lastnames":["Gu"],"suffixes":[]},{"firstnames":["Baptiste"],"propositions":[],"lastnames":["Rozière"],"suffixes":[]},{"firstnames":["Hugh","James"],"propositions":[],"lastnames":["Leather"],"suffixes":[]},{"firstnames":["Armando"],"propositions":[],"lastnames":["Solar-Lezama"],"suffixes":[]},{"firstnames":["Gabriel"],"propositions":[],"lastnames":["Synnaeve"],"suffixes":[]},{"firstnames":["Sida"],"propositions":[],"lastnames":["Wang"],"suffixes":[]}],"title":"CRUXEval: A Benchmark for Code Reasoning, Understanding and Execution","booktitle":"Forty-first International Conference on Machine Learning, ICML 2024, Vienna, Austria, July 21-27, 2024","pages":"16568–16621","year":"2024","crossref":"DBLP:conf/icml/2024","url":"https://proceedings.mlr.press/v235/gu24c.html","timestamp":"Mon, 09 Feb 2026 15:35:36 +0100","biburl":"https://dblp.org/rec/conf/icml/GuRLSS024.bib","bibsource":"dblp computer science bibliography, https://dblp.org","bibtex":"@inproceedings{DBLP:conf/icml/GuRLSS024,\n author = {Alex Gu and\n Baptiste Rozi{\\`{e}}re and\n Hugh James Leather and\n Armando Solar{-}Lezama and\n Gabriel Synnaeve and\n Sida Wang},\n title = {CRUXEval: {A} Benchmark for Code Reasoning, Understanding and Execution},\n booktitle = {Forty-first International Conference on Machine Learning, {ICML} 2024,\n Vienna, Austria, July 21-27, 2024},\n pages = {16568--16621},\n year = {2024},\n crossref = {DBLP:conf/icml/2024},\n url = {https://proceedings.mlr.press/v235/gu24c.html},\n timestamp = {Mon, 09 Feb 2026 15:35:36 +0100},\n biburl = {https://dblp.org/rec/conf/icml/GuRLSS024.bib},\n bibsource = {dblp computer science bibliography, https://dblp.org}\n}\n\n","author_short":["Gu, A.","Rozière, B.","Leather, H. J.","Solar-Lezama, A.","Synnaeve, G.","Wang, S."],"key":"DBLP:conf/icml/GuRLSS024","id":"DBLP:conf/icml/GuRLSS024","bibbaseid":"gu-rozire-leather-solarlezama-synnaeve-wang-cruxevalabenchmarkforcodereasoningunderstandingandexecution-2024","role":"author","urls":{"Paper":"https://proceedings.mlr.press/v235/gu24c.html"},"metadata":{"authorlinks":{}}},"bibtype":"inproceedings","biburl":"http://dblp.org/pers/tb2/s/Solar=Lezama:Armando","dataSources":["DAnxudWukpMXCtWy8"],"keywords":[],"search_terms":["cruxeval","benchmark","code","reasoning","understanding","execution","gu","rozière","leather","solar-lezama","synnaeve","wang"],"title":"CRUXEval: A Benchmark for Code Reasoning, Understanding and Execution","year":2024}