CRUXEval: A Benchmark for Code Reasoning, Understanding and Execution. Gu, A., Rozière, B., Leather, H., Solar-Lezama, A., Synnaeve, G., & Wang, S. I. CoRR, 2024.
Paper doi bibtex @article{DBLP:journals/corr/abs-2401-03065,
author = {Alex Gu and
Baptiste Rozi{\`{e}}re and
Hugh Leather and
Armando Solar{-}Lezama and
Gabriel Synnaeve and
Sida I. Wang},
title = {CRUXEval: {A} Benchmark for Code Reasoning, Understanding and Execution},
journal = {CoRR},
volume = {abs/2401.03065},
year = {2024},
url = {https://doi.org/10.48550/arXiv.2401.03065},
doi = {10.48550/ARXIV.2401.03065},
eprinttype = {arXiv},
eprint = {2401.03065},
timestamp = {Wed, 24 Jan 2024 00:00:00 +0100},
biburl = {https://dblp.org/rec/journals/corr/abs-2401-03065.bib},
bibsource = {dblp computer science bibliography, https://dblp.org}
}
Downloads: 0
{"_id":"MML2BDyCyyL6gbRoq","bibbaseid":"gu-rozire-leather-solarlezama-synnaeve-wang-cruxevalabenchmarkforcodereasoningunderstandingandexecution-2024","author_short":["Gu, A.","Rozière, B.","Leather, H.","Solar-Lezama, A.","Synnaeve, G.","Wang, S. I."],"bibdata":{"bibtype":"article","type":"article","author":[{"firstnames":["Alex"],"propositions":[],"lastnames":["Gu"],"suffixes":[]},{"firstnames":["Baptiste"],"propositions":[],"lastnames":["Rozière"],"suffixes":[]},{"firstnames":["Hugh"],"propositions":[],"lastnames":["Leather"],"suffixes":[]},{"firstnames":["Armando"],"propositions":[],"lastnames":["Solar-Lezama"],"suffixes":[]},{"firstnames":["Gabriel"],"propositions":[],"lastnames":["Synnaeve"],"suffixes":[]},{"firstnames":["Sida","I."],"propositions":[],"lastnames":["Wang"],"suffixes":[]}],"title":"CRUXEval: A Benchmark for Code Reasoning, Understanding and Execution","journal":"CoRR","volume":"abs/2401.03065","year":"2024","url":"https://doi.org/10.48550/arXiv.2401.03065","doi":"10.48550/ARXIV.2401.03065","eprinttype":"arXiv","eprint":"2401.03065","timestamp":"Wed, 24 Jan 2024 00:00:00 +0100","biburl":"https://dblp.org/rec/journals/corr/abs-2401-03065.bib","bibsource":"dblp computer science bibliography, https://dblp.org","bibtex":"@article{DBLP:journals/corr/abs-2401-03065,\n author = {Alex Gu and\n Baptiste Rozi{\\`{e}}re and\n Hugh Leather and\n Armando Solar{-}Lezama and\n Gabriel Synnaeve and\n Sida I. Wang},\n title = {CRUXEval: {A} Benchmark for Code Reasoning, Understanding and Execution},\n journal = {CoRR},\n volume = {abs/2401.03065},\n year = {2024},\n url = {https://doi.org/10.48550/arXiv.2401.03065},\n doi = {10.48550/ARXIV.2401.03065},\n eprinttype = {arXiv},\n eprint = {2401.03065},\n timestamp = {Wed, 24 Jan 2024 00:00:00 +0100},\n biburl = {https://dblp.org/rec/journals/corr/abs-2401-03065.bib},\n bibsource = {dblp computer science bibliography, https://dblp.org}\n}\n\n","author_short":["Gu, A.","Rozière, B.","Leather, H.","Solar-Lezama, A.","Synnaeve, G.","Wang, S. I."],"key":"DBLP:journals/corr/abs-2401-03065","id":"DBLP:journals/corr/abs-2401-03065","bibbaseid":"gu-rozire-leather-solarlezama-synnaeve-wang-cruxevalabenchmarkforcodereasoningunderstandingandexecution-2024","role":"author","urls":{"Paper":"https://doi.org/10.48550/arXiv.2401.03065"},"metadata":{"authorlinks":{}}},"bibtype":"article","biburl":"http://dblp.org/pers/tb2/s/Solar=Lezama:Armando","dataSources":["rGuy4xgsrB7zfgooW","DAnxudWukpMXCtWy8"],"keywords":[],"search_terms":["cruxeval","benchmark","code","reasoning","understanding","execution","gu","rozière","leather","solar-lezama","synnaeve","wang"],"title":"CRUXEval: A Benchmark for Code Reasoning, Understanding and Execution","year":2024}