Eureka: Human-Level Reward Design via Coding Large Language Models. Ma, Y. J., Liang, W., Wang, G., Huang, D., Bastani, O., Jayaraman, D., Zhu, Y., Fan, L., & Anandkumar, A. ICLR, 2024.
bibtex   
% Conference paper (ICLR 2024): typed as @inproceedings with the venue in booktitle.
@inproceedings{ma2024eureka,
      author    = {Ma, Yecheng Jason and Liang, William and Wang, Guanzhi and Huang, De-An and Bastani, Osbert and Jayaraman, Dinesh and Zhu, Yuke and Fan, Linxi and Anandkumar, Anima},
      title     = {{Eureka}: Human-Level Reward Design via Coding Large Language Models},
      booktitle = {International Conference on Learning Representations ({ICLR})},
      year      = {2024},
}

Downloads: 0