Robust Reward Modeling via Causal Rubrics. Srivastava, P., Singh, H., Madhavan, R., Patil, G., Addepalli, S., Suggala, A. S., Aravamudhan, R., Sharma, S., Laha, A., Raghuveer, A., Shanmugam, K., & Precup, D. CoRR, abs/2506.16507, June 2025.
Robust Reward Modeling via Causal Rubrics. [link]Link  Robust Reward Modeling via Causal Rubrics. [link]Paper  bibtex   
@comment{arXiv preprint as indexed by DBLP under CoRR. The citation key and the
DBLP/BibSonomy bookkeeping fields (added-at, biburl, ee, interhash, intrahash,
keywords, timestamp) are kept exactly as exported so existing citations and
sync tooling keep working. The month uses the standard three-letter macro, the
title has no trailing period because the bibliography style supplies
punctuation, and doi/eprint expose the identifiers in the fields that styles
actually read.}
@article{journals/corr/abs-2506-16507,
  author     = {Srivastava, Pragya and Singh, Harman and Madhavan, Rahul and Patil, Gandharv and Addepalli, Sravanti and Suggala, Arun Sai and Aravamudhan, Rengarajan and Sharma, Soumya and Laha, Anirban and Raghuveer, Aravindan and Shanmugam, Karthikeyan and Precup, Doina},
  title      = {Robust Reward Modeling via Causal Rubrics},
  journal    = {CoRR},
  volume     = {abs/2506.16507},
  year       = {2025},
  month      = jun,
  doi        = {10.48550/arXiv.2506.16507},
  eprint     = {2506.16507},
  eprinttype = {arXiv},
  url        = {http://dblp.uni-trier.de/db/journals/corr/corr2506.html#abs-2506-16507},
  ee         = {https://doi.org/10.48550/arXiv.2506.16507},
  keywords   = {dblp},
  added-at   = {2025-07-11T00:00:00.000+0200},
  timestamp  = {2025-07-14T07:06:35.000+0200},
  biburl     = {https://www.bibsonomy.org/bibtex/2ea7fca8194f9c74e24a1b4e424157f77/dblp},
  interhash  = {7cbce6a252b133fb78dd5f96fbfc5313},
  intrahash  = {ea7fca8194f9c74e24a1b4e424157f77},
}

Downloads: 0