Robust Reward Modeling via Causal Rubrics. Srivastava, P., Singh, H., Madhavan, R., Patil, G., Addepalli, S., Suggala, A. S., Aravamudhan, R., Sharma, S., Laha, A., Raghuveer, A., Shanmugam, K., & Precup, D. CoRR, 06, 2025.
Link
Paper bibtex @article{journals/corr/abs-2506-16507,
added-at = {2025-07-11T00:00:00.000+0200},
author = {Srivastava, Pragya and Singh, Harman and Madhavan, Rahul and Patil, Gandharv and Addepalli, Sravanti and Suggala, Arun Sai and Aravamudhan, Rengarajan and Sharma, Soumya and Laha, Anirban and Raghuveer, Aravindan and Shanmugam, Karthikeyan and Precup, Doina},
biburl = {https://www.bibsonomy.org/bibtex/2ea7fca8194f9c74e24a1b4e424157f77/dblp},
ee = {https://doi.org/10.48550/arXiv.2506.16507},
interhash = {7cbce6a252b133fb78dd5f96fbfc5313},
intrahash = {ea7fca8194f9c74e24a1b4e424157f77},
journal = {CoRR},
keywords = {dblp},
month = {06},
timestamp = {2025-07-14T07:06:35.000+0200},
title = {Robust Reward Modeling via Causal Rubrics.},
url = {http://dblp.uni-trier.de/db/journals/corr/corr2506.html#abs-2506-16507},
volume = {abs/2506.16507},
year = 2025
}
Downloads: 0
{"_id":"L8BP8MTxiLX6rmgH5","bibbaseid":"srivastava-singh-madhavan-patil-addepalli-suggala-aravamudhan-sharma-etal-robustrewardmodelingviacausalrubrics-2025","author_short":["Srivastava, P.","Singh, H.","Madhavan, R.","Patil, G.","Addepalli, S.","Suggala, A. S.","Aravamudhan, R.","Sharma, S.","Laha, A.","Raghuveer, A.","Shanmugam, K.","Precup, D."],"bibdata":{"bibtype":"article","type":"article","added-at":"2025-07-11T00:00:00.000+0200","author":[{"propositions":[],"lastnames":["Srivastava"],"firstnames":["Pragya"],"suffixes":[]},{"propositions":[],"lastnames":["Singh"],"firstnames":["Harman"],"suffixes":[]},{"propositions":[],"lastnames":["Madhavan"],"firstnames":["Rahul"],"suffixes":[]},{"propositions":[],"lastnames":["Patil"],"firstnames":["Gandharv"],"suffixes":[]},{"propositions":[],"lastnames":["Addepalli"],"firstnames":["Sravanti"],"suffixes":[]},{"propositions":[],"lastnames":["Suggala"],"firstnames":["Arun","Sai"],"suffixes":[]},{"propositions":[],"lastnames":["Aravamudhan"],"firstnames":["Rengarajan"],"suffixes":[]},{"propositions":[],"lastnames":["Sharma"],"firstnames":["Soumya"],"suffixes":[]},{"propositions":[],"lastnames":["Laha"],"firstnames":["Anirban"],"suffixes":[]},{"propositions":[],"lastnames":["Raghuveer"],"firstnames":["Aravindan"],"suffixes":[]},{"propositions":[],"lastnames":["Shanmugam"],"firstnames":["Karthikeyan"],"suffixes":[]},{"propositions":[],"lastnames":["Precup"],"firstnames":["Doina"],"suffixes":[]}],"biburl":"https://www.bibsonomy.org/bibtex/2ea7fca8194f9c74e24a1b4e424157f77/dblp","ee":"https://doi.org/10.48550/arXiv.2506.16507","interhash":"7cbce6a252b133fb78dd5f96fbfc5313","intrahash":"ea7fca8194f9c74e24a1b4e424157f77","journal":"CoRR","keywords":"dblp","month":"06","timestamp":"2025-07-14T07:06:35.000+0200","title":"Robust Reward Modeling via Causal Rubrics.","url":"http://dblp.uni-trier.de/db/journals/corr/corr2506.html#abs-2506-16507","volume":"abs/2506.16507","year":"2025","bibtex":"@article{journals/corr/abs-2506-16507,\n added-at = {2025-07-11T00:00:00.000+0200},\n author = {Srivastava, Pragya and Singh, Harman and Madhavan, Rahul and Patil, Gandharv and Addepalli, Sravanti and Suggala, Arun Sai and Aravamudhan, Rengarajan and Sharma, Soumya and Laha, Anirban and Raghuveer, Aravindan and Shanmugam, Karthikeyan and Precup, Doina},\n biburl = {https://www.bibsonomy.org/bibtex/2ea7fca8194f9c74e24a1b4e424157f77/dblp},\n ee = {https://doi.org/10.48550/arXiv.2506.16507},\n interhash = {7cbce6a252b133fb78dd5f96fbfc5313},\n intrahash = {ea7fca8194f9c74e24a1b4e424157f77},\n journal = {CoRR},\n keywords = {dblp},\n month = {06},\n timestamp = {2025-07-14T07:06:35.000+0200},\n title = {Robust Reward Modeling via Causal Rubrics.},\n url = {http://dblp.uni-trier.de/db/journals/corr/corr2506.html#abs-2506-16507},\n volume = {abs/2506.16507},\n year = 2025\n}\n\n","author_short":["Srivastava, P.","Singh, H.","Madhavan, R.","Patil, G.","Addepalli, S.","Suggala, A. S.","Aravamudhan, R.","Sharma, S.","Laha, A.","Raghuveer, A.","Shanmugam, K.","Precup, D."],"key":"journals/corr/abs-2506-16507","id":"journals/corr/abs-2506-16507","bibbaseid":"srivastava-singh-madhavan-patil-addepalli-suggala-aravamudhan-sharma-etal-robustrewardmodelingviacausalrubrics-2025","role":"author","urls":{"Link":"https://doi.org/10.48550/arXiv.2506.16507","Paper":"http://dblp.uni-trier.de/db/journals/corr/corr2506.html#abs-2506-16507"},"keyword":["dblp"],"metadata":{"authorlinks":{}},"downloads":0,"html":""},"bibtype":"article","biburl":"http://www.bibsonomy.org/bib/author/rahul ?items=1000","dataSources":["JwYijr7YMA4Gkd5HT"],"keywords":["dblp"],"search_terms":["robust","reward","modeling","via","causal","rubrics","srivastava","singh","madhavan","patil","addepalli","suggala","aravamudhan","sharma","laha","raghuveer","shanmugam","precup"],"title":"Robust Reward Modeling via Causal Rubrics.","year":2025}