Does Context Matter? ContextualJudgeBench for Evaluating LLM-based Judges in Contextual Settings. Xu, A., Bansal, S., Ming, Y., Yavuz, S., & Joty, S. CoRR, 03, 2025.
Link
Paper bibtex @article{journals/corr/abs-2503-15620,
added-at = {2025-04-14T00:00:00.000+0200},
author = {Xu, Austin and Bansal, Srijan and Ming, Yifei and Yavuz, Semih and Joty, Shafiq},
biburl = {https://www.bibsonomy.org/bibtex/259acb943eeccb80f5df177ca96060463/dblp},
ee = {https://doi.org/10.48550/arXiv.2503.15620},
interhash = {00ffcb0129f293531f29836ce954200c},
intrahash = {59acb943eeccb80f5df177ca96060463},
journal = {CoRR},
keywords = {dblp},
month = {03},
timestamp = {2025-04-21T07:07:37.000+0200},
title = {Does Context Matter? ContextualJudgeBench for Evaluating LLM-based Judges in Contextual Settings.},
url = {http://dblp.uni-trier.de/db/journals/corr/corr2503.html#abs-2503-15620},
volume = {abs/2503.15620},
year = 2025
}
Downloads: 0
{"_id":"Mdw7tpoBeCiyiRiWP","bibbaseid":"xu-bansal-ming-yavuz-joty-doescontextmattercontextualjudgebenchforevaluatingllmbasedjudgesincontextualsettings-2025","author_short":["Xu, A.","Bansal, S.","Ming, Y.","Yavuz, S.","Joty, S."],"bibdata":{"bibtype":"article","type":"article","added-at":"2025-04-14T00:00:00.000+0200","author":[{"propositions":[],"lastnames":["Xu"],"firstnames":["Austin"],"suffixes":[]},{"propositions":[],"lastnames":["Bansal"],"firstnames":["Srijan"],"suffixes":[]},{"propositions":[],"lastnames":["Ming"],"firstnames":["Yifei"],"suffixes":[]},{"propositions":[],"lastnames":["Yavuz"],"firstnames":["Semih"],"suffixes":[]},{"propositions":[],"lastnames":["Joty"],"firstnames":["Shafiq"],"suffixes":[]}],"biburl":"https://www.bibsonomy.org/bibtex/259acb943eeccb80f5df177ca96060463/dblp","ee":"https://doi.org/10.48550/arXiv.2503.15620","interhash":"00ffcb0129f293531f29836ce954200c","intrahash":"59acb943eeccb80f5df177ca96060463","journal":"CoRR","keywords":"dblp","month":"03","timestamp":"2025-04-21T07:07:37.000+0200","title":"Does Context Matter? ContextualJudgeBench for Evaluating LLM-based Judges in Contextual Settings.","url":"http://dblp.uni-trier.de/db/journals/corr/corr2503.html#abs-2503-15620","volume":"abs/2503.15620","year":"2025","bibtex":"@article{journals/corr/abs-2503-15620,\n added-at = {2025-04-14T00:00:00.000+0200},\n author = {Xu, Austin and Bansal, Srijan and Ming, Yifei and Yavuz, Semih and Joty, Shafiq},\n biburl = {https://www.bibsonomy.org/bibtex/259acb943eeccb80f5df177ca96060463/dblp},\n ee = {https://doi.org/10.48550/arXiv.2503.15620},\n interhash = {00ffcb0129f293531f29836ce954200c},\n intrahash = {59acb943eeccb80f5df177ca96060463},\n journal = {CoRR},\n keywords = {dblp},\n month = {03},\n timestamp = {2025-04-21T07:07:37.000+0200},\n title = {Does Context Matter? ContextualJudgeBench for Evaluating LLM-based Judges in Contextual Settings.},\n url = {http://dblp.uni-trier.de/db/journals/corr/corr2503.html#abs-2503-15620},\n volume = {abs/2503.15620},\n year = 2025\n}\n\n","author_short":["Xu, A.","Bansal, S.","Ming, Y.","Yavuz, S.","Joty, S."],"key":"journals/corr/abs-2503-15620","id":"journals/corr/abs-2503-15620","bibbaseid":"xu-bansal-ming-yavuz-joty-doescontextmattercontextualjudgebenchforevaluatingllmbasedjudgesincontextualsettings-2025","role":"author","urls":{"Link":"https://doi.org/10.48550/arXiv.2503.15620","Paper":"http://dblp.uni-trier.de/db/journals/corr/corr2503.html#abs-2503-15620"},"keyword":["dblp"],"metadata":{"authorlinks":{}},"downloads":0,"html":""},"bibtype":"article","biburl":"http://www.bibsonomy.org/bib/author/Bansal?items=1000","dataSources":["QPenDByDoYqTm9vaT"],"keywords":["dblp"],"search_terms":["context","matter","contextualjudgebench","evaluating","llm","based","judges","contextual","settings","xu","bansal","ming","yavuz","joty"],"title":"Does Context Matter? ContextualJudgeBench for Evaluating LLM-based Judges in Contextual Settings.","year":2025}