Sample-efficient Nonstationary Policy Evaluation for Contextual Bandits. Dudík, M., Erhan, D., Langford, J., & Li, L. In Proceedings of Uncertainty in Artificial Intelligence (UAI), pages 247–254, 2012.
@comment{
  Conference paper, UAI 2012. The record appears to originate from DBLP (see biburl).
  The fields author_short, bibtype, id, biburl, conference and text are not standard
  BibTeX fields; standard styles ignore them, and they are kept here with their
  values unchanged for whatever tool produced them.
  The url field holds the publisher-side article page only; an earlier revision had a
  DBLP host prefix glued in front of this absolute URL, which made it unresolvable.
}
Paper bibtex @inproceedings{dblp2555701,
  author       = {Dudík, Miroslav and Erhan, Dumitru and Langford, John and Li, Lihong},
  author_short = {Dudík, M. and Erhan, D. and Langford, J. and Li, L.},
  title        = {Sample-efficient Nonstationary Policy Evaluation for Contextual Bandits},
  booktitle    = {Proceedings of Uncertainty in Artificial Intelligence (UAI)},
  pages        = {247--254},
  year         = {2012},
  url          = {https://dslpitt.org/uai/displayArticleDetails.jsp?mmnu=1&smnu=2&article_id=2287&proceeding_id=28},
  biburl       = {http://www.dblp.org/rec/bibtex/conf/uai/DudikELL12},
  bibtype      = {inproceedings},
  type         = {inproceedings},
  key          = {dblp2555701},
  id           = {dblp2555701},
  conference   = {UAI},
  text         = {UAI 2012:247-254}
}
Downloads: 0
{"_id":"L3AB7Y7nxYa9cjSS3","bibbaseid":"dudk-erhan-langford-li-sampleefficientnonstationarypolicyevaluationforcontextualbandits-2012","downloads":0,"creationDate":"2015-12-14T04:14:19.911Z","title":"Sample-efficient Nonstationary Policy Evaluation for Contextual Bandits","author_short":["Dudík, M.","Erhan, D.","Langford, J.","Li, L."],"year":2012,"bibtype":"inproceedings","biburl":"http://www.dblp.org/rec/bibtex/conf/uai/DudikELL12","bibdata":{"title":"Sample-efficient Nonstationary Policy Evaluation for Contextual Bandits","author":["Miroslav Dudík","Dumitru Erhan","John Langford","Lihong Li"],"author_short":["Dudík, M.","Erhan, D.","Langford, J.","Li, L."],"bibtype":"inproceedings","type":"inproceedings","year":"2012","key":"dblp2555701","id":"dblp2555701","biburl":"http://www.dblp.org/rec/bibtex/conf/uai/DudikELL12","url":"http://dblp.uni-trier.de/https://dslpitt.org/uai/displayArticleDetails.jsp?mmnu=1&smnu=2&article_id=2287&proceeding_id=28","conference":"UAI","pages":"247-254","text":"UAI 2012:247-254","booktitle":"Proceedings of Uncertainty in Artificial Intelligence (UAI)","bibtex":"@inproceedings{ dblp2555701,\n title = {Sample-efficient Nonstationary Policy Evaluation for Contextual Bandits},\n author = {Miroslav Dudík and Dumitru Erhan and John Langford and Lihong Li},\n author_short = {Dudík, M. and Erhan, D. and Langford, J. 
and Li, L.},\n bibtype = {inproceedings},\n type = {inproceedings},\n year = {2012},\n key = {dblp2555701},\n id = {dblp2555701},\n biburl = {http://www.dblp.org/rec/bibtex/conf/uai/DudikELL12},\n url = {http://dblp.uni-trier.de/https://dslpitt.org/uai/displayArticleDetails.jsp?mmnu=1&smnu=2&article_id=2287&proceeding_id=28},\n conference = {UAI},\n pages = {247-254},\n text = {UAI 2012:247-254},\n booktitle = {Proceedings of Uncertainty in Artificial Intelligence (UAI)}\n}","bibbaseid":"dudk-erhan-langford-li-sampleefficientnonstationarypolicyevaluationforcontextualbandits-2012","role":"author","urls":{"Paper":"http://dblp.uni-trier.de/https://dslpitt.org/uai/displayArticleDetails.jsp?mmnu=1&smnu=2&article_id=2287&proceeding_id=28"},"downloads":0,"html":""},"search_terms":["sample","efficient","nonstationary","policy","evaluation","contextual","bandits","dudík","erhan","langford","li"],"keywords":[],"authorIDs":[],"dataSources":["HzQNuaSsY9SPRfGwu"]}