Online Learning in Markov Decision Processes with Adversarially Chosen Transition Probability Distributions. Abbasi-Yadkori, Y., Bartlett, P. L., & Szepesvári, C. CoRR, 2013. Paper bibtex @article{DBLP:journals/corr/abs-1303-3055,
author = {Yasin Abbasi{-}Yadkori and
Peter L. Bartlett and
Csaba Szepesv{\'{a}}ri},
title = {Online Learning in Markov Decision Processes with Adversarially Chosen
Transition Probability Distributions},
journal = {CoRR},
volume = {abs/1303.3055},
year = {2013},
url = {http://arxiv.org/abs/1303.3055},
archivePrefix = {arXiv},
eprint = {1303.3055},
timestamp = {Mon, 13 Aug 2018 01:00:00 +0200},
biburl = {https://dblp.org/rec/journals/corr/abs-1303-3055.bib},
bibsource = {dblp computer science bibliography, https://dblp.org}
}
Downloads: 0
{"_id":"usdey8rbZY9oDiGor","bibbaseid":"abbasiyadkori-bartlett-szepesvri-onlinelearninginmarkovdecisionprocesseswithadversariallychosentransitionprobabilitydistributions-2013","author_short":["Abbasi-Yadkori, Y.","Bartlett, P. L.","Szepesvári, C."],"bibdata":{"bibtype":"article","type":"article","author":[{"firstnames":["Yasin"],"propositions":[],"lastnames":["Abbasi-Yadkori"],"suffixes":[]},{"firstnames":["Peter","L."],"propositions":[],"lastnames":["Bartlett"],"suffixes":[]},{"firstnames":["Csaba"],"propositions":[],"lastnames":["Szepesvári"],"suffixes":[]}],"title":"Online Learning in Markov Decision Processes with Adversarially Chosen Transition Probability Distributions","journal":"CoRR","volume":"abs/1303.3055","year":"2013","url":"http://arxiv.org/abs/1303.3055","archiveprefix":"arXiv","eprint":"1303.3055","timestamp":"Mon, 13 Aug 2018 01:00:00 +0200","biburl":"https://dblp.org/rec/journals/corr/abs-1303-3055.bib","bibsource":"dblp computer science bibliography, https://dblp.org","bibtex":"@article{DBLP:journals/corr/abs-1303-3055,\n author = {Yasin Abbasi{-}Yadkori and\n Peter L. Bartlett and\n Csaba Szepesv{\\'{a}}ri},\n title = {Online Learning in Markov Decision Processes with Adversarially Chosen\n Transition Probability Distributions},\n journal = {CoRR},\n volume = {abs/1303.3055},\n year = {2013},\n url = {http://arxiv.org/abs/1303.3055},\n archivePrefix = {arXiv},\n eprint = {1303.3055},\n timestamp = {Mon, 13 Aug 2018 01:00:00 +0200},\n biburl = {https://dblp.org/rec/journals/corr/abs-1303-3055.bib},\n bibsource = {dblp computer science bibliography, https://dblp.org}\n}\n\n","author_short":["Abbasi-Yadkori, Y.","Bartlett, P. L.","Szepesvári, C."],"key":"DBLP:journals/corr/abs-1303-3055","id":"DBLP:journals/corr/abs-1303-3055","bibbaseid":"abbasiyadkori-bartlett-szepesvri-onlinelearninginmarkovdecisionprocesseswithadversariallychosentransitionprobabilitydistributions-2013","role":"author","urls":{"Paper":"http://arxiv.org/abs/1303.3055"},"metadata":{"authorlinks":{}}},"bibtype":"article","biburl":"https://sites.ualberta.ca/~szepesva/papers/567.bib","dataSources":["cd5AYQRw3RHjTgoQc"],"keywords":[],"search_terms":["online","learning","markov","decision","processes","adversarially","chosen","transition","probability","distributions","abbasi-yadkori","bartlett","szepesvári"],"title":"Online Learning in Markov Decision Processes with Adversarially Chosen Transition Probability Distributions","year":2013}