Playing Atari with Deep Reinforcement Learning. Mnih, V., Kavukcuoglu, K., Silver, D., Graves, A., Antonoglou, I., Wierstra, D., & Riedmiller, M. arXiv:1312.5602 [cs], December, 2013. arXiv: 1312.5602
Paper | abstract | bibtex
We present the first deep learning model to successfully learn control policies directly from high-dimensional sensory input using reinforcement learning. The model is a convolutional neural network, trained with a variant of Q-learning, whose input is raw pixels and whose output is a value function estimating future rewards. We apply our method to seven Atari 2600 games from the Arcade Learning Environment, with no adjustment of the architecture or learning algorithm. We find that it outperforms all previous approaches on six of the games and surpasses a human expert on three of them.
@article{mnih_playing_2013,
title = {Playing {Atari} with {Deep} {Reinforcement} {Learning}},
url = {http://arxiv.org/abs/1312.5602},
abstract = {We present the first deep learning model to successfully learn control policies directly from high-dimensional sensory input using reinforcement learning. The model is a convolutional neural network, trained with a variant of Q-learning, whose input is raw pixels and whose output is a value function estimating future rewards. We apply our method to seven Atari 2600 games from the Arcade Learning Environment, with no adjustment of the architecture or learning algorithm. We find that it outperforms all previous approaches on six of the games and surpasses a human expert on three of them.},
urldate = {2019-05-14},
journal = {arXiv:1312.5602 [cs]},
author = {Mnih, Volodymyr and Kavukcuoglu, Koray and Silver, David and Graves, Alex and Antonoglou, Ioannis and Wierstra, Daan and Riedmiller, Martin},
month = dec,
year = {2013},
note = {arXiv: 1312.5602},
keywords = {Computer Science - Machine Learning},
}
Downloads: 0
{"_id":"63Ja2naMgQjBKqpoM","bibbaseid":"mnih-kavukcuoglu-silver-graves-antonoglou-wierstra-riedmiller-playingatariwithdeepreinforcementlearning-2013","downloads":0,"creationDate":"2019-01-26T05:02:40.432Z","title":"Playing Atari with Deep Reinforcement Learning","author_short":["Mnih, V.","Kavukcuoglu, K.","Silver, D.","Graves, A.","Antonoglou, I.","Wierstra, D.","Riedmiller, M."],"year":2013,"bibtype":"article","biburl":"https://bibbase.org/zotero/pab2163","bibdata":{"bibtype":"article","type":"article","title":"Playing Atari with Deep Reinforcement Learning","url":"http://arxiv.org/abs/1312.5602","abstract":"We present the first deep learning model to successfully learn control policies directly from high-dimensional sensory input using reinforcement learning. The model is a convolutional neural network, trained with a variant of Q-learning, whose input is raw pixels and whose output is a value function estimating future rewards. We apply our method to seven Atari 2600 games from the Arcade Learning Environment, with no adjustment of the architecture or learning algorithm. \nWe find that it outperforms all previous approaches on six of the games and surpasses a human expert on three of them.","urldate":"2019-05-14","journal":"arXiv:1312.5602 [cs]","author":[{"propositions":[],"lastnames":["Mnih"],"firstnames":["Volodymyr"],"suffixes":[]},{"propositions":[],"lastnames":["Kavukcuoglu"],"firstnames":["Koray"],"suffixes":[]},{"propositions":[],"lastnames":["Silver"],"firstnames":["David"],"suffixes":[]},{"propositions":[],"lastnames":["Graves"],"firstnames":["Alex"],"suffixes":[]},{"propositions":[],"lastnames":["Antonoglou"],"firstnames":["Ioannis"],"suffixes":[]},{"propositions":[],"lastnames":["Wierstra"],"firstnames":["Daan"],"suffixes":[]},{"propositions":[],"lastnames":["Riedmiller"],"firstnames":["Martin"],"suffixes":[]}],"month":"December","year":"2013","note":"arXiv: 1312.5602","keywords":"Computer Science - Machine Learning","bibtex":"@article{mnih_playing_2013,\n\ttitle = {Playing {Atari} with {Deep} {Reinforcement} {Learning}},\n\turl = {http://arxiv.org/abs/1312.5602},\n\tabstract = {We present the first deep learning model to successfully learn control policies directly from high-dimensional sensory input using reinforcement learning. The model is a convolutional neural network, trained with a variant of Q-learning, whose input is raw pixels and whose output is a value function estimating future rewards. We apply our method to seven Atari 2600 games from the Arcade Learning Environment, with no adjustment of the architecture or learning algorithm. \nWe find that it outperforms all previous approaches on six of the games and surpasses a human expert on three of them.},\n\turldate = {2019-05-14},\n\tjournal = {arXiv:1312.5602 [cs]},\n\tauthor = {Mnih, Volodymyr and Kavukcuoglu, Koray and Silver, David and Graves, Alex and Antonoglou, Ioannis and Wierstra, Daan and Riedmiller, Martin},\n\tmonth = dec,\n\tyear = {2013},\n\tnote = {arXiv: 1312.5602},\n\tkeywords = {Computer Science - Machine Learning},\n}\n\n\n\n\n\n\n\n\n\n\n\n","author_short":["Mnih, V.","Kavukcuoglu, K.","Silver, D.","Graves, A.","Antonoglou, I.","Wierstra, D.","Riedmiller, M."],"key":"mnih_playing_2013","id":"mnih_playing_2013","bibbaseid":"mnih-kavukcuoglu-silver-graves-antonoglou-wierstra-riedmiller-playingatariwithdeepreinforcementlearning-2013","role":"author","urls":{"Paper":"http://arxiv.org/abs/1312.5602"},"keyword":["Computer Science - Machine Learning"],"metadata":{"authorlinks":{}},"downloads":0,"html":""},"search_terms":["playing","atari","deep","reinforcement","learning","mnih","kavukcuoglu","silver","graves","antonoglou","wierstra","riedmiller"],"keywords":["computer science - machine learning"],"authorIDs":[],"dataSources":["hEoKh4ygEAWbAZ5iy","XFrKPG99s5t3W7xuW","CmHEoydhafhbkXXt5","Wsv2bQ4jPuc7qme8R","cx4WvnDhXJhiLqdQo","fB4GuzdCZcPR6LeBn"]}