Learning to Mix n-Step Returns: Generalizing lambda-Returns for Deep Reinforcement Learning

Learning to Mix n-Step Returns: Generalizing lambda-Returns for Deep Reinforcement Learning. Sharma, S., J, G. R., Ramesh, S., & Ravindran, B. CoRR, 2017.

Paper bibtex

@article{DBLP:journals/corr/SharmaRJR17,
  author    = {Sahil Sharma and
               Girish Raguvir J and
               Srivatsan Ramesh and
               Balaraman Ravindran},
  title     = {Learning to Mix n-Step Returns: Generalizing lambda-Returns for Deep
               Reinforcement Learning},
  journal   = {CoRR},
  volume    = {abs/1705.07445},
  year      = {2017},
  url       = {http://arxiv.org/abs/1705.07445},
  archivePrefix = {arXiv},
  eprint    = {1705.07445},
  timestamp = {Fri, 10 Nov 2017 00:00:00 +0100},
  biburl    = {https://dblp.org/rec/bib/journals/corr/SharmaRJR17},
  bibsource = {dblp computer science bibliography, https://dblp.org}
}

Downloads: 0

{"_id":"jyNsBsRkr8SSd9tr7","bibbaseid":"sharma-j-ramesh-ravindran-learningtomixnstepreturnsgeneralizinglambdareturnsfordeepreinforcementlearning-2017","downloads":0,"creationDate":"2018-07-05T07:18:52.416Z","title":"Learning to Mix n-Step Returns: Generalizing lambda-Returns for Deep Reinforcement Learning","author_short":["Sharma, S.","J, G. R.","Ramesh, S.","Ravindran, B."],"year":2017,"bibtype":"article","biburl":"https://dblp.org/pid/69/2281.bib","bibdata":{"bibtype":"article","type":"article","author":[{"firstnames":["Sahil"],"propositions":[],"lastnames":["Sharma"],"suffixes":[]},{"firstnames":["Girish","Raguvir"],"propositions":[],"lastnames":["J"],"suffixes":[]},{"firstnames":["Srivatsan"],"propositions":[],"lastnames":["Ramesh"],"suffixes":[]},{"firstnames":["Balaraman"],"propositions":[],"lastnames":["Ravindran"],"suffixes":[]}],"title":"Learning to Mix n-Step Returns: Generalizing lambda-Returns for Deep Reinforcement Learning","journal":"CoRR","volume":"abs/1705.07445","year":"2017","url":"http://arxiv.org/abs/1705.07445","archiveprefix":"arXiv","eprint":"1705.07445","timestamp":"Fri, 10 Nov 2017 00:00:00 +0100","biburl":"https://dblp.org/rec/bib/journals/corr/SharmaRJR17","bibsource":"dblp computer science bibliography, https://dblp.org","bibtex":"@article{DBLP:journals/corr/SharmaRJR17,\n author = {Sahil Sharma and\n Girish Raguvir J and\n Srivatsan Ramesh and\n Balaraman Ravindran},\n title = {Learning to Mix n-Step Returns: Generalizing lambda-Returns for Deep\n Reinforcement Learning},\n journal = {CoRR},\n volume = {abs/1705.07445},\n year = {2017},\n url = {http://arxiv.org/abs/1705.07445},\n archivePrefix = {arXiv},\n eprint = {1705.07445},\n timestamp = {Fri, 10 Nov 2017 00:00:00 +0100},\n biburl = {https://dblp.org/rec/bib/journals/corr/SharmaRJR17},\n bibsource = {dblp computer science bibliography, https://dblp.org}\n}\n\n","author_short":["Sharma, S.","J, G. R.","Ramesh, S.","Ravindran, B."],"key":"DBLP:journals/corr/SharmaRJR17","id":"DBLP:journals/corr/SharmaRJR17","bibbaseid":"sharma-j-ramesh-ravindran-learningtomixnstepreturnsgeneralizinglambdareturnsfordeepreinforcementlearning-2017","role":"author","urls":{"Paper":"http://arxiv.org/abs/1705.07445"},"downloads":0},"search_terms":["learning","mix","step","returns","generalizing","lambda","returns","deep","reinforcement","learning","sharma","j","ramesh","ravindran"],"keywords":[],"authorIDs":[],"dataSources":["h4b7adP45ppx3WFf8"]}