Hierarchical Reinforcement Learning with the MAXQ Value Function Decomposition. Dietterich, T. G. Journal of Artificial Intelligence Research, 13:227-303, 2000.
Hierarchical Reinforcement Learning with the MAXQ Value Function Decomposition [link]Paper  doi  bibtex   
@comment{Journal article on the MAXQ value function decomposition. biblatex field names are used (journaltitle, date, urldate, langid). Only the acronym MAXQ is brace-protected in the title so styles may apply their own casing.}
@article{dietterichHierarchicalReinforcementLearning2000,
  author       = {Dietterich, Thomas G.},
  title        = {Hierarchical Reinforcement Learning with the {MAXQ} Value Function Decomposition},
  journaltitle = {Journal of Artificial Intelligence Research},
  shortjournal = {JAIR},
  volume       = {13},
  pages        = {227--303},
  date         = {2000-11-01},
  issn         = {1076-9757},
  doi          = {10.1613/jair.639},
  url          = {https://www.jair.org/index.php/jair/article/view/10266},
  urldate      = {2019-01-21},
  langid       = {english},
  file         = {/home/dimitri/Nextcloud/Zotero/storage/7S9KX8PT/Dietterich - 2000 - Hierarchical Reinforcement Learning with the MAXQ .pdf;/home/dimitri/Nextcloud/Zotero/storage/QC75TU4I/10266.html}
}

Downloads: 0