Hierarchical Reinforcement Learning with the MAXQ Value Function Decomposition. Dietterich, T. G. Journal of Artificial Intelligence Research, 13:227-303, 2000.
Paper doi bibtex
@comment{
  Journal article record for the MAXQ paper (JAIR, volume 13).
  The entry uses biblatex field names (journaltitle, date, urldate, langid,
  shortjournal), so it is intended for biblatex/Biber rather than a classic .bst.
  Only the acronym MAXQ is brace-protected in the title; all other casing is
  left to the bibliography style.
  The file field holds attachment paths from the exporting machine and is not
  printed by the standard styles.
}
@article{dietterichHierarchicalReinforcementLearning2000,
  author       = {Dietterich, Thomas G.},
  title        = {Hierarchical Reinforcement Learning with the {MAXQ} Value Function Decomposition},
  journaltitle = {Journal of Artificial Intelligence Research},
  shortjournal = {J. Artif. Intell. Res.},
  volume       = {13},
  pages        = {227--303},
  date         = {2000-11-01},
  issn         = {1076-9757},
  doi          = {10.1613/jair.639},
  url          = {https://www.jair.org/index.php/jair/article/view/10266},
  urldate      = {2019-01-21},
  langid       = {english},
  file         = {/home/dimitri/Nextcloud/Zotero/storage/7S9KX8PT/Dietterich - 2000 - Hierarchical Reinforcement Learning with the MAXQ .pdf;/home/dimitri/Nextcloud/Zotero/storage/QC75TU4I/10266.html},
}