Learning the variance of the reward-to-go. Tamar, A., Di Castro, D., & Mannor, S. Journal of Machine Learning Research, 17(13):1–36, 2016.
BibTeX
% Journal article: Tamar, Di Castro, and Mannor, JMLR 17(13), 2016.
@article{tamar2016learning,
  author  = {Tamar, Aviv and Di Castro, Dotan and Mannor, Shie},
  title   = {Learning the variance of the reward-to-go},
  journal = {Journal of Machine Learning Research},
  year    = {2016},
  volume  = {17},
  number  = {13},
  pages   = {1--36},
}

Downloads: 0