Policy Invariance Under Reward Transformations: Theory and Application to Reward Shaping. Ng, A. Y., Harada, D., & Russell, S. J. In Proceedings of the Sixteenth International Conference on Machine Learning, ICML '99, pages 278–287. Morgan Kaufmann Publishers Inc., 1999.
Policy Invariance Under Reward Transformations: Theory and Application to Reward Shaping [link]Paper  bibtex   
% Conference paper: Ng, Harada and Russell, ICML '99 (pages 278--287).
% The entry uses biblatex field names (location, date, urldate, shorttitle),
% so it is meant for biblatex/Biber rather than a classic .bst style.
% Only the ICML acronym and the conference name are brace-protected; the
% paper title is left unprotected so the style can apply its own casing.
% NOTE(review): the file field looks like a machine-local Zotero attachment
% path; it is not printed by styles -- confirm whether it should be kept.
@inproceedings{ngPolicyInvarianceReward1999,
  author     = {Ng, Andrew Y. and Harada, Daishi and Russell, Stuart J.},
  title      = {Policy Invariance Under Reward Transformations: Theory and Application to Reward Shaping},
  shorttitle = {Policy Invariance Under Reward Transformations},
  booktitle  = {Proceedings of the {Sixteenth International Conference} on {Machine Learning}},
  series     = {{ICML} '99},
  pages      = {278--287},
  publisher  = {Morgan Kaufmann Publishers Inc.},
  location   = {San Francisco, CA, USA},
  date       = {1999},
  isbn       = {978-1-55860-612-8},
  url        = {http://dl.acm.org/citation.cfm?id=645528.657613},
  urldate    = {2019-01-21},
  file       = {/home/dimitri/Nextcloud/Zotero/storage/EFCC73Q2/Ng et al. - 1999 - Policy Invariance Under Reward Transformations Th.pdf},
}

Downloads: 0