Convergence Results for Single-Step On-Policy Reinforcement Learning Algorithms. Singh, S., Jaakkola, T., Littman, M. L., & Szepesvári, C. Machine Learning, 1998. To appear
bibtex   
@comment{Journal article recorded as forthcoming in Machine Learning; the
  year and note fields reflect that pre-publication status.
  NOTE(review): confirm final volume, pages and year once known.}
@article{singh-jaak-littman-sze:ml98,
  author  = {Singh, Satinder and Jaakkola, Tommi and Littman, Michael L. and Szepesv{\'a}ri, Csaba},
  title   = {Convergence Results for Single-Step On-Policy Reinforcement Learning Algorithms},
  journal = {Machine Learning},
  year    = {1998},
  note    = {To appear},
}

Downloads: 0