Convergence Results for Single-Step On-Policy Reinforcement Learning Algorithms. Singh, S., Jaakkola, T., Littman, M. L., & Szepesvári, C. Machine Learning, 1998. To appear
bibtex   
@comment{
  Journal article recorded as forthcoming: the note field carries the
  "To appear" status and the year field stays a plain four-digit year.
  The accented letter in the last author's surname is written as a
  brace-group special character so that BibTeX treats it as a single
  letter when sorting and building labels.
}
@article{singh-jaak-littman-sze:ml98,
	author  = {Singh, Satinder and Jaakkola, Tommi and Littman, Michael L. and Szepesv{\'a}ri, Csaba},
	title   = {Convergence Results for Single-Step On-Policy Reinforcement Learning Algorithms},
	journal = {Machine Learning},
	year    = {1998},
	note    = {To appear},
}

Downloads: 0