Policy Search for the Optimal Control of Markov Decision Processes: A Novel Particle-Based Iterative Scheme. Manganini, G., Pirotta, M., Restelli, M., Piroddi, L., & Prandini, M. IEEE Transactions on Cybernetics, 46(11):2643--2655, 2016.
doi  bibtex   
% Journal article. In the title only the proper noun "Markov" is brace-protected, so bibliography styles remain free to apply their own casing to the rest; the journal name is stored in normal title case with the acronym protected.
@article{manganini_policy_2016,
	author = {Manganini, Giorgio and Pirotta, Matteo and Restelli, Marcello and Piroddi, Luigi and Prandini, Maria},
	title = {Policy Search for the Optimal Control of {Markov} Decision Processes: A Novel Particle-Based Iterative Scheme},
	journal = {{IEEE} Transactions on Cybernetics},
	volume = {46},
	number = {11},
	pages = {2643--2655},
	year = {2016},
	doi = {10.1109/TCYB.2015.2483780},
}

Downloads: 0