BetaZero: Belief-state planning for long-horizon POMDPs using learned approximations. Moss, R. J., Corso, A., Caers, J., & Kochenderfer, M. J. In Reinforcement Learning Conference, 2024.
Paper bibtex 3 downloads
@InProceedings{Moss2024rlc,
author = {Robert J. Moss and Anthony Corso and Jef Caers and Mykel J. Kochenderfer},
booktitle = {Reinforcement Learning Conference},
title = {Beta{Z}ero: {B}elief-state planning for long-horizon {POMDP}s using learned approximations},
year = {2024},
url = {https://arxiv.org/abs/2306.00249},
}
Downloads: 3
{"_id":"uWJqw4GWHkwyKHNXK","bibbaseid":"moss-corso-caers-kochenderfer-betazerobeliefstateplanningforlonghorizonpomdpsusinglearnedapproximations-2024","author_short":["Moss, R. J.","Corso, A.","Caers, J.","Kochenderfer, M. J."],"bibdata":{"bibtype":"inproceedings","type":"inproceedings","author":[{"firstnames":["Robert","J."],"propositions":[],"lastnames":["Moss"],"suffixes":[]},{"firstnames":["Anthony"],"propositions":[],"lastnames":["Corso"],"suffixes":[]},{"firstnames":["Jef"],"propositions":[],"lastnames":["Caers"],"suffixes":[]},{"firstnames":["Mykel","J."],"propositions":[],"lastnames":["Kochenderfer"],"suffixes":[]}],"booktitle":"Reinforcement Learning Conference","title":"BetaZero: Belief-state planning for long-horizon POMDPs using learned approximations","year":"2024","url":"https://arxiv.org/abs/2306.00249","bibtex":"@InProceedings{Moss2024rlc,\n author = {Robert J. Moss and Anthony Corso and Jef Caers and Mykel J. Kochenderfer},\n booktitle = {Reinforcement Learning Conference},\n title = {Beta{Z}ero: {B}elief-state planning for long-horizon {POMDP}s using learned approximations},\n year = {2024},\n url = {https://arxiv.org/abs/2306.00249},\n}\n\n","author_short":["Moss, R. J.","Corso, A.","Caers, J.","Kochenderfer, M. J."],"key":"Moss2024rlc","id":"Moss2024rlc","bibbaseid":"moss-corso-caers-kochenderfer-betazerobeliefstateplanningforlonghorizonpomdpsusinglearnedapproximations-2024","role":"author","urls":{"Paper":"https://arxiv.org/abs/2306.00249"},"metadata":{"authorlinks":{}},"downloads":3,"html":""},"bibtype":"inproceedings","biburl":"https://ancorso.github.io/files/references.bib","dataSources":["Q5m4eREZKA5kKSYST","mSsYghgSmyfbF75po","L6He8KnRF8BusNwKm","bdnWRMC3puq7qTm42"],"keywords":[],"search_terms":["betazero","belief","state","planning","long","horizon","pomdps","using","learned","approximations","moss","corso","caers","kochenderfer"],"title":"BetaZero: Belief-state planning for long-horizon POMDPs using learned approximations","year":2024,"downloads":3}