BetaZero: Belief-state planning for long-horizon POMDPs using learned approximations. Moss, R. J., Corso, A., Caers, J., & Kochenderfer, M. J. In Reinforcement Learning Conference, 2024.
BetaZero: Belief-state planning for long-horizon POMDPs using learned approximations. [Paper link] [bibtex] (3 downloads)
% Conference paper (Reinforcement Learning Conference, 2024); the eprint id is the arXiv identifier from the url field.
@inproceedings{Moss2024rlc,
    author        = {Moss, Robert J. and Corso, Anthony and Caers, Jef and Kochenderfer, Mykel J.},
    title         = {{BetaZero}: {Belief}-state planning for long-horizon {POMDPs} using learned approximations},
    booktitle     = {Reinforcement Learning Conference},
    year          = {2024},
    eprint        = {2306.00249},
    archiveprefix = {arXiv},
    url           = {https://arxiv.org/abs/2306.00249},
}

Downloads: 3