Safe Reinforcement Learning Through Regret and State Restorations in Evaluation Stages. Gros, T. P., Müller, N. J., Höller, D., & Wolf, V. 2024.
bibtex   
% NOTE(review): the article entry type requires a journal field, which is
% missing below; BibTeX will warn until it is supplied. The venue is not
% recorded here -- TODO confirm and add it (or switch the entry type if this
% is not a journal paper).
@article{gros2024safe,
	author = {Gros, Timo P. and M{\"u}ller, Nicola J. and H{\"o}ller, Daniel and Wolf, Verena},
	title = {Safe Reinforcement Learning Through Regret and State Restorations in Evaluation Stages},
	year = {2024},
}

Downloads: 0