Proximal Policy Optimization Algorithms. Schulman, J., Wolski, F., Dhariwal, P., Radford, A., & Klimov, O. 2017.
bibtex   
% PPO arXiv preprint (Schulman et al., 2017). Keep notes like this one outside
% the entry: BibTeX does not treat a percent sign as a comment inside an entry.
@misc{schulman2017proximalpolicyoptimizationalgorithms,
  title         = {Proximal Policy Optimization Algorithms},
  author        = {Schulman, John and Wolski, Filip and Dhariwal, Prafulla and Radford, Alec and Klimov, Oleg},
  year          = {2017},
  eprint        = {1707.06347},
  archivePrefix = {arXiv},
  primaryClass  = {cs.LG},
  url           = {https://arxiv.org/abs/1707.06347},
}

Downloads: 0