Adversarial Soft Advantage Fitting: Imitation Learning without Policy Optimization. Barde, P., Roy, J., Jeon, W., Pineau, J., Pal, C. J., & Nowrouzezahrai, D. CoRR, 2020.
Adversarial Soft Advantage Fitting: Imitation Learning without Policy Optimization [Paper] [BibTeX]
% DBLP record for arXiv preprint 2006.13258, listed under the CoRR journal name.
% Authors are given in unambiguous "Last, First" form.
@article{DBLP:journals/corr/abs-2006-13258,
  author     = {Barde, Paul and
                Roy, Julien and
                Jeon, Wonseok and
                Pineau, Joelle and
                Pal, Christopher J. and
                Nowrouzezahrai, Derek},
  title      = {Adversarial Soft Advantage Fitting: Imitation Learning without Policy Optimization},
  journal    = {CoRR},
  volume     = {abs/2006.13258},
  year       = {2020},
  eprinttype = {arXiv},
  eprint     = {2006.13258},
  url        = {https://arxiv.org/abs/2006.13258},
  timestamp  = {Wed, 01 Jul 2020 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/journals/corr/abs-2006-13258.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org},
}

Downloads: 0