Adversarial Soft Advantage Fitting: Imitation Learning without Policy Optimization. Barde, P., Roy, J., Jeon, W., Pineau, J., Pal, C. J., & Nowrouzezahrai, D. CoRR, 2020. Paper bibtex
@comment{arXiv preprint record as exported by DBLP. Field values are unchanged; authors are written in "Last, First" form, which parses to the same name parts.}
@article{DBLP:journals/corr/abs-2006-13258,
  author     = {Barde, Paul and
                Roy, Julien and
                Jeon, Wonseok and
                Pineau, Joelle and
                Pal, Christopher J. and
                Nowrouzezahrai, Derek},
  title      = {Adversarial Soft Advantage Fitting: Imitation Learning without Policy Optimization},
  journal    = {CoRR},
  volume     = {abs/2006.13258},
  year       = {2020},
  url        = {https://arxiv.org/abs/2006.13258},
  eprinttype = {arXiv},
  eprint     = {2006.13258},
  timestamp  = {Wed, 01 Jul 2020 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/journals/corr/abs-2006-13258.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org},
}
Downloads: 0
{"_id":"rGkr4xtC7QYJyJ2ub","bibbaseid":"barde-roy-jeon-pineau-pal-nowrouzezahrai-adversarialsoftadvantagefittingimitationlearningwithoutpolicyoptimization-2020","author_short":["Barde, P.","Roy, J.","Jeon, W.","Pineau, J.","Pal, C. J.","Nowrouzezahrai, D."],"bibdata":{"bibtype":"article","type":"article","author":[{"firstnames":["Paul"],"propositions":[],"lastnames":["Barde"],"suffixes":[]},{"firstnames":["Julien"],"propositions":[],"lastnames":["Roy"],"suffixes":[]},{"firstnames":["Wonseok"],"propositions":[],"lastnames":["Jeon"],"suffixes":[]},{"firstnames":["Joelle"],"propositions":[],"lastnames":["Pineau"],"suffixes":[]},{"firstnames":["Christopher","J."],"propositions":[],"lastnames":["Pal"],"suffixes":[]},{"firstnames":["Derek"],"propositions":[],"lastnames":["Nowrouzezahrai"],"suffixes":[]}],"title":"Adversarial Soft Advantage Fitting: Imitation Learning without Policy Optimization","journal":"CoRR","volume":"abs/2006.13258","year":"2020","url":"https://arxiv.org/abs/2006.13258","eprinttype":"arXiv","eprint":"2006.13258","timestamp":"Wed, 01 Jul 2020 01:00:00 +0200","biburl":"https://dblp.org/rec/journals/corr/abs-2006-13258.bib","bibsource":"dblp computer science bibliography, https://dblp.org","bibtex":"@article{DBLP:journals/corr/abs-2006-13258,\n author = {Paul Barde and\n Julien Roy and\n Wonseok Jeon and\n Joelle Pineau and\n Christopher J. Pal and\n Derek Nowrouzezahrai},\n title = {Adversarial Soft Advantage Fitting: Imitation Learning without Policy\n Optimization},\n journal = {CoRR},\n volume = {abs/2006.13258},\n year = {2020},\n url = {https://arxiv.org/abs/2006.13258},\n eprinttype = {arXiv},\n eprint = {2006.13258},\n timestamp = {Wed, 01 Jul 2020 01:00:00 +0200},\n biburl = {https://dblp.org/rec/journals/corr/abs-2006-13258.bib},\n bibsource = {dblp computer science bibliography, https://dblp.org}\n}\n\n","author_short":["Barde, P.","Roy, J.","Jeon, W.","Pineau, J.","Pal, C. 
J.","Nowrouzezahrai, D."],"key":"DBLP:journals/corr/abs-2006-13258","id":"DBLP:journals/corr/abs-2006-13258","bibbaseid":"barde-roy-jeon-pineau-pal-nowrouzezahrai-adversarialsoftadvantagefittingimitationlearningwithoutpolicyoptimization-2020","role":"author","urls":{"Paper":"https://arxiv.org/abs/2006.13258"},"metadata":{"authorlinks":{}}},"bibtype":"article","biburl":"https://dblp.org/pid/30/4225.bib","dataSources":["6SeDWrH8eZcL7m8iW"],"keywords":[],"search_terms":["adversarial","soft","advantage","fitting","imitation","learning","without","policy","optimization","barde","roy","jeon","pineau","pal","nowrouzezahrai"],"title":"Adversarial Soft Advantage Fitting: Imitation Learning without Policy Optimization","year":2020}