{"_id":"eHLFqXbyhksfRBfzG","bibbaseid":"bastani-pu-solarlezama-verifiablereinforcementlearningviapolicyextraction-2018","author_short":["Bastani, O.","Pu, Y.","Solar-Lezama, A."],"bibdata":{"bibtype":"inproceedings","type":"inproceedings","author":[{"firstnames":["Osbert"],"propositions":[],"lastnames":["Bastani"],"suffixes":[]},{"firstnames":["Yewen"],"propositions":[],"lastnames":["Pu"],"suffixes":[]},{"firstnames":["Armando"],"propositions":[],"lastnames":["Solar-Lezama"],"suffixes":[]}],"title":"Verifiable Reinforcement Learning via Policy Extraction","booktitle":"Advances in Neural Information Processing Systems 31: Annual Conference on Neural Information Processing Systems 2018, NeurIPS 2018, December 3-8, 2018, Montréal, Canada","pages":"2499–2509","year":"2018","crossref":"DBLP:conf/nips/2018","url":"https://proceedings.neurips.cc/paper/2018/hash/e6d8545daa42d5ced125a4bf747b3688-Abstract.html","timestamp":"Mon, 16 May 2022 15:41:51 +0200","biburl":"https://dblp.org/rec/conf/nips/BastaniPS18.bib","bibsource":"dblp computer science bibliography, https://dblp.org","bibtex":"@inproceedings{DBLP:conf/nips/BastaniPS18,\n author = {Osbert Bastani and\n Yewen Pu and\n Armando Solar{-}Lezama},\n title = {Verifiable Reinforcement Learning via Policy Extraction},\n booktitle = {Advances in Neural Information Processing Systems 31: Annual Conference\n on Neural Information Processing Systems 2018, NeurIPS 2018, December\n 3-8, 2018, Montr{\\'{e}}al, Canada},\n pages = {2499--2509},\n year = {2018},\n crossref = {DBLP:conf/nips/2018},\n url = {https://proceedings.neurips.cc/paper/2018/hash/e6d8545daa42d5ced125a4bf747b3688-Abstract.html},\n timestamp = {Mon, 16 May 2022 15:41:51 +0200},\n biburl = {https://dblp.org/rec/conf/nips/BastaniPS18.bib},\n bibsource = {dblp computer science bibliography, https://dblp.org}\n}\n\n","author_short":["Bastani, O.","Pu, Y.","Solar-Lezama, A."],"key":"DBLP:conf/nips/BastaniPS18","id":"DBLP:conf/nips/BastaniPS18","bibbaseid":"bastani-pu-solarlezama-verifiablereinforcementlearningviapolicyextraction-2018","role":"author","urls":{"Paper":"https://proceedings.neurips.cc/paper/2018/hash/e6d8545daa42d5ced125a4bf747b3688-Abstract.html"},"metadata":{"authorlinks":{}}},"bibtype":"inproceedings","biburl":"http://dblp.org/pers/tb2/s/Solar=Lezama:Armando","dataSources":["DAnxudWukpMXCtWy8"],"keywords":[],"search_terms":["verifiable","reinforcement","learning","via","policy","extraction","bastani","pu","solar-lezama"],"title":"Verifiable Reinforcement Learning via Policy Extraction","year":2018}