Using Reward Machines for High-Level Task Specification and Decomposition in Reinforcement Learning. Toro Icarte, R., Klassen, T. Q., Valenzano, R., & McIlraith, S. A. In Proceedings of the 35th International Conference on Machine Learning (ICML), pages 2112-2121, 2018. Paper Code bibtex 41 downloads @inproceedings{tor-etal-icml18,
author = {Rodrigo {Toro Icarte} and
Toryn Q. Klassen and
Richard Valenzano and
Sheila A. McIlraith},
title = {Using Reward Machines for High-Level Task Specification and Decomposition in Reinforcement Learning},
booktitle = {Proceedings of the 35th International Conference on Machine Learning (ICML)},
year = {2018},
url = {http://proceedings.mlr.press/v80/icarte18a.html},
url_code = {https://bitbucket.org/RToroIcarte/qrm},
pages = {2112-2121},
keywords = {reward machines, reinforcement learning}
}
Downloads: 41
{"_id":"jQcgmjWZcrzRwq4dx","bibbaseid":"toroicarte-klassen-valenzano-mcilraith-usingrewardmachinesforhighleveltaskspecificationanddecompositioninreinforcementlearning-2018","downloads":44,"creationDate":"2018-06-10T21:09:41.186Z","title":"Using Reward Machines for High-Level Task Specification and Decomposition in Reinforcement Learning","author_short":["Toro Icarte, R.","Klassen, T. Q.","Valenzano, R.","McIlraith, S. A."],"year":2018,"bibtype":"inproceedings","biburl":"https://www.cs.toronto.edu/~sheila/publications/list.bib","bibdata":{"bibtype":"inproceedings","type":"inproceedings","author":[{"firstnames":["Rodrigo"],"propositions":[],"lastnames":["Toro Icarte"],"suffixes":[]},{"firstnames":["Toryn","Q."],"propositions":[],"lastnames":["Klassen"],"suffixes":[]},{"firstnames":["Richard"],"propositions":[],"lastnames":["Valenzano"],"suffixes":[]},{"firstnames":["Sheila","A."],"propositions":[],"lastnames":["McIlraith"],"suffixes":[]}],"title":"Using Reward Machines for High-Level Task Specification and Decomposition in Reinforcement Learning","booktitle":"Proceedings of the 35th International Conference on Machine Learning (ICML)","year":"2018","url":"http://proceedings.mlr.press/v80/icarte18a.html","url_code":"https://bitbucket.org/RToroIcarte/qrm","pages":"2112-2121","keywords":"reward machines, reinforcement learning","bibtex":"@inproceedings{tor-etal-icml18,\n author = {Rodrigo {Toro Icarte} and\n Toryn Q. Klassen and\n Richard Valenzano and\n Sheila A. McIlraith},\n title = {Using Reward Machines for High-Level Task Specification and Decomposition in Reinforcement Learning},\n booktitle = {Proceedings of the 35th International Conference on Machine Learning (ICML)},\n year = {2018},\n url = {http://proceedings.mlr.press/v80/icarte18a.html},\n url_code = {https://bitbucket.org/RToroIcarte/qrm},\n pages = {2112-2121},\n keywords = {reward machines, reinforcement learning}\n}\n\n","author_short":["Toro Icarte, R.","Klassen, T. Q.","Valenzano, R.","McIlraith, S. A."],"key":"tor-etal-icml18","id":"tor-etal-icml18","bibbaseid":"toroicarte-klassen-valenzano-mcilraith-usingrewardmachinesforhighleveltaskspecificationanddecompositioninreinforcementlearning-2018","role":"author","urls":{"Paper":"http://proceedings.mlr.press/v80/icarte18a.html"," code":"https://bitbucket.org/RToroIcarte/qrm"},"keyword":["reward machines","reinforcement learning"],"metadata":{"authorlinks":{"toro icarte, r":"https://www.cs.toronto.edu/~toryn/test/publications/reward_machines.html","mcilraith, s":"https://www.cs.toronto.edu/~sheila/preferences/"}},"downloads":41},"search_terms":["using","reward","machines","high","level","task","specification","decomposition","reinforcement","learning","toro icarte","klassen","valenzano","mcilraith"],"keywords":["reward machines","reinforcement learning"],"authorIDs":["2JP7Eg9bhybNpzYiR","3b3gnNFqBHiteKXs2","3wSJLXJ9XuZ2mDm2H","49zg6n33JhWCCjH4G","4zKMDaLdYLdgGQChe","5456dccd8b01c81930000008","5baeaf7a91342d10000001cb","5bbfaade26813d10000000c0","5bc20a498d625410000000a0","5e390326dc5b8ade010000ac","6RJeJwCaTdt9z5nYv","7bxyKKMGnHxEQh3cj","7deQZsScCfPeKMrqy","7wFQb9PYwsS7Meg7i","BsZbZovaHNF4dA3SG","GKYqrPg3uj7nu7nbt","GvvCbq8Y4n9QqTySC","HF25KvZDEBf5Nvp8x","HhKYdEPpCZAmKPPQc","J5FZeQWmDd6p96K8P","LwbwhDPiGy5gvQipm","NJYBJe35TWp5FARRc","Ni37kLLmf4zgkdNFZ","RStoeQpfqvDsMSLzJ","T9PWjMkNwX9WQ5frZ","TuqvMAPdZhcxfZKp7","Wipe7PE2hMCo9rb5r","WqZpp9fP47artme8L","XCnXFqMPKPFkRq2kj","XEMAfXz5wSaaLnBkk","goc5YRXzjuZMrzKik","iEMJPovEGF7jk6vBD","iWkYLX2HSxaiwbphr","j9wxxJ9nPog3bHXaY","jArTXYwhaXss62KJk","jDsmsaB2wJpvPgxE4","kx2M4GyrQDBEqRT4q","m6X7Yg32T74Fxxn2d","nvsBeFCxyzjQRGPSi","paM4BdJgmXhvmhNf8","tRLzqBJWc3TYzBYox","vReYR7kzq7n4RR9Ng","x6aX8g9rWCY5wzyW2","xW8eSNRWi7bXhQuHC","xm2sosMHyKsPj85Pb","ybLsHWfLgzQZAQ5WE","zsNPuARLzosfgmFwd"],"dataSources":["FAyKHaeKDYM4aGJk2","euD7cPywCk5gX9zDY","optQ3PYGE2PxhriFJ","2LLKDfkxMDdABm58M","T3oedZczBnZ2Y6GvJ","Jwuh2BtHasSBPk4uf"]}