Using Advice in Model-Based Reinforcement Learning. Toro Icarte, R., Klassen, T., Valenzano, R., & McIlraith, S. A. In Proceedings of the Multi-disciplinary Conference on Reinforcement Learning and Decision Making (RLDM), pages 199-203, 2017. bibtex @inproceedings{tor-etal-rldm17,
author = {Rodrigo {Toro Icarte} and
Toryn Klassen and
Richard Valenzano and
Sheila A. McIlraith},
title = {Using Advice in Model-Based Reinforcement Learning},
booktitle = {Proceedings of the Multi-disciplinary Conference on Reinforcement Learning and Decision Making ({RLDM})},
pages={199-203},
year = {2017}
}
Downloads: 0
{"_id":"fdCL9FNmqLTSRg9cD","bibbaseid":"toroicarte-klassen-valenzano-mcilraith-usingadviceinmodelbasedreinforcementlearning-2017","downloads":0,"creationDate":"2018-04-23T02:57:16.501Z","title":"Using Advice in Model-Based Reinforcement Learning","author_short":["Toro Icarte, R.","Klassen, T.","Valenzano, R.","McIlraith, S. A."],"year":2017,"bibtype":"inproceedings","biburl":"https://www.cs.toronto.edu/~sheila/publications/list.bib","bibdata":{"bibtype":"inproceedings","type":"inproceedings","author":[{"firstnames":["Rodrigo"],"propositions":[],"lastnames":["Toro Icarte"],"suffixes":[]},{"firstnames":["Toryn"],"propositions":[],"lastnames":["Klassen"],"suffixes":[]},{"firstnames":["Richard"],"propositions":[],"lastnames":["Valenzano"],"suffixes":[]},{"firstnames":["Sheila","A."],"propositions":[],"lastnames":["McIlraith"],"suffixes":[]}],"title":"Using Advice in Model-Based Reinforcement Learning","booktitle":"Proceedings of the Multi-disciplinary Conference on Reinforcement Learning and Decision Making (RLDM)","pages":"199-203","year":"2017","bibtex":"@inproceedings{tor-etal-rldm17,\n author = {Rodrigo {Toro Icarte} and\n Toryn Klassen and\n Richard Valenzano and\n Sheila A. McIlraith},\n title = {Using Advice in Model-Based Reinforcement Learning},\n booktitle = {Proceedings of the Multi-disciplinary Conference on Reinforcement Learning and Decision Making ({RLDM})},\n pages={199-203},\n year = {2017}\n}\n\n","author_short":["Toro Icarte, R.","Klassen, T.","Valenzano, R.","McIlraith, S. A."],"key":"tor-etal-rldm17","id":"tor-etal-rldm17","bibbaseid":"toroicarte-klassen-valenzano-mcilraith-usingadviceinmodelbasedreinforcementlearning-2017","role":"author","urls":{},"metadata":{"authorlinks":{"toro icarte, r":"https://www.cs.toronto.edu/~toryn/test/publications/reward_machines.html","mcilraith, s":"https://www.cs.toronto.edu/~sheila/preferences/"}},"downloads":0},"search_terms":["using","advice","model","based","reinforcement","learning","toro icarte","klassen","valenzano","mcilraith"],"keywords":[],"authorIDs":["2JP7Eg9bhybNpzYiR","3b3gnNFqBHiteKXs2","3wSJLXJ9XuZ2mDm2H","49zg6n33JhWCCjH4G","4zKMDaLdYLdgGQChe","5456dccd8b01c81930000008","5Eidhk5inwxxe7JGk","5baeaf7a91342d10000001cb","5bbfaade26813d10000000c0","5bc20a498d625410000000a0","5de9e8f29f521ddf010000f4","5dea039cfac96fde010000ad","5dea0c58fac96fde01000141","5df2ea54b91ab0de010000ea","5dfb881fc2820bdf010001a1","5e046c906ef264df010000b9","5e10276e2ef76bdf0100009f","5e129793551229df010000b6","5e162befdf1bb4de01000116","5e1e7705ce9ed9de0100012a","5e26328524c8a6de0100006d","5e2723abf51e02de010001fb","5e2784f755fc50df01000004","5e28be096acacbdf010000d4","5e326f1a5633c9de010000b0","5e3555a950cde4de0100000c","5e37c25d56571fde0100003d","5e380024918d4ede01000092","5e386d181f8af9e00100009b","5e390326dc5b8ade010000ac","5e3c31bf34cd37de01000126","5e4cec0e3e28aede0100012b","5e4f53598a3535f3010000cd","5e50202c933046de01000185","5e55431aca58a8df0100019a","5e5a1adc3557f5df010000c2","5e5c3b1e68f281de01000026","5e5e9d8bc0a53dde01000251","5e601cf3c064fcde010001dd","5e65c1b1d92058de010000e3","5e665cdd46e828de0100014d","5rfKneErnpvH8A9jA","6RJeJwCaTdt9z5nYv","6vPX7dp4BL2qMjx2i","7bxyKKMGnHxEQh3cj","7deQZsScCfPeKMrqy","7wFQb9PYwsS7Meg7i","9jPSyMaccQATNQzFR","AtaDzKGXz9bfKWfab","BsZbZovaHNF4dA3SG","CzTmxSkSkem3essqH","DPH6F3udnr4WBuFRg","GKYqrPg3uj7nu7nbt","GvvCbq8Y4n9QqTySC","HF25KvZDEBf5Nvp8x","HTN44dpu77wAWF8HE","HhKYdEPpCZAmKPPQc","J5FZeQWmDd6p96K8P","JDoXnkWb7QmkjpPqn","JGfakYisbgxjaayRF","KwLm5LfL8LpgKk8XJ","LwbwhDPiGy5gvQipm","NJYBJe35TWp5FARRc","Ni37kLLmf4zgkdNFZ","RStoeQpfqvDsMSLzJ","T9PWjMkNwX9WQ5frZ","TuqvMAPdZhcxfZKp7","Wipe7PE2hMCo9rb5r","WqZpp9fP47artme8L","XCnXFqMPKPFkRq2kj","XELkWriNsABzHMyaw","XEMAfXz5wSaaLnBkk","aXBRouHw2x2TwqbuE","ah2FNqZqgqkMf7rno","dSvyDxvHdpJ3uQRZS","goc5YRXzjuZMrzKik","htrNC4rPDzh6zfTLS","iEMJPovEGF7jk6vBD","iWkYLX2HSxaiwbphr","j9wxxJ9nPog3bHXaY","jArTXYwhaXss62KJk","jDsmsaB2wJpvPgxE4","kSfpomb2i9SWgtiBN","kx2M4GyrQDBEqRT4q","m6X7Yg32T74Fxxn2d","nvsBeFCxyzjQRGPSi","pRtcYGMaZMG8GTaSz","paM4BdJgmXhvmhNf8","tRLzqBJWc3TYzBYox","tmHrh8yBFTwMrLukn","uxproQToHm4wEZeph","vReYR7kzq7n4RR9Ng","wGWyTtcLspnfJaLeT","x6aX8g9rWCY5wzyW2","xW8eSNRWi7bXhQuHC","xZ6wRPENk64YNgMr7","xm2sosMHyKsPj85Pb","ybLsHWfLgzQZAQ5WE","zsNPuARLzosfgmFwd"],"dataSources":["FAyKHaeKDYM4aGJk2","euD7cPywCk5gX9zDY","optQ3PYGE2PxhriFJ","2LLKDfkxMDdABm58M","T3oedZczBnZ2Y6GvJ","Jwuh2BtHasSBPk4uf"]}