Reward Machines: Exploiting Reward Function Structure in Reinforcement Learning. Icarte, R. T., Klassen, T. Q., Valenzano, R. A., & McIlraith, S. A. J. Artif. Intell. Res., 73:173-208, 2022.
Link
Paper bibtex @article{journals/jair/IcarteKVM22,
added-at = {2025-01-19T00:00:00.000+0100},
author = {Icarte, Rodrigo Toro and Klassen, Toryn Q. and Valenzano, Richard Anthony and McIlraith, Sheila A.},
biburl = {https://www.bibsonomy.org/bibtex/20796c1d250443375c329a734510544cd/dblp},
ee = {https://www.wikidata.org/entity/Q130953251},
interhash = {851d12347e8a5b2dcf529a75cef1ca90},
intrahash = {0796c1d250443375c329a734510544cd},
journal = {J. Artif. Intell. Res.},
keywords = {dblp},
pages = {173-208},
timestamp = {2025-01-27T08:15:56.000+0100},
title = {Reward Machines: Exploiting Reward Function Structure in Reinforcement Learning.},
url = {http://dblp.uni-trier.de/db/journals/jair/jair73.html#IcarteKVM22},
volume = 73,
year = 2022
}
Downloads: 0
{"_id":"4gMCHbwfdAsfpDNNy","bibbaseid":"icarte-klassen-valenzano-mcilraith-rewardmachinesexploitingrewardfunctionstructureinreinforcementlearning-2022","author_short":["Icarte, R. T.","Klassen, T. Q.","Valenzano, R. A.","McIlraith, S. A."],"bibdata":{"bibtype":"article","type":"article","added-at":"2025-01-19T00:00:00.000+0100","author":[{"propositions":[],"lastnames":["Icarte"],"firstnames":["Rodrigo","Toro"],"suffixes":[]},{"propositions":[],"lastnames":["Klassen"],"firstnames":["Toryn","Q."],"suffixes":[]},{"propositions":[],"lastnames":["Valenzano"],"firstnames":["Richard","Anthony"],"suffixes":[]},{"propositions":[],"lastnames":["McIlraith"],"firstnames":["Sheila","A."],"suffixes":[]}],"biburl":"https://www.bibsonomy.org/bibtex/20796c1d250443375c329a734510544cd/dblp","ee":"https://www.wikidata.org/entity/Q130953251","interhash":"851d12347e8a5b2dcf529a75cef1ca90","intrahash":"0796c1d250443375c329a734510544cd","journal":"J. Artif. Intell. Res.","keywords":"dblp","pages":"173-208","timestamp":"2025-01-27T08:15:56.000+0100","title":"Reward Machines: Exploiting Reward Function Structure in Reinforcement Learning.","url":"http://dblp.uni-trier.de/db/journals/jair/jair73.html#IcarteKVM22","volume":"73","year":"2022","bibtex":"@article{journals/jair/IcarteKVM22,\n added-at = {2025-01-19T00:00:00.000+0100},\n author = {Icarte, Rodrigo Toro and Klassen, Toryn Q. and Valenzano, Richard Anthony and McIlraith, Sheila A.},\n biburl = {https://www.bibsonomy.org/bibtex/20796c1d250443375c329a734510544cd/dblp},\n ee = {https://www.wikidata.org/entity/Q130953251},\n interhash = {851d12347e8a5b2dcf529a75cef1ca90},\n intrahash = {0796c1d250443375c329a734510544cd},\n journal = {J. Artif. Intell. Res.},\n keywords = {dblp},\n pages = {173-208},\n timestamp = {2025-01-27T08:15:56.000+0100},\n title = {Reward Machines: Exploiting Reward Function Structure in Reinforcement Learning.},\n url = {http://dblp.uni-trier.de/db/journals/jair/jair73.html#IcarteKVM22},\n volume = 73,\n year = 2022\n}\n\n","author_short":["Icarte, R. T.","Klassen, T. Q.","Valenzano, R. A.","McIlraith, S. A."],"key":"journals/jair/IcarteKVM22","id":"journals/jair/IcarteKVM22","bibbaseid":"icarte-klassen-valenzano-mcilraith-rewardmachinesexploitingrewardfunctionstructureinreinforcementlearning-2022","role":"author","urls":{"Link":"https://www.wikidata.org/entity/Q130953251","Paper":"http://dblp.uni-trier.de/db/journals/jair/jair73.html#IcarteKVM22"},"keyword":["dblp"],"metadata":{"authorlinks":{}}},"bibtype":"article","biburl":"http://www.bibsonomy.org/bib/author/Sheila McIlraith?items=1000","dataSources":["rQFxZQs78YQJ9m34s","uKBTF27RvvtN9Ryxw"],"keywords":["dblp"],"search_terms":["reward","machines","exploiting","reward","function","structure","reinforcement","learning","icarte","klassen","valenzano","mcilraith"],"title":"Reward Machines: Exploiting Reward Function Structure in Reinforcement Learning.","year":2022}