Planning with partially specified behaviors. Segovia-Aguas, J., Ferrer-Mestres, J., & Jonsson, A. Volume 288 , 2016.
doi  abstract   bibtex   
© 2016 The authors and IOS Press. All rights reserved. In this paper we present a framework called Planning with Partially Specified Behaviors, or PPSB, for combining reinforcement learning and planning to solve sequential decision problems. Although not often combined, we show that reinforcement learning and planning complement each other well, in that each can take advantage of the strengths of the other. PPSB uses partial action specifications to decompose sequential decision problems into tasks that serve as an interface between reinforcement learning and planning. On the bottom level, we use reinforcement learning to compute policies for achieving each individual task. On the top level, we use planning to produce a sequence of tasks that achieves an overall goal. We validate PPSB in experiments in which a robot has to perform tasks in a realistic simulated environment.
@book{
 title = {Planning with partially specified behaviors},
 type = {book},
 year = {2016},
 source = {Frontiers in Artificial Intelligence and Applications},
 keywords = {Agent Programming,Classical Planning,Hierachical Decomposition,Reinforcement Learning},
 volume = {288},
 id = {08216ed4-2fcc-3fab-a0d7-4dc171d88fe2},
 created = {2018-07-16T07:35:57.876Z},
 file_attached = {false},
 profile_id = {de5765e4-e253-3166-8178-333c824974ba},
 last_modified = {2018-07-16T07:35:57.876Z},
 read = {false},
 starred = {false},
 authored = {true},
 confirmed = {false},
 hidden = {false},
 private_publication = {false},
 abstract = {© 2016 The authors and IOS Press. All rights reserved. In this paper we present a framework called Planning with Partially Specified Behaviors, or PPSB, for combining reinforcement learning and planning to solve sequential decision problems. Although not often combined, we show that reinforcement learning and planning complement each other well, in that each can take advantage of the strengths of the other. PPSB uses partial action specifications to decompose sequential decision problems into tasks that serve as an interface between reinforcement learning and planning. On the bottom level, we use reinforcement learning to compute policies for achieving each individual task. On the top level, we use planning to produce a sequence of tasks that achieves an overall goal. We validate PPSB in experiments in which a robot has to perform tasks in a realistic simulated environment.},
 bibtype = {book},
 author = {Segovia-Aguas, J. and Ferrer-Mestres, J. and Jonsson, A.},
 doi = {10.3233/978-1-61499-696-5-263}
}

Downloads: 0