The Dynamics of Reinforcement Learning in Cooperative Multiagent Systems

The Dynamics of Reinforcement Learning in Cooperative Multiagent Systems. Claus, C. & Boutilier, C.
abstract bibtex

Reinforcement learning can provide a robust and natural means for agents to learn how to coordinate their action choices in multiagent systems. We examine some of the factors that can influence the dynamics of the learning process in such a setting. We first distinguish reinforcement learners that are unaware of (or ignore) the presence of other agents from those that explicitly attempt to learn the value of joint actions and the strategies of their counterparts. We study (a simple form of) Q-learning in cooperative multiagent systems under these two perspectives, focusing on the influence of that game structure and exploration strategies on convergence to (optimal and suboptimal) Nash equilibria. We then propose alternative optimistic exploration strategies that increase the likelihood of convergence to an optimal equilibrium.

% Conference paper from the AAAI-98 proceedings. The venue, year and page
% range were filled in from the published proceedings; the automatic export
% carried only a page count (7) and no venue or date. The citation key is
% intentionally left unchanged so existing citations keep resolving.
@inproceedings{claus_dynamics_nodate,
  author    = {Claus, Caroline and Boutilier, Craig},
  title     = {The Dynamics of Reinforcement Learning in Cooperative Multiagent Systems},
  booktitle = {Proceedings of the Fifteenth National Conference on Artificial Intelligence ({AAAI}-98)},
  year      = {1998},
  pages     = {746--752},
  publisher = {AAAI Press},
  language  = {en},
  abstract  = {Reinforcement learning can provide a robust and natural means for agents to learn how to coordinate their action choices in multiagent systems. We examine some of the factors that can influence the dynamics of the learning process in such a setting. We first distinguish reinforcement learners that are unaware of (or ignore) the presence of other agents from those that explicitly attempt to learn the value of joint actions and the strategies of their counterparts. We study (a simple form of) Q-learning in cooperative multiagent systems under these two perspectives, focusing on the influence of that game structure and exploration strategies on convergence to (optimal and suboptimal) Nash equilibria. We then propose alternative optimistic exploration strategies that increase the likelihood of convergence to an optimal equilibrium.},
}

Downloads: 0

{"_id":"MjgfrJNw3z6oErLFS","bibbaseid":"claus-boutilier-thedynamicsofreinforcementlearningincooperativemultiagentsystems","authorIDs":[],"author_short":["Claus, C.","Boutilier, C."],"bibdata":{"bibtype":"article","type":"article","title":"The Dynamics of Reinforcement Learning in Cooperative Multiagent Systems","abstract":"Reinforcement learning can provide a robust and natural means for agents to learn how to coordinate their action choices in multiagent systems. We examine some of the factors that can inﬂuence the dynamics of the learning process in such a setting. We ﬁrst distinguish reinforcement learners that are unaware of (or ignore) the presence of other agents from those that explicitly attempt to learn the value of joint actions and the strategies of their counterparts. We study (a simple form of) Q-learning in cooperative multiagent systems under these two perspectives, focusing on the inﬂuence of that game structure and exploration strategies on convergence to (optimal and suboptimal) Nash equilibria. We then propose alternative optimistic exploration strategies that increase the likelihood of convergence to an optimal equilibrium.","language":"en","author":[{"propositions":[],"lastnames":["Claus"],"firstnames":["Caroline"],"suffixes":[]},{"propositions":[],"lastnames":["Boutilier"],"firstnames":["Craig"],"suffixes":[]}],"pages":"7","bibtex":"@article{claus_dynamics_nodate,\n\ttitle = {The {Dynamics} of {Reinforcement} {Learning} in {Cooperative} {Multiagent} {Systems}},\n\tabstract = {Reinforcement learning can provide a robust and natural means for agents to learn how to coordinate their action choices in multiagent systems. We examine some of the factors that can inﬂuence the dynamics of the learning process in such a setting. We ﬁrst distinguish reinforcement learners that are unaware of (or ignore) the presence of other agents from those that explicitly attempt to learn the value of joint actions and the strategies of their counterparts. 
We study (a simple form of) Q-learning in cooperative multiagent systems under these two perspectives, focusing on the inﬂuence of that game structure and exploration strategies on convergence to (optimal and suboptimal) Nash equilibria. We then propose alternative optimistic exploration strategies that increase the likelihood of convergence to an optimal equilibrium.},\n\tlanguage = {en},\n\tauthor = {Claus, Caroline and Boutilier, Craig},\n\tpages = {7}\n}\n\n","author_short":["Claus, C.","Boutilier, C."],"key":"claus_dynamics_nodate","id":"claus_dynamics_nodate","bibbaseid":"claus-boutilier-thedynamicsofreinforcementlearningincooperativemultiagentsystems","role":"author","urls":{},"downloads":0,"html":""},"bibtype":"article","biburl":"https://bibbase.org/zotero/asneha213","creationDate":"2019-07-08T00:48:54.943Z","downloads":0,"keywords":[],"search_terms":["dynamics","reinforcement","learning","cooperative","multiagent","systems","claus","boutilier"],"title":"The Dynamics of Reinforcement Learning in Cooperative Multiagent Systems","year":null,"dataSources":["fjacg9txEnNSDwee6"]}