% Conference paper by Zhao and Zhu (2023), presented at the 22nd IFAC World
% Congress and published in the IFAC-PapersOnLine series.
% abstract, keywords, day and language are kept from the original export as
% annotations; they are not standard BibTeX fields, and styles that do not
% know a field ignore it.
@inproceedings{ebec9feecbf749ecb9563215e967b030,
  author    = {Zhao, Yuhan and Zhu, Quanyan},
  title     = {{Stackelberg} Meta-Learning Based Control for Guided Cooperative {LQG} Systems},
  booktitle = {22nd {IFAC} World Congress},
  editor    = {Ishii, Hideaki and Ebihara, Yoshio and Imura, Jun-ichi and Yamakita, Masaki},
  series    = {IFAC-PapersOnLine},
  number    = {2},
  pages     = {10120--10125},
  publisher = {Elsevier B.V.},
  year      = {2023},
  month     = jul,
  day       = {1},
  doi       = {10.1016/j.ifacol.2023.10.884},
  language  = {English (US)},
  keywords  = {Adaptive control of multi-agent systems, Data-driven control, Dynamic games, Intelligent robotics, Learning for control, Linear systems},
  abstract  = {Guided cooperation allows intelligent agents with heterogeneous capabilities to work together by following a leader-follower type of interaction. However, the associated control problem becomes challenging when the leader agent does not have complete information about follower agents. There is a need for learning and adaptation of cooperation plans. To this end, we develop a meta-learning-based Stackelberg game-theoretic framework to address the challenges in the guided cooperative control for linear systems. We first formulate the guided cooperation between agents as a dynamic Stackelberg game and use the feedback Stackelberg equilibrium as the agent-wise cooperation strategy. We further leverage meta-learning to address the incomplete information of follower agents, where the leader agent learns a meta-response model from a prescribed set of followers offline and adapts to a new coming cooperation task with a small amount of learning data. We use a case study in robot teaming to corroborate the effectiveness of our framework. Comparison with other learning approaches also shows that our learned cooperation strategy provides better transferability for different cooperation tasks.},
  note      = {Publisher Copyright: Copyright {\textcopyright} 2023 The Authors. This is an open access article under the CC BY-NC-ND license (https://creativecommons.org/licenses/by-nc-nd/4.0/); 22nd IFAC World Congress ; Conference date: 09-07-2023 Through 14-07-2023},
}