@inproceedings{f5df300125144478a6eb57d5d8132079,
title = "H∞ optimal control of unknown linear discrete-time systems: An off-policy reinforcement learning approach",
abstract = "This paper proposes a model-free H∞ control design for linear discrete-time systems using reinforcement learning (RL). A novel off-policy RL algorithm is used to solve the game algebraic Riccati equation (GARE) online using the measured data along the system trajectories. The proposed RL algorithm has the following advantages compared to existing model-free RL methods for solving H∞ control problem: 1) It is data efficient and fast since a stream of experiences which is obtained from executing a fixed behavioral policy is reused to update many value functions correspond to different leaning policies sequentially. 2) The disturbance input does not need to be adjusted in a specific manner. 3) There is no bias as a result of adding a probing noise to the control input to maintain persistence of excitation conditions. A simulation example is used to verify the effectiveness of the proposed control scheme.",
keywords = "H control, game algebraic Riccati equation, off-policy, reinforcement learning",
author = "Bahare Kiumarsi and Hamidreza Modares and Lewis, {Frank L.} and Jiang, {Zhong Ping}",
note = "Publisher Copyright: {\textcopyright} 2015 IEEE.; 7th IEEE International Conference on Cybernetics and Intelligent Systems, CIS 2015 and the 7th IEEE International Conference on Robotics, Automation and Mechatronics, RAM 2015 ; Conference date: 15-07-2015 Through 17-07-2015",
year = "2015",
month = sep,
day = "23",
doi = "10.1109/ICCIS.2015.7274545",
language = "English (US)",
series = "Proceedings of the 2015 7th IEEE International Conference on Cybernetics and Intelligent Systems, CIS 2015 and Robotics, Automation and Mechatronics, RAM 2015",
publisher = "Institute of Electrical and Electronics Engineers Inc.",
pages = "41--46",
booktitle = "Proceedings of the 2015 7th IEEE International Conference on Cybernetics and Intelligent Systems, CIS 2015 and Robotics, Automation and Mechatronics, RAM 2015",
}