% Conference paper in the CAV 2021 proceedings (series: Lecture Notes in Computer Science).
% Cleaned from an automated export: localized field values translated to English,
% stray escapes removed from the editor and doi fields, names in "Last, First" form.
% NOTE(review): address conventionally holds the publisher's city; the export only
% provided a country, so the country is kept here -- confirm the city and replace.
% NOTE(review): the series volume number is not present in the export -- add if known.
@inproceedings{e681015be5b94647986e4533a1c724b4,
  author    = {Yang, Zhengfeng and Zhang, Yidan and Lin, Wang and Zeng, Xia and Tang, Xiaochao and Zeng, Zhenbing and Liu, Zhiming},
  title     = {An Iterative Scheme of Safe Reinforcement Learning for Nonlinear Systems via Barrier Certificate Generation},
  booktitle = {Computer Aided Verification - 33rd International Conference, CAV 2021, Proceedings},
  editor    = {Silva, Alexandra and Leino, K. Rustan},
  series    = {Lecture Notes in Computer Science},
  pages     = {467--490},
  publisher = {Springer Science and Business Media Deutschland GmbH},
  address   = {Germany},
  year      = {2021},
  doi       = {10.1007/978-3-030-81685-8_22},
  isbn      = {9783030816841},
  language  = {English},
  keywords  = {Barrier certificates, Continuous dynamical systems, Formal verification, Safe reinforcement learning},
  abstract  = {In this paper, we propose a safe reinforcement learning approach to synthesize deep neural network (DNN) controllers for nonlinear systems subject to safety constraints. The proposed approach employs an iterative scheme where a learner and a verifier interact to synthesize safe DNN controllers. The learner trains a DNN controller via deep reinforcement learning, and the verifier certifies the learned controller through computing a maximal safe initial region and its corresponding barrier certificate, based on polynomial abstraction and bilinear matrix inequalities solving. Compared with the existing verification-in-the-loop synthesis methods, our iterative framework is a sequential synthesis scheme of controllers and barrier certificates, which can learn safe controllers with adaptive barrier certificates rather than user-defined ones. We implement the tool SRLBC and evaluate its performance over a set of benchmark examples. The experimental results demonstrate that our approach efficiently synthesizes safe DNN controllers even for a nonlinear system with dimension up to 12.},
  note      = {Publisher Copyright: {\textcopyright} 2021, The Author(s).; 33rd International Conference on Computer Aided Verification, CAV 2021 ; Conference date: 20-07-2021 Through 23-07-2021},
}