@inproceedings{0376f5c461834dd7bf35d4eb0b3564e7,
title = "Weighted Mean-Field Multi-Agent Reinforcement Learning via Reward Attribution Decomposition",
abstract = "Existing MARL algorithms have low efficiency in many-agent scenarios due to the complex dynamic interaction when agents growing exponentially. Mean-field theory has been introduced to improve the scalability where complex interactions are approximated by those between a single agent and the mean effect from neighbors. However, only considering the averaged actions of neighborhood at last step and ignoring the dynamic influence of neighbors leads to unstable training procedures and sub-optimal solutions. In this paper, the Weighted Mean-Field Multi-Agent Reinforcement Learning via Reward Attribution Decomposition (MFRAD) framework is proposed by differentiating heterogeneous and hysteresis neighbor effect with weighted mean-field approximation and reward attribution decomposition. The multi-head attention is employed to calculate the weights which formulate the weighted mean-field Q-function. To further eliminate the impact of hysteresis information, reward attribution decomposition is integrated to decompose weighted mean-field Q-value, improving the interpretability of MFRAD and achieving fully decentralized execution without information exchanging. Two novel regularization terms are also introduced to guarantee the consistency of temporal relationship among agents and unambiguity of local Q-value with no agents. Numerical experiments on many-agent scenarios demonstrate the superior performance against existing baselines.",
keywords = "Multi-agent reinforcement learning, Reward attribution decomposition, Weighted mean-field approximation",
author = "Tingyu Wu and Wenhao Li and Bo Jin and Wei Zhang and Xiangfeng Wang",
note = "Publisher Copyright: {\textcopyright} 2022, The Author(s), under exclusive license to Springer Nature Switzerland AG.; International Workshops on BDMS, BDQM, GDMA, IWBT, MAQTDS, and PMBD 2022, held in conjunction with the 27th International Conference on Database Systems for Advanced Applications, DASFAA 2022 ; Conference date: 11-04-2022 Through 14-04-2022",
year = "2022",
doi = "10.1007/978-3-031-11217-1\_22",
language = "英语",
isbn = "9783031112164",
series = "Lecture Notes in Computer Science (including subseries Lecture Notes in Artificial Intelligence and Lecture Notes in Bioinformatics)",
publisher = "Springer Science and Business Media Deutschland GmbH",
pages = "301--316",
editor = "Rage, \{Uday Kiran\} and Vikram Goyal and Reddy, \{P. Krishna\}",
booktitle = "Database Systems for Advanced Applications. DASFAA 2022 International Workshops - BDMS, BDQM, GDMA, IWBT, MAQTDS, and PMBD, Proceedings",
address = "德国",
}