% Conference paper (ICCASM 2010) on a two-layer reinforcement learning
% algorithm for battlefield agent alliance decision-making.
% Cleanup applied to the exported record:
%   - author: literal \{...\} replaced by grouping braces; all names in "Last, First" form
%   - language: non-ASCII value replaced by "English"
%   - series: dropped, it was an exact duplicate of booktitle
% NOTE(review): pages "V1174--V1178" may be a mangled "V1-174--V1-178"
% (volume 1, pp. 174-178); confirm against the publisher record before changing.
@inproceedings{eb5f398103df476bb1e38fd72b909098,
  author    = {Xie, {Zhi Jun} and Dong, {Chao Yang} and Yang, Fei and Chen, Wei},
  title     = {Battlefield agent alliance decision-making two layer reinforcement learning algorithm},
  booktitle = {{ICCASM} 2010 - 2010 International Conference on Computer Application and System Modeling, Proceedings},
  pages     = {V1174--V1178},
  year      = {2010},
  doi       = {10.1109/ICCASM.2010.5619247},
  isbn      = {9781424472369},
  language  = {English},
  keywords  = {Agent alliance, Battlefield, Decision-making, Reinforcement learning},
  abstract  = {In the background of Agent Alliance combat deduction, here we present a Two Layer Reinforcement learning algorithm, referred to a TLRL algorithm, for the special requirements of battlefield simulation environment Agents offensive and defensive decision-making study. The algorithm model is classified into two layers: one is the global decision-making Agent, called Commandant Agent, learning from the environment as well as both enemies' and friends' actions, the other is the Servant Agents optimizing the action by receiving local environment feedback. Finally the war situation deduction which is carried out on the simulation platform TBS we set up, has showed the fast convergence and effectiveness of this algorithm.},
  note      = {2010 International Conference on Computer Application and System Modeling, ICCASM 2010 ; Conference date: 22-10-2010 Through 24-10-2010},
}