@Article{cmc.2023.041253,
AUTHOR = {Tengda Li, Gang Wang, Qiang Fu, Xiangke Guo, Minrui Zhao, Xiangyu Liu},
TITLE = {An Intelligent Algorithm for Solving Weapon-Target Assignment Problem: DDPG-DNPE Algorithm},
JOURNAL = {Computers, Materials \& Continua},
VOLUME = {76},
YEAR = {2023},
NUMBER = {3},
PAGES = {3499--3522},
URL = {http://www.techscience.com/cmc/v76n3/54375},
ISSN = {1546-2226},
ABSTRACT = {Aiming at the problems of traditional dynamic weapon-target assignment algorithms in command decision-making, such as large computational amount, slow solution speed, and low calculation accuracy, combined with deep reinforcement learning theory, an improved Deep Deterministic Policy Gradient algorithm with dual noise and prioritized experience replay is proposed, which uses a double noise mechanism to expand the search range of the action, and introduces a priority experience playback mechanism to effectively achieve data utilization. Finally, the algorithm is simulated and validated on the ground-to-air countermeasures digital battlefield. The results of the experiment show that, under the framework of the deep neural network for intelligent weapon-target assignment proposed in this paper, compared to the traditional RELU algorithm, the agent trained with reinforcement learning algorithms, such as Deep Deterministic Policy Gradient algorithm, Asynchronous Advantage Actor-Critic algorithm, Deep Q Network algorithm performs better. It shows that the use of deep reinforcement learning algorithms to solve the weapon-target assignment problem in the field of air defense operations is scientific. In contrast to other reinforcement learning algorithms, the agent trained by the improved Deep Deterministic Policy Gradient algorithm has a higher win rate and reward in confrontation, and the use of weapon resources is more efficient. It shows that the model and algorithm have certain superiority and rationality. The results of this paper provide new ideas for solving the problem of weapon-target assignment in air defense combat command decisions.},
DOI = {10.32604/cmc.2023.041253}
}