@inproceedings{df0f1a5fbe324abe9fc28acbfa01e268,
title = "Collaborative Guidance Algorithm Based on Offline Pre-training and Online Reinforcement Learning",
abstract = "In response to the common assumption of small angle relationships in existing collaborative guidance laws and the neglect of high-order terms in the remaining time expansion, this paper proposes a guidance law structure based on a combination of traditional guidance laws and collaborative correction terms, and uses reinforcement learning methods to train the correction terms. This article also constructs a guided pre training algorithm based on offline reinforcement learning algorithms, combined with the dual delay deep deterministic policy gradient algorithm. Through methods such as delayed updates and critical comparison, fast and efficient learning and training iterations are carried out, effectively solving the problem of overestimation of actions and policies in the reinforcement learning process. The simulation results show that the reinforcement learning collaborative guidance law trained by the designed framework has obvious advantages of wider applicability and higher time collaboration accuracy.",
keywords = "Collaborative guidance, Reinforcement learning, Time collaboration",
author = "Zhenrui Lv and Yifan Hu and Zijing Tian and Bin Fu and Hongguang Ren and Wenxing Fu",
note = "Publisher Copyright: {\textcopyright} Beijing HIWING Scientific and Technological Information Institute 2025.; 4th International Conference on Autonomous Unmanned Systems, ICAUS 2024 ; Conference date: 19-09-2024 Through 21-09-2024",
year = "2025",
doi = "10.1007/978-981-96-3568-9_42",
language = "英语",
isbn = "9789819635672",
series = "Lecture Notes in Electrical Engineering",
publisher = "Springer Science and Business Media Deutschland GmbH",
pages = "443--453",
editor = "Lianqing Liu and Yifeng Niu and Wenxing Fu and Yi Qu",
booktitle = "Proceedings of 4th 2024 International Conference on Autonomous Unmanned Systems, 4th ICAUS 2024",
}