% Conference paper from the 2023 China Automation Congress (CAC 2023).
% The citation key is the exporter-generated identifier and is kept as-is so
% existing citations keep resolving.
% The language value is normalised to ASCII "English", and the series field
% that merely repeated booktitle is dropped to avoid printing the title twice.
@inproceedings{757cf954bc4c4ed7b90d0f27807efb5e,
  author    = {Li, Xinting and Zhang, Shizhou and Lu, Yue and Dang, Kerry and Ran, Lingyan and Wang, Peng and Zhang, Yanning},
  title     = {Optimal Policy Replay: A Simple Method to Reduce Catastrophic Forgetting in Target Incremental Visual Navigation},
  booktitle = {Proceedings - 2023 China Automation Congress, {CAC} 2023},
  pages     = {9201--9206},
  year      = {2023},
  publisher = {Institute of Electrical and Electronics Engineers Inc.},
  doi       = {10.1109/CAC59555.2023.10450433},
  language  = {English},
  keywords  = {catastrophic forgetting, continual learning, reinforcement learning, visual navigation},
  abstract  = {Visual navigation is a critical task in robotics and artificial intelligence. In recent years, reinforcement learning-based approaches have gained popularity for visual navigation. However, existing methods lack flexibility in learning multiple navigation targets and suffer from catastrophic forgetting. To address these challenges, we propose a novel paradigm called 'target incremental visual navigation' and introduce a method called Optimal Policy Replay (OPR). Target incremental visual navigation aims to study the performance of visual navigation in continuous learning of navigation targets. OPR enables continuous learning of navigation targets without the need for relearning all targets. Our method divides the learning process into on-policy and off-policy stages and stores only the optimal experiences in memory. Experimental results show that OPR effectively alleviates catastrophic forgetting and achieves good performance with a small memory size.},
  note      = {Publisher Copyright: {\textcopyright} 2023 IEEE. 2023 China Automation Congress, CAC 2023; Conference date: 17-11-2023 through 19-11-2023},
}