@inproceedings{b18341945ac24c2dbf43b901d1d923e7,
title = "A Deep Reinforcement Learning Method with Action Switching for Autonomous Navigation",
abstract = "Stochastic policy-based deep reinforcement learning (DRL) has successfully gained the widespread application but demands plenty of stochastic exploration to learn the environment at the initial training stage. When the agent is exposed to more complex environment, not only is the methodology inefficient, but its performance may also suffer from the issue of high variance. This paper develops a framework to accelerate the training procedure and reduce the variance by introducing a stochastic switching network, which specifically allows the agent to choose between heuristic actions and actions output by proximal policy optimization (PPO) algorithm. Instead of starting from the random actions, the agent can be effectively guided by the heuristic actions so that the navigation capability of the agent can be rapidly bootstrapped. The vanilla policy gradient (VPG) algorithm is further utilized to train the switching network, which can be jointly trained with the baseline PPO. By the experimental comparison with the baseline PPO in the customized maze environment with openAI Gym toolkit, our method greatly contributes to the more efficient execution of navigation task by means of the heuristic actions for guidance.",
keywords = "Robot navigation, Vanilla policy gradient (VPG), action switching, deep reinforcement learning (DRL), proximal policy optimization (PPO)",
author = "Zuowei Wang and Xiaozhong Liao and Fengdi Zhang and Min Xu and Yanmin Liu and Xiangdong Liu and Xi Zhang and Dong, {Rui Wei} and Zhen Li",
note = "Publisher Copyright: {\textcopyright} 2021 Technical Committee on Control Theory, Chinese Association of Automation.; 40th Chinese Control Conference, CCC 2021 ; Conference date: 26-07-2021 Through 28-07-2021",
year = "2021",
month = jul,
day = "26",
doi = "10.23919/CCC52363.2021.9549631",
language = "English",
series = "Chinese Control Conference, CCC",
publisher = "IEEE Computer Society",
pages = "3491--3496",
editor = "Chen Peng and Jian Sun",
booktitle = "Proceedings of the 40th Chinese Control Conference, CCC 2021",
address = "United States",
}