@inproceedings{1c0a7cebbac24d53977755b8f0fa9114,
title = "Weighted Bootstrapped DQN: Efficient Exploration via Uncertainty Quantification",
abstract = "Uncertainty quantification is an essential method for sample-efficient deep reinforcement learning. There is a growing literature on uncertainty-based deep reinforcement learning algorithms, but many of the previous approaches failed to capture different sources of uncertainty. We highlight why this can be a crucial shortcoming for sample-efficient algorithms and provide a sophisticated analysis of the uncertainty in the interaction between agent and environment. Based on that, we propose Weighted Bootstrapped DQN, an exploration-efficient method that combines network ensembles and variance weighting. We use aleatoric uncertainty estimation together with epistemic uncertainty to improve the exploration ability of the algorithm. We prove that our new approach has a significant improvement in sample efficiency on different gym tasks, even compared with the previous state-of-the-art approaches.",
keywords = "Deep Reinforcement Learning, Exploration, Uncertainty Quantification",
author = "Jinhui Pang and Zicong Feng",
note = "Publisher Copyright: {\textcopyright} 2023 SPIE. All rights reserved.; 2023 International Conference on Algorithms, High Performance Computing, and Artificial Intelligence, AHPCAI 2023 ; Conference date: 18-08-2023 Through 19-08-2023",
year = "2023",
doi = "10.1117/12.3012024",
language = "English",
series = "Proceedings of SPIE - The International Society for Optical Engineering",
publisher = "SPIE",
editor = "Sandeep Saxena and Cairong Zhao",
booktitle = "International Conference on Algorithms, High Performance Computing, and Artificial Intelligence, AHPCAI 2023",
address = "United States",
}