@article{M859E8F4E, title = "Autonomous Driving Strategy for Bottleneck Traffic with Prioritized Experience Replay", journal = "The Journal of Korean Institute of Communications and Information Sciences", year = "2023", issn = "1226-4717", doi = "10.7840/kics.2023.48.6.690", author = "Chanin Eom, Dongsu Lee, Minhae Kwon", keywords = "Autonomous driving system, Bottleneck traffic, Deep reinforcement learning, Partially observable Markov decision process, Twin delayed deep deterministic policy gradient, Prioritized experience replay", abstract = "Recently, the demand for a higher level of autonomous driving technology in complex circumstances has increased. Deep reinforcement learning is gaining attention as a promising solution that enables instant decision-making based on high-dimensional state information. In this study, we propose a Partially Observable Markov Decision Process (POMDP) to train the autonomous driving policy that can successfully navigate bottleneck congestion. Furthermore, we suggest using the prioritized experience replay method in Twin Delayed Deep Deterministic Policy Gradient (TD3) to train the policy. As a result, we confirm that the vehicles trained with the prioritized experience replay method outperform the vehicles trained with the random experience replay method." }