@inproceedings{6cb55a3de66c4e0d80610e435d8838ea,
title = "Safety-Constrained Reinforcement Learning Method for Urban Eco-Driving",
abstract = "Reinforcement Learning (RL) is used for eco-driving in Intelligent and Connected Vehicles (ICVs), but traditional methods face a critical trade-off. Ensuring safety often requires high penalty terms, leading to overly conservative policies that severely compromise energy and traffic efficiency. To resolve this conflict, this paper introduces the Twin Delayed Deep Deterministic Policy Gradient with Safelayer (TD3+Safelayer), a novel framework that decouples safety from performance objectives. The Safelayer module maps the TD3 policy's actions into a verifiably safe action space. SUMO simulations demonstrate that TD3+Safelayer eliminates all collision events present in the baseline models. While achieving this high level of safety, it also reduces energy consumption by 17.4\% and 30.7\% compared to traditional TD3 and rule-based strategies, respectively.",
keywords = "Eco-driving, Safe Reinforcement Learning, Safelayer, Urban Driving",
author = "Hongwen He and Jiaqi Li and Jingda Wu",
note = "Publisher Copyright: {\textcopyright} 2025 IEEE.; 2025 9th CAA International Conference on Vehicular Control and Intelligence, CVCI 2025 ; Conference date: 24-10-2025 Through 26-10-2025",
year = "2025",
doi = "10.1109/CVCI66304.2025.11348348",
language = "English",
series = "2025 9th CAA International Conference on Vehicular Control and Intelligence, CVCI 2025",
publisher = "Institute of Electrical and Electronics Engineers Inc.",
booktitle = "2025 9th CAA International Conference on Vehicular Control and Intelligence, CVCI 2025",
address = "United States",
}