{"status":"ok","message-type":"work","message-version":"1.0.0","message":{"indexed":{"date-parts":[[2025,8,2]],"date-time":"2025-08-02T14:29:07Z","timestamp":1754144947843,"version":"3.41.2"},"reference-count":24,"publisher":"IEEE","license":[{"start":{"date-parts":[[2025,6,10]],"date-time":"2025-06-10T00:00:00Z","timestamp":1749513600000},"content-version":"stm-asf","delay-in-days":0,"URL":"https:\/\/doi.org\/10.15223\/policy-029"},{"start":{"date-parts":[[2025,6,10]],"date-time":"2025-06-10T00:00:00Z","timestamp":1749513600000},"content-version":"stm-asf","delay-in-days":0,"URL":"https:\/\/doi.org\/10.15223\/policy-037"}],"funder":[{"DOI":"10.13039\/100018693","name":"Horizon Europe","doi-asserted-by":"publisher","id":[{"id":"10.13039\/100018693","id-type":"DOI","asserted-by":"publisher"}]},{"DOI":"10.13039\/100018693","name":"Horizon Europe","doi-asserted-by":"publisher","id":[{"id":"10.13039\/100018693","id-type":"DOI","asserted-by":"publisher"}]}],"content-domain":{"domain":[],"crossmark-restriction":false},"short-container-title":[],"published-print":{"date-parts":[[2025,6,10]]},"DOI":"10.1109\/med64031.2025.11073233","type":"proceedings-article","created":{"date-parts":[[2025,7,15]],"date-time":"2025-07-15T17:39:58Z","timestamp":1752601198000},"page":"405-410","source":"Crossref","is-referenced-by-count":0,"title":["Hierarchical Reinforcement Learning for Optimal EV Charging: A Multi-Level Framework for Dynamic Pricing and Load Scheduling"],"prefix":"10.1109","author":[{"given":"Dimitrios G.","family":"Vamvakas","sequence":"first","affiliation":[{"name":"Informatics &amp; Telematics Institute (I.T.I.), Center for Research and Technology Hellas (CERTH),Greece"}]},{"given":"Christos D.","family":"Korkas","sequence":"additional","affiliation":[{"name":"Informatics &amp; Telematics Institute (I.T.I.), Center for Research and Technology Hellas (CERTH),Greece"}]},{"given":"Christos D.","family":"Tsaknakis","sequence":"additional","affiliation":[{"name":"Informatics &amp; Telematics Institute (I.T.I.), Center for Research and Technology Hellas (CERTH),Greece"}]},{"given":"Elias B.","family":"Kosmatopoulos","sequence":"additional","affiliation":[{"name":"Informatics &amp; Telematics Institute (I.T.I.), Center for Research and Technology Hellas (CERTH),Greece"}]}],"member":"263","reference":[{"key":"ref1","doi-asserted-by":"publisher","DOI":"10.1016\/j.egyr.2020.07.020"},{"key":"ref2","doi-asserted-by":"publisher","DOI":"10.3390\/en16145326"},{"key":"ref3","doi-asserted-by":"publisher","DOI":"10.1016\/j.buildenv.2021.107952"},{"key":"ref4","doi-asserted-by":"publisher","DOI":"10.1109\/MED.2012.6265820"},{"key":"ref5","doi-asserted-by":"publisher","DOI":"10.1109\/ACCESS.2020.3041180"},{"key":"ref6","doi-asserted-by":"publisher","DOI":"10.1109\/ICCA.2017.8003180"},{"key":"ref7","doi-asserted-by":"publisher","DOI":"10.1016\/j.ijepes.2022.108005"},{"key":"ref8","doi-asserted-by":"publisher","DOI":"10.1007\/978-3-031-08341-9_20"},{"key":"ref9","doi-asserted-by":"publisher","DOI":"10.1016\/j.eswa.2021.116285"},{"key":"ref10","doi-asserted-by":"publisher","DOI":"10.1109\/MED.2017.7984164"},{"key":"ref11","doi-asserted-by":"publisher","DOI":"10.1109\/SEGE.2013.6707934"},{"key":"ref12","doi-asserted-by":"publisher","DOI":"10.3390\/en17153694"},{"key":"ref13","doi-asserted-by":"publisher","DOI":"10.32657\/10356\/90191"},{"volume-title":"Reinforcement Learning: An Introduction.","year":"2018","author":"Sutton","key":"ref14"},{"issue":"3","key":"ref15","first-page":"729","article-title":"Reinforcement learning","volume":"12","author":"Wiering","year":"2012","journal-title":"Adaptation, learning, and optimization"},{"key":"ref16","doi-asserted-by":"publisher","DOI":"10.1109\/MED59994.2023.10185671"},{"key":"ref17","first-page":"21732","article-title":"Hierarchical reinforcement learning with timed subgoals","volume":"34","author":"Gurtler","year":"2021","journal-title":"Advances in Neural Information Processing Systems"},{"key":"ref18","doi-asserted-by":"publisher","DOI":"10.1145\/3453160"},{"key":"ref19","doi-asserted-by":"publisher","DOI":"10.1609\/aaai.v31i1.10916"},{"key":"ref20","article-title":"Hierarchical deep reinforcement learning: Integrating temporal abstraction and intrinsic motivation","volume":"29","author":"Kulkarni","year":"2016","journal-title":"Advances in neural information processing systems"},{"key":"ref21","article-title":"Data-efficient hierarchical reinforcement learning","volume":"31","author":"Nachum","year":"2018","journal-title":"Advances in neural information processing systems"},{"article-title":"Meta learning shared hierarchies","year":"2017","author":"Frans","key":"ref22"},{"issue":"268","key":"ref23","first-page":"1","article-title":"Stable-baselines3: Reliable reinforcement learning implementations","volume":"22","author":"Raffin","year":"2021","journal-title":"Journal of Machine Learning Research"},{"key":"ref24","first-page":"3540","article-title":"FeUdal networks for hierarchical reinforcement learning","volume-title":"Proceedings of the 34th International Conference on Machine Learning","volume":"70","author":"Vezhnevets"}],"event":{"name":"2025 33rd Mediterranean Conference on Control and Automation (MED)","start":{"date-parts":[[2025,6,10]]},"location":"Tangier, Morocco","end":{"date-parts":[[2025,6,13]]}},"container-title":["2025 33rd Mediterranean Conference on Control and Automation (MED)"],"original-title":[],"link":[{"URL":"http:\/\/xplorestaging.ieee.org\/ielx8\/11073126\/11073191\/11073233.pdf?arnumber=11073233","content-type":"unspecified","content-version":"vor","intended-application":"similarity-checking"}],"deposited":{"date-parts":[[2025,7,16]],"date-time":"2025-07-16T05:50:40Z","timestamp":1752645040000},"score":1,"resource":{"primary":{"URL":"https:\/\/ieeexplore.ieee.org\/document\/11073233\/"}},"subtitle":[],"short-title":[],"issued":{"date-parts":[[2025,6,10]]},"references-count":24,"URL":"https:\/\/doi.org\/10.1109\/med64031.2025.11073233","relation":{},"subject":[],"published":{"date-parts":[[2025,6,10]]}}}