{"status":"ok","message-type":"work","message-version":"1.0.0","message":{"indexed":{"date-parts":[[2024,9,7]],"date-time":"2024-09-07T21:15:47Z","timestamp":1725743747809},"reference-count":22,"publisher":"IEEE","license":[{"start":{"date-parts":[[2021,7,26]],"date-time":"2021-07-26T00:00:00Z","timestamp":1627257600000},"content-version":"vor","delay-in-days":0,"URL":"https:\/\/ieeexplore.ieee.org\/Xplorehelp\/downloads\/license-information\/IEEE.html"},{"start":{"date-parts":[[2021,7,26]],"date-time":"2021-07-26T00:00:00Z","timestamp":1627257600000},"content-version":"stm-asf","delay-in-days":0,"URL":"https:\/\/doi.org\/10.15223\/policy-029"},{"start":{"date-parts":[[2021,7,26]],"date-time":"2021-07-26T00:00:00Z","timestamp":1627257600000},"content-version":"stm-asf","delay-in-days":0,"URL":"https:\/\/doi.org\/10.15223\/policy-037"}],"content-domain":{"domain":[],"crossmark-restriction":false},"short-container-title":[],"published-print":{"date-parts":[[2021,7,26]]},"DOI":"10.1109\/tsp52935.2021.9522612","type":"proceedings-article","created":{"date-parts":[[2021,8,30]],"date-time":"2021-08-30T23:12:50Z","timestamp":1630365170000},"page":"62-65","source":"Crossref","is-referenced-by-count":0,"title":["ReLight-WCTM: Multi-Agent Reinforcement Learning Approach for Traffic Light Control within a Realistic Traffic Simulation"],"prefix":"10.1109","author":[{"given":"Peter","family":"Palos","sequence":"first","affiliation":[]},{"given":"Arpad","family":"Huszak","sequence":"additional","affiliation":[]}],"member":"263","reference":[{"key":"ref10","article-title":"Deep reinforcement learning for coordination in traffic light control","author":"van der pol","year":"2016","journal-title":"Vrije University Amsterdam"},{"article-title":"Dueling network architectures for deep reinforcement learning","year":"2015","author":"wang","key":"ref11"},{"key":"ref12","doi-asserted-by":"publisher","DOI":"10.3390\/e21080773"},{"key":"ref13","article-title":"Learning from Delayed Rewards","author":"watkins","year":"1989","journal-title":"Cambridge University"},{"article-title":"Asynchronous Methods for Deep Reinforcement Learning","year":"2016","author":"mnih","key":"ref14"},{"article-title":"Playing Atari with Deep Reinforcement Learning","year":"2013","author":"mnih","key":"ref15"},{"key":"ref16","article-title":"Decentralized Multi-Agent Solutions in Traffic Management","author":"p\u00e1los","year":"2020","journal-title":"Budapest University of Technology and Economics"},{"key":"ref17","doi-asserted-by":"publisher","DOI":"10.1109\/TSMCC.2007.913919"},{"key":"ref18","doi-asserted-by":"publisher","DOI":"10.1109\/ITSC.2018.8569938"},{"key":"ref19","doi-asserted-by":"publisher","DOI":"10.1049\/iet-its.2017.0153"},{"key":"ref4","article-title":"Scats, sydney co-ordinated adaptive traffic system: A traffic responsive method of controlling urban traffic","author":"lowrie","year":"1990","journal-title":"Roads and Traffic Authority NSW"},{"key":"ref3","doi-asserted-by":"publisher","DOI":"10.1007\/978-1-4614-6243-9_2"},{"key":"ref6","doi-asserted-by":"publisher","DOI":"10.1109\/ITSC.2011.6083114"},{"key":"ref5","article-title":"SCOOT-a traffic responsive method of coordinating signals","author":"hunt","year":"1981","journal-title":"Transport Research Laboratory"},{"key":"ref8","first-page":"247","article-title":"Traffic signal timing via deep reinforcement learning","author":"li","year":"2016","journal-title":"IEEE\/CAA Journal of Automatica"},{"key":"ref7","doi-asserted-by":"publisher","DOI":"10.1109\/ITSC.2013.6728404"},{"key":"ref2","article-title":"Traffic Signal Timing Manual","author":"koonce","year":"2008","journal-title":"United States Federal Highway Administration"},{"journal-title":"Traffic Engineering","year":"2004","author":"roess","key":"ref1"},{"key":"ref9","doi-asserted-by":"crossref","DOI":"10.1609\/aaai.v30i1.10295","article-title":"Deep reinforcement learning with double q-learning","author":"van hasselt","year":"2016","journal-title":"Conference on Artificial Intelligence"},{"article-title":"Integrating independent and centralized multi-agent reinforcement learning for traffic signal network optimization","year":"2019","author":"zhang","key":"ref20"},{"article-title":"Reinforcement Learning for Traffic Optimization","year":"2016","author":"stevens","key":"ref22"},{"key":"ref21","doi-asserted-by":"publisher","DOI":"10.3141\/2355-02"}],"event":{"name":"2021 44th International Conference on Telecommunications and Signal Processing (TSP)","start":{"date-parts":[[2021,7,26]]},"location":"Brno, Czech Republic","end":{"date-parts":[[2021,7,28]]}},"container-title":["2021 44th International Conference on Telecommunications and Signal Processing (TSP)"],"original-title":[],"link":[{"URL":"http:\/\/xplorestaging.ieee.org\/ielx7\/9522010\/9522587\/09522612.pdf?arnumber=9522612","content-type":"unspecified","content-version":"vor","intended-application":"similarity-checking"}],"deposited":{"date-parts":[[2023,1,8]],"date-time":"2023-01-08T09:00:10Z","timestamp":1673168410000},"score":1,"resource":{"primary":{"URL":"https:\/\/ieeexplore.ieee.org\/document\/9522612\/"}},"subtitle":[],"short-title":[],"issued":{"date-parts":[[2021,7,26]]},"references-count":22,"URL":"https:\/\/doi.org\/10.1109\/tsp52935.2021.9522612","relation":{},"subject":[],"published":{"date-parts":[[2021,7,26]]}}}