{"status":"ok","message-type":"work","message-version":"1.0.0","message":{"indexed":{"date-parts":[[2026,1,23]],"date-time":"2026-01-23T10:46:10Z","timestamp":1769165170781,"version":"3.49.0"},"reference-count":22,"publisher":"IEEE","license":[{"start":{"date-parts":[[2024,8,6]],"date-time":"2024-08-06T00:00:00Z","timestamp":1722902400000},"content-version":"stm-asf","delay-in-days":0,"URL":"https:\/\/doi.org\/10.15223\/policy-029"},{"start":{"date-parts":[[2024,8,6]],"date-time":"2024-08-06T00:00:00Z","timestamp":1722902400000},"content-version":"stm-asf","delay-in-days":0,"URL":"https:\/\/doi.org\/10.15223\/policy-037"}],"content-domain":{"domain":[],"crossmark-restriction":false},"short-container-title":[],"published-print":{"date-parts":[[2024,8,6]]},"DOI":"10.1109\/ccece59415.2024.10667211","type":"proceedings-article","created":{"date-parts":[[2024,9,12]],"date-time":"2024-09-12T17:42:46Z","timestamp":1726162966000},"page":"312-318","source":"Crossref","is-referenced-by-count":1,"title":["Sample-Efficient Meta-RL for Traffic Signal Control"],"prefix":"10.1109","author":[{"given":"Xingshuai","family":"Huang","sequence":"first","affiliation":[{"name":"McGill University,Canada"}]},{"given":"Di","family":"Wu","sequence":"additional","affiliation":[{"name":"McGill University,Canada"}]},{"given":"Michael","family":"Jenkin","sequence":"additional","affiliation":[{"name":"York University,Canada"}]},{"given":"Benoit","family":"Boulet","sequence":"additional","affiliation":[{"name":"McGill University,Canada"}]}],"member":"263","reference":[{"key":"ref1","doi-asserted-by":"publisher","DOI":"10.1145\/3219819.3220096"},{"key":"ref2","doi-asserted-by":"publisher","DOI":"10.1609\/aaai.v34i01.5467"},{"key":"ref3","doi-asserted-by":"publisher","DOI":"10.1609\/icaps.v30i1.6749"},{"key":"ref4","doi-asserted-by":"publisher","DOI":"10.1016\/j.trc.2022.103955"},{"key":"ref5","doi-asserted-by":"publisher","DOI":"10.1609\/aaai.v37i12.26729"},{"key":"ref6","first-page":"1126","article-title":"Model-agnostic meta-learning for fast adaptation of deep networks","volume-title":"International Conference on Machine Learning","author":"Finn"},{"key":"ref7","author":"Hafner","year":"2023","journal-title":"Mastering diverse domains through world models"},{"key":"ref8","article-title":"Transformers are sample efficient world models","volume-title":"International Conference on Learning Representations","author":"Micheli"},{"key":"ref9","doi-asserted-by":"publisher","DOI":"10.1016\/B978-1-55860-141-3.50030-4"},{"key":"ref10","author":"Qi","year":"2022","journal-title":"Random ensemble reinforcement learning for traffic signal control"},{"key":"ref11","doi-asserted-by":"publisher","DOI":"10.1109\/tkde.2022.3232711"},{"key":"ref12","doi-asserted-by":"publisher","DOI":"10.1109\/TMC.2022.3233879"},{"key":"ref13","doi-asserted-by":"publisher","DOI":"10.1561\/2200000086"},{"key":"ref14","article-title":"When to trust your model: Model-based policy optimization","volume":"32","author":"Janner","year":"2019","journal-title":"Advances in neural information processing systems"},{"key":"ref15","article-title":"Mastering atari with discrete world models","volume-title":"International Conference on Learning Representations","author":"Hafner"},{"key":"ref16","doi-asserted-by":"publisher","DOI":"10.48550\/ARXIV.1706.03762"},{"key":"ref17","author":"Robine","year":"2023","journal-title":"Transformer-based world models are happy with 100k interactions"},{"key":"ref18","doi-asserted-by":"publisher","DOI":"10.1038\/nature14236"},{"key":"ref19","author":"Zheng","year":"2019","journal-title":"Diagnosing reinforcement learning for traffic signal control"},{"key":"ref20","doi-asserted-by":"publisher","DOI":"10.1162\/neco.1997.9.8.1735"},{"key":"ref21","first-page":"617","article-title":"Model-based reinforcement learning via meta-policy optimization","volume-title":"Conference on Robot Learning","author":"Clavera"},{"key":"ref22","article-title":"Model-based reinforcement learning for atari","volume-title":"International Conference on Learning Representations","author":"Kaiser"}],"event":{"name":"2024 IEEE Canadian Conference on Electrical and Computer Engineering (CCECE)","location":"Kingston, ON, Canada","start":{"date-parts":[[2024,8,6]]},"end":{"date-parts":[[2024,8,9]]}},"container-title":["2024 IEEE Canadian Conference on Electrical and Computer Engineering (CCECE)"],"original-title":[],"link":[{"URL":"http:\/\/xplorestaging.ieee.org\/ielx8\/10667055\/10667056\/10667211.pdf?arnumber=10667211","content-type":"unspecified","content-version":"vor","intended-application":"similarity-checking"}],"deposited":{"date-parts":[[2024,9,13]],"date-time":"2024-09-13T05:15:12Z","timestamp":1726204512000},"score":1,"resource":{"primary":{"URL":"https:\/\/ieeexplore.ieee.org\/document\/10667211\/"}},"subtitle":[],"short-title":[],"issued":{"date-parts":[[2024,8,6]]},"references-count":22,"URL":"https:\/\/doi.org\/10.1109\/ccece59415.2024.10667211","relation":{},"subject":[],"published":{"date-parts":[[2024,8,6]]}}}