{"status":"ok","message-type":"work","message-version":"1.0.0","message":{"indexed":{"date-parts":[[2025,12,4]],"date-time":"2025-12-04T18:51:10Z","timestamp":1764874270182,"version":"3.46.0"},"reference-count":54,"publisher":"Institute of Electrical and Electronics Engineers (IEEE)","issue":"1","license":[{"start":{"date-parts":[[2026,1,1]],"date-time":"2026-01-01T00:00:00Z","timestamp":1767225600000},"content-version":"vor","delay-in-days":0,"URL":"https:\/\/ieeexplore.ieee.org\/Xplorehelp\/downloads\/license-information\/IEEE.html"},{"start":{"date-parts":[[2026,1,1]],"date-time":"2026-01-01T00:00:00Z","timestamp":1767225600000},"content-version":"stm-asf","delay-in-days":0,"URL":"https:\/\/doi.org\/10.15223\/policy-029"},{"start":{"date-parts":[[2026,1,1]],"date-time":"2026-01-01T00:00:00Z","timestamp":1767225600000},"content-version":"stm-asf","delay-in-days":0,"URL":"https:\/\/doi.org\/10.15223\/policy-037"}],"funder":[{"name":"National Key Research and Development Program of China","award":["2024YFC3308200"],"award-info":[{"award-number":["2024YFC3308200"]}]},{"DOI":"10.13039\/501100001809","name":"National Natural Science Foundation of China","doi-asserted-by":"publisher","award":["62525606","62406303"],"award-info":[{"award-number":["62525606","62406303"]}],"id":[{"id":"10.13039\/501100001809","id-type":"DOI","asserted-by":"publisher"}]},{"DOI":"10.13039\/501100003995","name":"Natural Science Foundation of Anhui Province","doi-asserted-by":"publisher","award":["2308085MG226","2308085QF229"],"award-info":[{"award-number":["2308085MG226","2308085QF229"]}],"id":[{"id":"10.13039\/501100003995","id-type":"DOI","asserted-by":"publisher"}]},{"DOI":"10.13039\/501100012226","name":"Fundamental Research Funds for the Central Universities","doi-asserted-by":"publisher","id":[{"id":"10.13039\/501100012226","id-type":"DOI","asserted-by":"publisher"}]}],"content-domain":{"domain":[],"crossmark-restriction":false},"short-container-title":["IEEE Trans. on Mobile Comput."],"published-print":{"date-parts":[[2026,1]]},"DOI":"10.1109\/tmc.2025.3600533","type":"journal-article","created":{"date-parts":[[2025,8,19]],"date-time":"2025-08-19T18:17:54Z","timestamp":1755627474000},"page":"1122-1136","source":"Crossref","is-referenced-by-count":0,"title":["$\\pi$-eLight: Learning Interpretable Programmatic Policies for Effective Traffic Signal Control"],"prefix":"10.1109","volume":"25","author":[{"ORCID":"https:\/\/orcid.org\/0000-0002-6734-9085","authenticated-orcid":false,"given":"Yin","family":"Gu","sequence":"first","affiliation":[{"name":"State Key Laboratory of Cognitive Intelligence, University of Science and Technology of China, Hefei, China"}]},{"ORCID":"https:\/\/orcid.org\/0000-0001-5335-2470","authenticated-orcid":false,"given":"Kai","family":"Zhang","sequence":"additional","affiliation":[{"name":"State Key Laboratory of Cognitive Intelligence, University of Science and Technology of China, Hefei, China"}]},{"ORCID":"https:\/\/orcid.org\/0000-0001-6956-5550","authenticated-orcid":false,"given":"Qi","family":"Liu","sequence":"additional","affiliation":[{"name":"State Key Laboratory of Cognitive Intelligence, University of Science and Technology of China, Hefei, China"}]},{"given":"Haojie","family":"Yuan","sequence":"additional","affiliation":[{"name":"University of Science and Technology of China, Hefei, China"}]},{"ORCID":"https:\/\/orcid.org\/0000-0003-4080-2377","authenticated-orcid":false,"given":"Runlong","family":"Yu","sequence":"additional","affiliation":[{"name":"Department of Computer Science, University of Pittsburgh, Pittsburgh, PA, USA"}]}],"member":"263","reference":[{"key":"ref1","doi-asserted-by":"publisher","DOI":"10.1109\/TITS.2024.3462153"},{"key":"ref2","doi-asserted-by":"publisher","DOI":"10.1057\/jors.1963.61"},{"key":"ref3","doi-asserted-by":"publisher","DOI":"10.1007\/978-1-4471-5113-5_3"},{"article-title":"SCATS, sydney co-ordinated adaptive traffic system: A traffic responsive method of controlling urban traffic","year":"1990","author":"Lowrie","key":"ref4"},{"key":"ref5","first-page":"21","article-title":"Coordinated deep reinforcement learners for traffic light control","volume-title":"Proc. Learn. Inference Control Multi-Agent Syst.","author":"Van der Pol"},{"key":"ref6","doi-asserted-by":"publisher","DOI":"10.1145\/3219819.3220096"},{"key":"ref7","doi-asserted-by":"publisher","DOI":"10.1609\/aaai.v34i04.5744"},{"key":"ref8","doi-asserted-by":"publisher","DOI":"10.1049\/iet-its.2017.0153"},{"key":"ref9","first-page":"4079","article-title":"Attendlight: Universal attention-based reinforcement learning model for traffic signal control","volume-title":"Proc. Adv. Neural Inf. Process. Syst.","author":"Oroojlooy"},{"key":"ref10","doi-asserted-by":"publisher","DOI":"10.1145\/3357384.3357902"},{"key":"ref11","doi-asserted-by":"publisher","DOI":"10.1109\/TMC.2020.3033782"},{"key":"ref12","doi-asserted-by":"publisher","DOI":"10.1109\/TMC.2023.3332081"},{"key":"ref13","doi-asserted-by":"publisher","DOI":"10.24963\/ijcai.2020\/345"},{"key":"ref14","doi-asserted-by":"publisher","DOI":"10.1109\/TMC.2022.3233879"},{"key":"ref15","doi-asserted-by":"publisher","DOI":"10.1016\/c2017-0-02878-1"},{"key":"ref16","doi-asserted-by":"publisher","DOI":"10.1038\/s42256-019-0048-x"},{"key":"ref17","doi-asserted-by":"publisher","DOI":"10.1109\/TMC.2023.3297026"},{"article-title":"Deep compression: Compressing deep neural networks with pruning, trained quantization and Huffman coding","volume-title":"Proc. Int. Conf. Learn. Representations","author":"Han","key":"ref18"},{"article-title":"Quantizing deep convolutional networks for efficient inference: A whitepaper","year":"2018","author":"Krishnamoorthi","key":"ref19"},{"key":"ref20","doi-asserted-by":"publisher","DOI":"10.1007\/978-1-4614-6243-9_2"},{"key":"ref21","doi-asserted-by":"publisher","DOI":"10.1609\/aaai.v38i19.30103"},{"key":"ref22","doi-asserted-by":"publisher","DOI":"10.1145\/3357384.3357900"},{"key":"ref23","first-page":"88","article-title":"Learning an interpretable traffic signal control policy","volume-title":"Proc. 19th Int. Conf. Auton. Agents MultiAgent Syst.","author":"Ault"},{"key":"ref24","doi-asserted-by":"publisher","DOI":"10.1038\/nature14236"},{"key":"ref25","doi-asserted-by":"publisher","DOI":"10.1145\/3638529.3654037"},{"key":"ref26","doi-asserted-by":"publisher","DOI":"10.1145\/3690624.3709379"},{"key":"ref27","doi-asserted-by":"publisher","DOI":"10.1093\/cid\/ciad633"},{"journal-title":"Trans. Mach. Learn. Res","article-title":"Generating with confidence: Uncertainty quantification for black-box large language models","author":"Lin","key":"ref28"},{"key":"ref29","first-page":"13027","article-title":"EcoLight: Intersection control in developing regions under extreme budget and network constraints","volume-title":"Proc. Adv. Neural Inf. Process. Syst.","author":"Chauhan"},{"key":"ref30","doi-asserted-by":"publisher","DOI":"10.24963\/ijcai.2022\/555"},{"key":"ref31","doi-asserted-by":"publisher","DOI":"10.1109\/TVT.2024.3403879"},{"key":"ref32","doi-asserted-by":"publisher","DOI":"10.1109\/TITS.2024.3377106"},{"article-title":"X-light: Cross-city traffic signal control using transformer on transformer as meta multi-agent reinforcement learner","year":"2024","author":"Jiang","key":"ref33"},{"key":"ref34","doi-asserted-by":"publisher","DOI":"10.1609\/aaai.v34i01.5467"},{"key":"ref35","doi-asserted-by":"publisher","DOI":"10.1145\/3340531.3411859"},{"key":"ref36","doi-asserted-by":"publisher","DOI":"10.1007\/s10994-024-06543-w"},{"key":"ref37","first-page":"503","article-title":"Tree-based batch mode reinforcement learning","volume":"6","author":"Ernst","year":"2005","journal-title":"J. Mach. Learn. Res."},{"article-title":"Verifiable reinforcement learning via policy extraction","volume-title":"Proc. Adv. Neural Inf. Process. Syst.","author":"Bastani","key":"ref38"},{"key":"ref39","doi-asserted-by":"publisher","DOI":"10.1609\/aaai.v34i06.6587"},{"key":"ref40","first-page":"5045","article-title":"Programmatically interpretable reinforcement learning","volume-title":"Proc. Int. Conf. Mach. Learn.","author":"Verma"},{"article-title":"Imitation-projected programmatic reinforcement learning","volume-title":"Proc. Adv. Neural Inf. Process. Syst.","author":"Verma","key":"ref41"},{"key":"ref42","first-page":"5979","article-title":"Discovering symbolic policies with deep reinforcement learning","volume-title":"Proc. Int. Conf. Mach. Learn.","author":"Landajuela"},{"key":"ref43","first-page":"25146","article-title":"Learning to synthesize programs as interpretable and generalizable policies","volume-title":"Proc. Adv. Neural Inf. Process. Syst.","author":"Trivedi"},{"article-title":"Programmatic reinforcement learning without Oracles","volume-title":"Proc. 10th Int. Conf. Learn. Representations","author":"Qiu","key":"ref44"},{"key":"ref45","doi-asserted-by":"publisher","DOI":"10.15607\/RSS.2022.XVIII.068"},{"key":"ref46","doi-asserted-by":"publisher","DOI":"10.1145\/3447556.3447565"},{"key":"ref47","doi-asserted-by":"publisher","DOI":"10.1007\/978-3-540-75538-8_7"},{"key":"ref48","doi-asserted-by":"publisher","DOI":"10.1038\/nature24270"},{"key":"ref49","doi-asserted-by":"publisher","DOI":"10.1038\/s41586-022-05172-4"},{"key":"ref50","doi-asserted-by":"publisher","DOI":"10.1007\/11871842_29"},{"key":"ref51","first-page":"2951","article-title":"Practical Bayesian optimization of machine learning algorithms","volume-title":"Proc. Adv. Neural Inf. Process. Syst.","author":"Snoek"},{"key":"ref52","doi-asserted-by":"publisher","DOI":"10.1145\/3308558.3314139"},{"article-title":"Soft actor-critic algorithms and applications","year":"2018","author":"Haarnoja","key":"ref53"},{"key":"ref54","doi-asserted-by":"publisher","DOI":"10.1145\/3603171"}],"container-title":["IEEE Transactions on Mobile Computing"],"original-title":[],"link":[{"URL":"http:\/\/xplorestaging.ieee.org\/ielx8\/7755\/11275706\/11130361.pdf?arnumber=11130361","content-type":"unspecified","content-version":"vor","intended-application":"similarity-checking"}],"deposited":{"date-parts":[[2025,12,4]],"date-time":"2025-12-04T18:39:38Z","timestamp":1764873578000},"score":1,"resource":{"primary":{"URL":"https:\/\/ieeexplore.ieee.org\/document\/11130361\/"}},"subtitle":[],"short-title":[],"issued":{"date-parts":[[2026,1]]},"references-count":54,"journal-issue":{"issue":"1"},"URL":"https:\/\/doi.org\/10.1109\/tmc.2025.3600533","relation":{},"ISSN":["1536-1233","1558-0660","2161-9875"],"issn-type":[{"type":"print","value":"1536-1233"},{"type":"electronic","value":"1558-0660"},{"type":"electronic","value":"2161-9875"}],"subject":[],"published":{"date-parts":[[2026,1]]}}}