{"status":"ok","message-type":"work","message-version":"1.0.0","message":{"indexed":{"date-parts":[[2026,4,25]],"date-time":"2026-04-25T10:24:45Z","timestamp":1777112685266,"version":"3.51.4"},"reference-count":53,"publisher":"Springer Science and Business Media LLC","issue":"13","license":[{"start":{"date-parts":[[2025,8,1]],"date-time":"2025-08-01T00:00:00Z","timestamp":1754006400000},"content-version":"tdm","delay-in-days":0,"URL":"https:\/\/www.springernature.com\/gp\/researchers\/text-and-data-mining"},{"start":{"date-parts":[[2025,8,1]],"date-time":"2025-08-01T00:00:00Z","timestamp":1754006400000},"content-version":"vor","delay-in-days":0,"URL":"https:\/\/www.springernature.com\/gp\/researchers\/text-and-data-mining"}],"content-domain":{"domain":["link.springer.com"],"crossmark-restriction":false},"short-container-title":["Appl Intell"],"published-print":{"date-parts":[[2025,8]]},"DOI":"10.1007\/s10489-025-06758-x","type":"journal-article","created":{"date-parts":[[2025,8,26]],"date-time":"2025-08-26T13:45:10Z","timestamp":1756215910000},"update-policy":"https:\/\/doi.org\/10.1007\/springer_crossmark_policy","source":"Crossref","is-referenced-by-count":3,"title":["Multi-agent neighborhood coordinated and holistic optimized actor-critic framework for adaptive traffic signal control"],"prefix":"10.1007","volume":"55","author":[{"ORCID":"https:\/\/orcid.org\/0009-0008-3755-6279","authenticated-orcid":false,"given":"Qi","family":"Deng","sequence":"first","affiliation":[]},{"given":"Lijun","family":"Wu","sequence":"additional","affiliation":[]},{"given":"Zhiyuan","family":"Li","sequence":"additional","affiliation":[]},{"given":"Kaile","family":"Su","sequence":"additional","affiliation":[]},{"given":"Wei","family":"Wu","sequence":"additional","affiliation":[]},{"given":"Weiwei","family":"Duan","sequence":"additional","affiliation":[]}],"member":"297","published-online":{"date-parts":[[2025,8,26]]},"reference":[{"key":"6758_CR1","doi-asserted-by":"crossref","unstructured":"Haddad TA, Hedjazi D, Aouag S (2022) A deep reinforcement learning-based cooperative approach for multi-intersection traffic signal control. Eng Appl Artif Intell 114","DOI":"10.1016\/j.engappai.2022.105019"},{"key":"6758_CR2","volume-title":"Traffic signal timing manual","author":"P Koonce","year":"2008","unstructured":"Koonce P, Rodegerdts L (2008) Traffic signal timing manual. United States. Federal Highway Administration, Technical report"},{"key":"6758_CR3","unstructured":"Hunt P, Robertson D, Bretherton R, Royle MC (1982) The scoot on-line traffic signal optimisation technique. Traffic Eng Control 23(4)"},{"key":"6758_CR4","unstructured":"PR L (1992) Scats: A traffic responsive method of controlling urban traffic control\/pr lowrie. Roads and Traffic Authority"},{"key":"6758_CR5","doi-asserted-by":"publisher","first-page":"177","DOI":"10.1016\/j.trc.2013.08.014","volume":"36","author":"P Varaiya","year":"2013","unstructured":"Varaiya P (2013) Max pressure control of a network of signalized intersections. Transp Res Part C Emerging Technol 36:177\u2013195","journal-title":"Transp Res Part C Emerging Technol"},{"key":"6758_CR6","doi-asserted-by":"crossref","unstructured":"Cools SB, Gershenson C, D\u2019Hooghe B (2013) Self-organizing traffic lights: A realistic simulation. Adv Appl Self-organizing Syst 45\u201355","DOI":"10.1007\/978-1-4471-5113-5_3"},{"issue":"7","key":"6758_CR7","doi-asserted-by":"publisher","first-page":"6774","DOI":"10.1109\/TITS.2021.3062072","volume":"23","author":"M Wang","year":"2021","unstructured":"Wang M, Wu L, Li J, He L (2021) Traffic signal control with reinforcement learning based on region-aware cooperative strategy. IEEE Trans Intell Transp Syst 23(7):6774\u20136785","journal-title":"IEEE Trans Intell Transp Syst"},{"key":"6758_CR8","doi-asserted-by":"crossref","unstructured":"Wu Q, Wu J, Shen J, Du B, Telikani A, Fahmideh M, Liang C (2022) Distributed agent-based deep reinforcement learning for large scale traffic signal control. Knowl-Based Syst 241","DOI":"10.1016\/j.knosys.2022.108304"},{"issue":"3","key":"6758_CR9","doi-asserted-by":"publisher","first-page":"1086","DOI":"10.1109\/TITS.2019.2901791","volume":"21","author":"T Chu","year":"2019","unstructured":"Chu T, Wang J, Codec\u00e0 L, Li Z (2019) Multi-agent deep reinforcement learning for large-scale traffic signal control. IEEE Trans Intell TranspSyst 21(3):1086\u20131095","journal-title":"IEEE Trans Intell TranspSyst"},{"key":"6758_CR10","first-page":"4079","volume":"33","author":"A Oroojlooy","year":"2020","unstructured":"Oroojlooy A, Nazari M, Hajinezhad D, Silva J (2020) Attendlight: Universal attention-based reinforcement learning model for traffic signal control. Adv Neural Inf Process Syst 33:4079\u20134090","journal-title":"Adv Neural Inf Process Syst"},{"key":"6758_CR11","unstructured":"Chenguang Z, Xiaorong H, Gang W (2021) Prglight: A novel traffic light control framework with pressurebased-reinforcement learning and graph neural network. In: In IJCAI 2021 reinforcement learning for intelligent transportation systems (RL4ITS) Workshop Virtual Aug"},{"key":"6758_CR12","doi-asserted-by":"publisher","first-page":"732","DOI":"10.1016\/j.trc.2017.09.020","volume":"85","author":"M Aslani","year":"2017","unstructured":"Aslani M, Mesgari MS, Wiering M (2017) Adaptive traffic signal control with actor-critic methods in a real-world traffic network with different traffic disruption events. Transp Res Part C Emerging Technol 85:732\u2013752","journal-title":"Transp Res Part C Emerging Technol"},{"issue":"1","key":"6758_CR13","doi-asserted-by":"publisher","first-page":"11","DOI":"10.1109\/TITS.2020.3008612","volume":"23","author":"A Haydari","year":"2020","unstructured":"Haydari A, Y\u0131lmaz Y (2020) Deep reinforcement learning for intelligent transportation systems: A survey. IEEE Trans Intell Transp Syst 23(1):11\u201332","journal-title":"IEEE Trans Intell Transp Syst"},{"key":"6758_CR14","doi-asserted-by":"crossref","unstructured":"Wei H, Chen C, Zheng G, Wu K, Gayah V, Xu K, Li Z (2019) Presslight: Learning max pressure control to coordinate traffic signals in arterial network. In: Proceedings of the 25th ACM SIGKDD international conference on knowledge discovery & data mining, pp 1290\u20131298","DOI":"10.1145\/3292500.3330949"},{"key":"6758_CR15","doi-asserted-by":"crossref","unstructured":"Wei H, Xu N, Zhang H, Zheng G, Zang X, Chen C, Zhang W, Zhu Y, Xu K, Li Z (2019) Colight: Learning network-level cooperation for traffic signal control. In: Proceedings of the 28th ACM international conference on information and knowledge management, pp 1913\u20131922","DOI":"10.1145\/3357384.3357902"},{"key":"6758_CR16","doi-asserted-by":"crossref","unstructured":"Chen C, Wei H, Xu N, Zheng G, Yang M, Xiong Y, Xu K, Li Z (2020) Toward a thousand lights: Decentralized deep reinforcement learning for large-scale traffic signal control. In: Proceedings of the AAAI conference on artificial intelligence, vol 34, pp 3414\u20133421","DOI":"10.1609\/aaai.v34i04.5744"},{"key":"6758_CR17","unstructured":"Zhang L, Wu Q, Shen J, L\u00fc L, Du B, Wu J (2022) Expression might be enough: representing pressure and demand for reinforcement learning based traffic signal control. In: International conference on machine learning, PMLR, pp 26645\u201326654"},{"issue":"3","key":"6758_CR18","doi-asserted-by":"publisher","first-page":"3129","DOI":"10.1109\/TITS.2022.3229477","volume":"24","author":"F Mao","year":"2022","unstructured":"Mao F, Li Z, Lin Y, Li L (2022) Mastering arterial traffic signal control with multi-agent attention-based soft actor-critic model. IEEE Trans Intell Transp Syst 24(3):3129\u20133144","journal-title":"IEEE Trans Intell Transp Syst"},{"issue":"12","key":"6758_CR19","doi-asserted-by":"publisher","first-page":"25157","DOI":"10.1109\/TITS.2022.3173490","volume":"23","author":"C Zhang","year":"2022","unstructured":"Zhang C, Tian Y, Zhang Z, Xue W, Xie X, Yang T, Ge X, Chen R (2022) Neighborhood cooperative multiagent reinforcement learning for adaptive traffic signal control in epidemic regions. IEEE Trans Intell Transp Syst 23(12):25157\u201325168","journal-title":"IEEE Trans Intell Transp Syst"},{"key":"6758_CR20","doi-asserted-by":"crossref","unstructured":"Fang J, You Y, Xu M, Wang J, Cai S (2023) Multi-objective traffic signal control using network-wide agent coordinated reinforcement learning. Expert Syst Appl 120535","DOI":"10.1016\/j.eswa.2023.120535"},{"key":"6758_CR21","doi-asserted-by":"crossref","unstructured":"Ren F, Dong W, Zhao X, Zhang F, Kong Y, Yang Q (2024) Two-layer coordinated reinforcement learning for traffic signal control in traffic network. Expert Syst Appl 235","DOI":"10.1016\/j.eswa.2023.121111"},{"key":"6758_CR22","doi-asserted-by":"publisher","first-page":"128","DOI":"10.1016\/j.future.2021.04.018","volume":"123","author":"Y Zhang","year":"2021","unstructured":"Zhang Y, Zhou Y, Lu H, Fujita H (2021) Cooperative multi-agent actor\u2013critic control of traffic network flow based on edge computing. Futur Gener Comput Syst 123:128\u2013141","journal-title":"Futur Gener Comput Syst"},{"issue":"1","key":"6758_CR23","doi-asserted-by":"publisher","first-page":"174","DOI":"10.1109\/TCYB.2020.3015811","volume":"51","author":"X Wang","year":"2021","unstructured":"Wang X, Ke L, Qiao Z, Chai X (2021) Large-scale traffic signal control using a novel multiagent reinforcement learning. IEEE Trans Cybern 51(1):174\u2013187","journal-title":"IEEE Trans Cybern"},{"issue":"6","key":"6758_CR24","doi-asserted-by":"publisher","first-page":"2687","DOI":"10.1109\/TCYB.2019.2904742","volume":"50","author":"T Tan","year":"2020","unstructured":"Tan T, Bao F, Deng Y, Jin A, Dai Q, Wang J (2020) Cooperative deep reinforcement learning for large-scale traffic grid signal control. IEEE Trans Cybern 50(6):2687\u20132700","journal-title":"IEEE Trans Cybern"},{"key":"6758_CR25","doi-asserted-by":"crossref","unstructured":"Li Z, Wu L, Su K, Wu W, Jing Y, Wu T, Duan W, Yue X, Tong X, Han Y (2024) Coordination as inference in multi-agent reinforcement learning. Neural Netw 172","DOI":"10.1016\/j.neunet.2024.106101"},{"key":"6758_CR26","doi-asserted-by":"crossref","unstructured":"Valiente R, Razzaghpour M, Toghi B, Shah G, Fallah YP (2023) Prediction-aware and reinforcement learning-based altruistic cooperative driving. IEEE Trans Intell Transp Syst","DOI":"10.1109\/TITS.2023.3323440"},{"key":"6758_CR27","unstructured":"Wu Q, Zhang L, Shen J, L\u00fc L, Du B, Wu J (2021) Efficient pressure: Improving efficiency for signalized intersections. arXiv preprint arXiv:2112.02336"},{"key":"6758_CR28","doi-asserted-by":"crossref","unstructured":"Cheng W, Shen Y, Zhu Y, Huang L (2018) A neural attention model for urban air quality inference: Learning the weights of monitoring stations. In: Proceedings of the AAAI conference on artificial intelligence, vol 32","DOI":"10.1609\/aaai.v32i1.11871"},{"key":"6758_CR29","unstructured":"Jiang J, Dun C, Huang T, Lu Z (2018) Graph convolutional reinforcement learning. arXiv preprint arXiv:1810.09202"},{"key":"6758_CR30","unstructured":"Yao H, Tang X, Wei H, Zheng G, Yu Y, Li Z (2018) Modeling spatial-temporal dynamics for traffic prediction. 1(9). arXiv preprint arXiv:1803.01254"},{"key":"6758_CR31","doi-asserted-by":"crossref","unstructured":"Rahmani S, Baghbani A, Bouguila N, Patterson Z (2023) Graph neural networks for intelligent transportation systems: A survey. IEEE Trans Intell Transp Syst","DOI":"10.1109\/TITS.2023.3257759"},{"key":"6758_CR32","unstructured":"Schulman J, Wolski F, Dhariwal P, Radford A, Klimov O (2017) Proximal policy optimization algorithms. arXiv preprint arXiv:1707.06347"},{"key":"6758_CR33","first-page":"24611","volume":"35","author":"C Yu","year":"2022","unstructured":"Yu C, Velu A, Vinitsky E, Gao J, Wang Y, Bayen A, Wu Y (2022) The surprising effectiveness of ppo in cooperative multi-agent games. Adv Neural Inf Process Syst 35:24611\u201324624","journal-title":"Adv Neural Inf Process Syst"},{"key":"6758_CR34","unstructured":"Yang Y, Luo R, Li M, Zhou M, Zhang W, Wang J (2018) Mean field multi-agent reinforcement learning. In: International conference on machine learning, PMLR, pp 5571\u20135580"},{"key":"6758_CR35","unstructured":"Guo X, Hu A, Xu R, Zhang J (2019) Learning mean-field games. In: Wallach HM, Larochelle H, Beygelzimer A, d\u2019Alch\u00e9-Buc F, Fox EB, Garnett R (eds) Advances in neural information processing systems 32: Annual conference on neural information processing systems 2019 NeurIPS, 2019 December 8-14 2019 Vancouver BC Canada, pp 4967\u20134977"},{"key":"6758_CR36","doi-asserted-by":"crossref","unstructured":"Gu H, Guo X, Wei X, Xu R (2024) Mean-field multiagent reinforcement learning: A decentralized network approach. Math Oper Res","DOI":"10.1287\/moor.2022.0055"},{"issue":"9","key":"6758_CR37","doi-asserted-by":"publisher","first-page":"1715","DOI":"10.1049\/itr2.12364","volume":"17","author":"T Hu","year":"2023","unstructured":"Hu T, Hu Z, Lu Z, Wen X (2023) Dynamic traffic signal control using mean field multi-agent reinforcement learning in large scale road-networks. IET Intel Transport Syst 17(9):1715\u20131728","journal-title":"IET Intel Transport Syst"},{"issue":"22","key":"6758_CR38","doi-asserted-by":"publisher","first-page":"4686","DOI":"10.3390\/electronics12224686","volume":"12","author":"Z Zhang","year":"2023","unstructured":"Zhang Z, Zhang W, Liu Y, Xiong G (2023) Mean field multi-agent reinforcement learning method for area traffic signal control. Electron 12(22):4686","journal-title":"Electron"},{"issue":"20","key":"6758_CR39","first-page":"10","volume":"1050","author":"P Velickovic","year":"2017","unstructured":"Velickovic P, Cucurull G, Casanova A, Romero A, Lio P, Bengio Y et al (2017) Graph attention networks. Stat 1050(20):10\u201348550","journal-title":"Graph attention networks. Stat"},{"key":"6758_CR40","doi-asserted-by":"crossref","unstructured":"Wei H, Zheng G, Yao H, Li Z (2018) Intellilight: A reinforcement learning approach for intelligent traffic light control. In: Proceedings of the 24th ACM SIGKDD international conference on knowledge discovery & data mining, pp 2496\u20132505","DOI":"10.1145\/3219819.3220096"},{"issue":"3","key":"6758_CR41","doi-asserted-by":"publisher","first-page":"278","DOI":"10.1061\/(ASCE)0733-947X(2003)129:3(278)","volume":"129","author":"B Abdulhai","year":"2003","unstructured":"Abdulhai B, Pringle R, Karakoulas GJ (2003) Reinforcement learning for true adaptive traffic signal control. J Transp Eng 129(3):278\u2013285","journal-title":"J Transp Eng"},{"issue":"2","key":"6758_CR42","doi-asserted-by":"publisher","first-page":"128","DOI":"10.1049\/iet-its.2009.0070","volume":"4","author":"I Arel","year":"2010","unstructured":"Arel I, Liu C, Urbanik T, Kohls AG (2010) Reinforcement learning-based multi-agent system for network traffic signal control. IET Intel Transport Syst 4(2):128\u2013135","journal-title":"IET Intel Transport Syst"},{"key":"6758_CR43","doi-asserted-by":"crossref","unstructured":"Mnih V, Kavukcuoglu K, Silver D, Rusu AA, Veness J, Bellemare MG, Graves A, Riedmiller M, Fidjeland AK, Ostrovski G et al (2015) Human-level control through deep reinforcement learning. Nat 518(7540):529\u2013533","DOI":"10.1038\/nature14236"},{"key":"6758_CR44","doi-asserted-by":"crossref","unstructured":"Zheng G, Xiong Y, Zang X, Feng J, Wei H, Zhang H, Li Y, Xu K, Li Z (2019) Learning phase competition for traffic signal control. In: Proceedings of the 28th ACM international conference on information and knowledge management, pp 1963\u20131972","DOI":"10.1145\/3357384.3357900"},{"key":"6758_CR45","doi-asserted-by":"crossref","unstructured":"Wang T, Zhu Z, Zhang J, Tian J, Zhang W (2024) A large-scale traffic signal control algorithm based on multi-layer graph deep reinforcement learning. Transp Res Part C Emerging Technol 162","DOI":"10.1016\/j.trc.2024.104582"},{"key":"6758_CR46","doi-asserted-by":"crossref","unstructured":"Gu H, Wang S, Ma X, Jia D, Mao G, Lim EG, Wong CPR (2024) Large-scale traffic signal control using constrained network partition and adaptive deep reinforcement learning. IEEE Trans Intell Transp Syst","DOI":"10.1109\/TITS.2024.3352446"},{"key":"6758_CR47","unstructured":"Mnih V, Badia AP, Mirza M, Graves A, Lillicrap T, Harley T, Silver D, Kavukcuoglu K (2016) Asynchronous methods for deep reinforcement learning. In: International Conference on Machine Learning, PMLR, pp 1928\u20131937"},{"key":"6758_CR48","unstructured":"Haarnoja T, Zhou A, Abbeel P, Levine S (2018) Soft actor-critic: Off-policy maximum entropy deep reinforcement learning with a stochastic actor. In: International Conference on Machine Learning, PMLR, pp 1861\u20131870"},{"key":"6758_CR49","doi-asserted-by":"crossref","unstructured":"Wei W, Wu Q, Wu J, Du B, Shen J, Li T (2021) Multi-agent deep reinforcement learning for traffic signal control with nash equilibrium. In: 2021 IEEE 23rd Int Conf on high performance computing & communications; 7th int conf on data science & systems; 19th Int Conf on Smart City; 7th Int Conf on dependability in sensor cloud & big data systems & application (HPCC\/DSS\/SmartCity\/DependSys), pp 1435\u20131442","DOI":"10.1109\/HPCC-DSS-SmartCity-DependSys53884.2021.00215"},{"key":"6758_CR50","doi-asserted-by":"crossref","unstructured":"Zhang Y, Wang S, Ma X, Yue W, Jiang R (2023) Large-scale traffic signal control by a nash deep q-network approach. In: 2023 IEEE 26th international conference on intelligent transportation systems (ITSC), pp 4584\u20134591","DOI":"10.1109\/ITSC57777.2023.10422534"},{"issue":"1","key":"6758_CR51","first-page":"229","volume":"2","author":"J-M Lasry","year":"2007","unstructured":"Lasry J-M, Lions P-L (2007) Mean field games. JapanJ Math 2(1):229\u2013260","journal-title":"JapanJ Math"},{"key":"6758_CR52","unstructured":"Vaswani A, Shazeer N, Parmar N, Uszkoreit J, Jones L, Gomez AN, Kaiser L, Polosukhin I (2017) Attention is all you need. In: Advances in neural information processing systems 30: Annual conference on neural information processing systems, 2017 Long Beach CA USA, pp 5998\u20136008"},{"key":"6758_CR53","doi-asserted-by":"crossref","unstructured":"Mei H, Lei X, Da L, Shi B, Wei H (2023) Libsignal: an open library for traffic signal control. Mach Learn 1\u201337","DOI":"10.1007\/s10994-023-06412-y"}],"container-title":["Applied Intelligence"],"original-title":[],"language":"en","link":[{"URL":"https:\/\/link.springer.com\/content\/pdf\/10.1007\/s10489-025-06758-x.pdf","content-type":"application\/pdf","content-version":"vor","intended-application":"text-mining"},{"URL":"https:\/\/link.springer.com\/article\/10.1007\/s10489-025-06758-x\/fulltext.html","content-type":"text\/html","content-version":"vor","intended-application":"text-mining"},{"URL":"https:\/\/link.springer.com\/content\/pdf\/10.1007\/s10489-025-06758-x.pdf","content-type":"application\/pdf","content-version":"vor","intended-application":"similarity-checking"}],"deposited":{"date-parts":[[2025,9,27]],"date-time":"2025-09-27T14:33:50Z","timestamp":1758983630000},"score":1,"resource":{"primary":{"URL":"https:\/\/link.springer.com\/10.1007\/s10489-025-06758-x"}},"subtitle":[],"short-title":[],"issued":{"date-parts":[[2025,8]]},"references-count":53,"journal-issue":{"issue":"13","published-print":{"date-parts":[[2025,8]]}},"alternative-id":["6758"],"URL":"https:\/\/doi.org\/10.1007\/s10489-025-06758-x","relation":{},"ISSN":["0924-669X","1573-7497"],"issn-type":[{"value":"0924-669X","type":"print"},{"value":"1573-7497","type":"electronic"}],"subject":[],"published":{"date-parts":[[2025,8]]},"assertion":[{"value":"25 June 2025","order":1,"name":"accepted","label":"Accepted","group":{"name":"ArticleHistory","label":"Article History"}},{"value":"26 August 2025","order":2,"name":"first_online","label":"First Online","group":{"name":"ArticleHistory","label":"Article History"}},{"order":1,"name":"Ethics","group":{"name":"EthicsHeading","label":"Declarations"}},{"value":"The authors have no competing interests to declare that are relevant to the content of this article.","order":2,"name":"Ethics","group":{"name":"EthicsHeading","label":"Competing interests"}},{"value":"The authors confirm that they have complied with the publication ethics and state that this work is original and has not been used for publication anywhere before.","order":3,"name":"Ethics","group":{"name":"EthicsHeading","label":"Ethics approval"}}],"article-number":"933"}}