{"status":"ok","message-type":"work","message-version":"1.0.0","message":{"indexed":{"date-parts":[[2026,5,16]],"date-time":"2026-05-16T04:34:43Z","timestamp":1778906083939,"version":"3.51.4"},"reference-count":59,"publisher":"Springer Science and Business Media LLC","issue":"7","license":[{"start":{"date-parts":[[2023,5,15]],"date-time":"2023-05-15T00:00:00Z","timestamp":1684108800000},"content-version":"tdm","delay-in-days":0,"URL":"https:\/\/www.springernature.com\/gp\/researchers\/text-and-data-mining"},{"start":{"date-parts":[[2023,5,15]],"date-time":"2023-05-15T00:00:00Z","timestamp":1684108800000},"content-version":"vor","delay-in-days":0,"URL":"https:\/\/www.springernature.com\/gp\/researchers\/text-and-data-mining"}],"content-domain":{"domain":["link.springer.com"],"crossmark-restriction":false},"short-container-title":["J Ambient Intell Human Comput"],"published-print":{"date-parts":[[2023,7]]},"DOI":"10.1007\/s12652-023-04630-9","type":"journal-article","created":{"date-parts":[[2023,5,15]],"date-time":"2023-05-15T15:25:45Z","timestamp":1684164345000},"page":"9575-9591","update-policy":"https:\/\/doi.org\/10.1007\/springer_crossmark_policy","source":"Crossref","is-referenced-by-count":6,"title":["Deep reinforcement learning-based framework for constrained any-objective optimization"],"prefix":"10.1007","volume":"14","author":[{"given":"Homayoun","family":"Honari","sequence":"first","affiliation":[],"role":[{"role":"author","vocabulary":"crossref"}]},{"ORCID":"https:\/\/orcid.org\/0000-0002-1937-2328","authenticated-orcid":false,"given":"Saeed","family":"Khodaygan","sequence":"additional","affiliation":[],"role":[{"role":"author","vocabulary":"crossref"}]}],"member":"297","published-online":{"date-parts":[[2023,5,15]]},"reference":[{"key":"4630_CR1","doi-asserted-by":"publisher","first-page":"1353","DOI":"10.1016\/j.rser.2010.01.006","volume":"14","author":"A Alarcon-Rodriguez","year":"2010","unstructured":"Alarcon-Rodriguez A, Ault G, Galloway S (2010) Multi-objective planning of distributed energy resources: a review of the state-of-the-art. Renew Sustain Energy Rev 14:1353\u20131366","journal-title":"Renew Sustain Energy Rev"},{"key":"4630_CR2","doi-asserted-by":"publisher","first-page":"89497","DOI":"10.1109\/ACCESS.2020.2990567","volume":"8","author":"J Blank","year":"2020","unstructured":"Blank J, Deb K (2020) Pymoo: multi-objective optimization in python. IEEE Access 8:89497\u201389509. https:\/\/doi.org\/10.1109\/ACCESS.2020.2990567","journal-title":"IEEE Access"},{"key":"4630_CR3","doi-asserted-by":"publisher","first-page":"131","DOI":"10.1016\/J.KNOSYS.2015.04.025","volume":"85","author":"D Cai","year":"2015","unstructured":"Cai D, Yuping W (2015) A new uniform evolutionary algorithm based on decomposition and CDAS for many-objective optimization. Knowl Based Syst 85:131\u2013142. https:\/\/doi.org\/10.1016\/J.KNOSYS.2015.04.025","journal-title":"Knowl Based Syst"},{"key":"4630_CR4","doi-asserted-by":"publisher","first-page":"1272","DOI":"10.1016\/J.IFACOL.2016.07.690","volume":"49","author":"G Campos Ciro","year":"2016","unstructured":"Campos Ciro G, Dugardin F, Yalaoui F, Kelly R (2016) A NSGA-II and NSGA-III comparison for solving an open shop scheduling problem with resource constraints. IFAC-PapersOnLine 49:1272\u20131277. https:\/\/doi.org\/10.1016\/J.IFACOL.2016.07.690","journal-title":"IFAC-PapersOnLine"},{"key":"4630_CR5","doi-asserted-by":"publisher","unstructured":"Chen X, Ghadirzadeh A, Bjorkman M, Jensfelt P (2019) Meta-Learning for Multi-objective Reinforcement Learning. IEEE International Conference on Intelligent Robots and Systems 977\u2013983. https:\/\/doi.org\/10.1109\/IROS40897.2019.8968092","DOI":"10.1109\/IROS40897.2019.8968092"},{"key":"4630_CR6","doi-asserted-by":"publisher","first-page":"773","DOI":"10.1109\/TEVC.2016.2519378","volume":"20","author":"R Cheng","year":"2016","unstructured":"Cheng R, Jin Y, Olhofer M, Sendhoff B (2016) A reference vector guided evolutionary algorithm for many-objective optimization. IEEE Trans Evol Comput 20:773\u2013791. https:\/\/doi.org\/10.1109\/TEVC.2016.2519378","journal-title":"IEEE Trans Evol Comput"},{"key":"4630_CR7","doi-asserted-by":"publisher","first-page":"11","DOI":"10.1016\/J.NEUCOM.2016.10.001","volume":"222","author":"T Cheng","year":"2017","unstructured":"Cheng T, Chen M, Fleming PJ et al (2017) A novel hybrid teaching learning based multi-objective particle swarm optimization. Neurocomputing 222:11\u201325. https:\/\/doi.org\/10.1016\/J.NEUCOM.2016.10.001","journal-title":"Neurocomputing"},{"key":"4630_CR8","doi-asserted-by":"publisher","unstructured":"Coello Coello CA, Lechuga MS (2002) MOPSO: a proposal for multiple objective particle swarm optimization. Proceedings of the 2002 Congress on Evolutionary Computation, CEC 2002 2:1051\u20131056. https:\/\/doi.org\/10.1109\/CEC.2002.1004388","DOI":"10.1109\/CEC.2002.1004388"},{"key":"4630_CR9","doi-asserted-by":"publisher","first-page":"182","DOI":"10.1109\/4235.996017","volume":"6","author":"K Deb","year":"2002","unstructured":"Deb K, Pratap A, Agarwal S, Meyarivan T (2002) A fast and elitist multiobjective genetic algorithm: NSGA-II. IEEE Trans Evol Comput 6:182\u2013197. https:\/\/doi.org\/10.1109\/4235.996017","journal-title":"IEEE Trans Evol Comput"},{"key":"4630_CR10","doi-asserted-by":"publisher","first-page":"3364","DOI":"10.1016\/J.RSER.2012.02.071","volume":"16","author":"M Fadaee","year":"2012","unstructured":"Fadaee M, Radzi MAM (2012) Multi-objective optimization of a stand-alone hybrid renewable energy system by using evolutionary algorithms: a review. Renew Sustain Energy Rev 16:3364\u20133369. https:\/\/doi.org\/10.1016\/J.RSER.2012.02.071","journal-title":"Renew Sustain Energy Rev"},{"key":"4630_CR11","doi-asserted-by":"publisher","first-page":"1807082","DOI":"10.1080\/23311916.2020.1807082","volume":"7","author":"JC Ferreira","year":"2020","unstructured":"Ferreira JC, Steiner MTA, Canciglieri Junior O (2020) Multi-objective optimization for the green vehicle routing problem: A systematic literature review and future directions. Cogent Eng 7:1807082. https:\/\/doi.org\/10.1080\/23311916.2020.1807082","journal-title":"Cogent Eng"},{"key":"4630_CR12","doi-asserted-by":"publisher","unstructured":"Fujimoto S, van Hoof H, Meger D (2018) Addressing Function Approximation Error in Actor-Critic Methods. 35th International Conference on Machine Learning, ICML 2018 4:2587\u20132601. https:\/\/doi.org\/10.48550\/arxiv.1802.09477","DOI":"10.48550\/arxiv.1802.09477"},{"key":"4630_CR14","doi-asserted-by":"publisher","first-page":"286","DOI":"10.1016\/J.ASOC.2015.04.061","volume":"34","author":"YJ Gong","year":"2015","unstructured":"Gong YJ, Chen WN, Zhan ZH et al (2015) Distributed evolutionary algorithms and their models: a survey of the state-of-the-art. Appl Soft Comput 34:286\u2013300. https:\/\/doi.org\/10.1016\/J.ASOC.2015.04.061","journal-title":"Appl Soft Comput"},{"key":"4630_CR13","doi-asserted-by":"publisher","first-page":"241","DOI":"10.1016\/J.NEUCOM.2016.09.081","volume":"228","author":"D Gong","year":"2017","unstructured":"Gong D, Sun F, Sun J, Sun X (2017) Set-based many-objective optimization guided by a preferred region. Neurocomputing 228:241\u2013255. https:\/\/doi.org\/10.1016\/J.NEUCOM.2016.09.081","journal-title":"Neurocomputing"},{"key":"4630_CR15","doi-asserted-by":"publisher","first-page":"1502242","DOI":"10.1080\/23311916.2018.1502242","volume":"5","author":"N Gunantara","year":"2018","unstructured":"Gunantara N (2018) A review of multi-objective optimization: methods and its applications. Cogent Eng 5:1502242. https:\/\/doi.org\/10.1080\/23311916.2018.1502242","journal-title":"Cogent Eng"},{"key":"4630_CR16","doi-asserted-by":"publisher","unstructured":"Haarnoja T, Zhou A, Abbeel P, Levine S (2018a) Soft actor-critic: off-policy maximum entropy deep reinforcement learning with a stochastic actor. 35th International Conference on Machine Learning, ICML. 5: 2976\u20132989. https:\/\/doi.org\/10.48550\/arxiv.1801.01290","DOI":"10.48550\/arxiv.1801.01290"},{"key":"4630_CR17","doi-asserted-by":"publisher","unstructured":"Haarnoja T, Zhou A, Hartikainen K, et al (2018b) Soft actor-critic algorithms and applications. https:\/\/doi.org\/10.48550\/arxiv.1812.05905","DOI":"10.48550\/arxiv.1812.05905"},{"key":"4630_CR18","doi-asserted-by":"publisher","unstructured":"Hiroyasu T, Nakayama S, Miki M (2005) Comparison study of SPEA2+, SPEA2, and NSGA-II in diesel engine emissions and fuel economy problem. 2005 IEEE Congress on Evolutionary Computation, IEEE CEC 2005 Proceedings 1: 236\u2013242. https:\/\/doi.org\/10.1109\/CEC.2005.1554690","DOI":"10.1109\/CEC.2005.1554690"},{"key":"4630_CR19","doi-asserted-by":"publisher","first-page":"323","DOI":"10.2478\/JOHH-2018-0006","volume":"66","author":"A Hojjati","year":"2018","unstructured":"Hojjati A, Monadi M, Faridhosseini A, Mohammadi M (2018) Application and comparison of NSGA-II and MOPSO in multi-objective optimization of water resources systems. J Hydrol Hydromech 66:323\u2013329. https:\/\/doi.org\/10.2478\/JOHH-2018-0006","journal-title":"J Hydrol Hydromech"},{"key":"4630_CR20","doi-asserted-by":"publisher","first-page":"3045","DOI":"10.1109\/CEC.2016.7744174","volume":"2016","author":"H Ishibuchi","year":"2016","unstructured":"Ishibuchi H, Imada R, Setoguchi Y, Nojima Y (2016) Performance comparison of NSGA-II and NSGA-III on various many-objective test problems. 2016 IEEE congress on evolutionary computation. CEC 2016:3045\u20133052. https:\/\/doi.org\/10.1109\/CEC.2016.7744174","journal-title":"CEC"},{"key":"4630_CR21","doi-asserted-by":"publisher","unstructured":"Ishibuchi H, Masuda H, Tanigaki Y, Nojima Y (2015) Modified distance calculation in generational distance and inverted generational distance. Lecture Notes in Computer Science (including subseries Lecture Notes in Artificial Intelligence and Lecture Notes in Bioinformatics) 9019:110\u2013125. https:\/\/doi.org\/10.1007\/978-3-319-15892-1_8\/COVER","DOI":"10.1007\/978-3-319-15892-1_8\/COVER"},{"key":"4630_CR22","doi-asserted-by":"publisher","first-page":"1","DOI":"10.1016\/S0377-2217(01)00123-0","volume":"137","author":"DF Jones","year":"2002","unstructured":"Jones DF, Mirrazavi SK, Tamiz M (2002) Multi-objective meta-heuristics: an overview of the current state-of-the-art. Eur J Oper Res 137:1\u20139. https:\/\/doi.org\/10.1016\/S0377-2217(01)00123-0","journal-title":"Eur J Oper Res"},{"key":"4630_CR23","doi-asserted-by":"publisher","DOI":"10.3390\/MA14175109","author":"M Joshi","year":"2021","unstructured":"Joshi M, Ghadai RK, Madhu S et al (2021) Comparison of NSGA-II MOALO and MODA for multi-objective optimization of micro-machining processes. Materials (basel). https:\/\/doi.org\/10.3390\/MA14175109","journal-title":"Materials (basel)"},{"key":"4630_CR24","doi-asserted-by":"publisher","first-page":"485","DOI":"10.4314\/umrj.v16i1","volume":"16","author":"RTFA King","year":"2016","unstructured":"King RTFA, Deb K, Rughooputh HCS (2016) Comparison of NSGA-II and SPEA2 on the multiobjective environmental\/economic dispatch problem. Univ Mauritius Res J 16:485\u2013511. https:\/\/doi.org\/10.4314\/umrj.v16i1","journal-title":"Univ Mauritius Res J"},{"key":"4630_CR25","doi-asserted-by":"publisher","DOI":"10.1109\/TCYB.2021.3103811","author":"K Li","year":"2021","unstructured":"Li K, Zhang T, Wang R et al (2021) Deep reinforcement learning for combinatorial optimization: covering salesman problems. IEEE Trans Cybern. https:\/\/doi.org\/10.1109\/TCYB.2021.3103811","journal-title":"IEEE Trans Cybern"},{"key":"4630_CR26","doi-asserted-by":"publisher","unstructured":"Lillicrap TP, Hunt JJ, Pritzel A et al (2015) Continuous control with deep reinforcement learning. 4th International Conference on learning representations, ICLR 2016-Conference Track Proceedings. https:\/\/doi.org\/10.48550\/arxiv.1509.02971","DOI":"10.48550\/arxiv.1509.02971"},{"key":"4630_CR27","doi-asserted-by":"publisher","first-page":"306","DOI":"10.1016\/J.KNOSYS.2018.12.001","volume":"165","author":"C Liu","year":"2019","unstructured":"Liu C, Du Y (2019) A membrane algorithm based on chemical reaction optimization for many-objective optimization problems. Knowl Based Syst 165:306\u2013320. https:\/\/doi.org\/10.1016\/J.KNOSYS.2018.12.001","journal-title":"Knowl Based Syst"},{"key":"4630_CR28","doi-asserted-by":"publisher","first-page":"385","DOI":"10.1109\/TSMC.2014.2358639","volume":"45","author":"C Liu","year":"2015","unstructured":"Liu C, Xu X, Hu D (2015) Multiobjective reinforcement learning: a comprehensive overview. IEEE Trans Syst Man Cybern Syst 45:385\u2013398. https:\/\/doi.org\/10.1109\/TSMC.2014.2358639","journal-title":"IEEE Trans Syst Man Cybern Syst"},{"key":"4630_CR29","doi-asserted-by":"publisher","DOI":"10.1016\/J.ENCONMAN.2020.113324","author":"H Liu","year":"2020","unstructured":"Liu H, Li Y, Duan Z, Chen C (2020a) A review on multi-objective optimization framework in wind energy forecasting techniques and applications. Energy Convers Manag. https:\/\/doi.org\/10.1016\/J.ENCONMAN.2020.113324","journal-title":"Energy Convers Manag"},{"key":"4630_CR30","doi-asserted-by":"publisher","first-page":"106382","DOI":"10.1016\/J.ASOC.2020.106382","volume":"93","author":"Q Liu","year":"2020","unstructured":"Liu Q, Li X, Liu H, Guo Z (2020b) Multi-objective metaheuristics for discrete optimization problems: a review of the state-of-the-art. Appl Soft Comput 93:106382. https:\/\/doi.org\/10.1016\/J.ASOC.2020.106382","journal-title":"Appl Soft Comput"},{"key":"4630_CR31","doi-asserted-by":"publisher","first-page":"261","DOI":"10.1016\/J.INS.2020.03.104","volume":"537","author":"S Liu","year":"2020","unstructured":"Liu S, Yu Q, Lin Q, Tan KC (2020c) An adaptive clustering-based evolutionary algorithm for many-objective optimization problems. Inf Sci 537:261\u2013283. https:\/\/doi.org\/10.1016\/J.INS.2020.03.104","journal-title":"Inf Sci"},{"key":"4630_CR33","doi-asserted-by":"publisher","first-page":"7540","DOI":"10.1038\/nature14236","volume":"518","author":"V Mnih","year":"2015","unstructured":"Mnih V, Kavukcuoglu K, Silver D et al (2015) Human-level control through deep reinforcement learning. Nature 518:7540. https:\/\/doi.org\/10.1038\/nature14236","journal-title":"Nature"},{"key":"4630_CR32","doi-asserted-by":"publisher","unstructured":"Mnih V, Kavukcuoglu K, Silver D, et al (2013) Playing Atari with Deep Reinforcement Learning. https:\/\/doi.org\/10.48550\/arxiv.1312.5602","DOI":"10.48550\/arxiv.1312.5602"},{"key":"4630_CR35","doi-asserted-by":"publisher","first-page":"865","DOI":"10.1007\/S12652-019-01598-3\/TABLES\/12","volume":"11","author":"M Mohammadi","year":"2020","unstructured":"Mohammadi M, Khodaygan S (2020) An algorithm for numerical nonlinear optimization: fertile field algorithm (FFA). J Ambient Intell Humaniz Comput 11:865\u2013878. https:\/\/doi.org\/10.1007\/S12652-019-01598-3\/TABLES\/12","journal-title":"J Ambient Intell Humaniz Comput"},{"key":"4630_CR36","doi-asserted-by":"publisher","first-page":"103915","DOI":"10.1016\/J.ENGAPPAI.2020.103915","volume":"96","author":"TT Nguyen","year":"2020","unstructured":"Nguyen TT, Nguyen ND, Vamplew P et al (2020) A multi-objective deep reinforcement learning framework. Eng Appl Artif Intell 96:103915. https:\/\/doi.org\/10.1016\/J.ENGAPPAI.2020.103915","journal-title":"Eng Appl Artif Intell"},{"key":"4630_CR37","doi-asserted-by":"publisher","first-page":"336","DOI":"10.1016\/J.NEUCOM.2012.01.044","volume":"116","author":"B Niu","year":"2013","unstructured":"Niu B, Wang H, Wang J, Tan L (2013) Multi-objective bacterial foraging optimization. Neurocomputing 116:336\u2013345. https:\/\/doi.org\/10.1016\/J.NEUCOM.2012.01.044","journal-title":"Neurocomputing"},{"key":"4630_CR38","doi-asserted-by":"publisher","first-page":"190240","DOI":"10.1109\/ACCESS.2020.3032240","volume":"8","author":"LM Pang","year":"2020","unstructured":"Pang LM, Ishibuchi H, Shang K (2020) NSGA-II with simple modification works well on a wide variety of many-objective problems. IEEE Access 8:190240\u2013190250. https:\/\/doi.org\/10.1109\/ACCESS.2020.3032240","journal-title":"IEEE Access"},{"issue":"187","key":"4630_CR39","doi-asserted-by":"publisher","first-page":"227","DOI":"10.1613\/JAIR.4961","volume":"57","author":"S Parisi","year":"2016","unstructured":"Parisi S, Pirotta M, Restelli M (2016) Multi-objective reinforcement learning through continuous pareto manifold approximation. J Artif Intell Res 57(187):227. https:\/\/doi.org\/10.1613\/JAIR.4961","journal-title":"J Artif Intell Res"},{"key":"4630_CR40","doi-asserted-by":"publisher","unstructured":"Sallam KM, Elsayed SM, Chakrabortty RK, Ryan MJ (2020) Improved Multi-operator Differential Evolution Algorithm for Solving Unconstrained Problems. 2020 IEEE Congress on Evolutionary Computation, CEC 2020 - Conference Proceedings. https:\/\/doi.org\/10.1109\/CEC48606.2020.9185577","DOI":"10.1109\/CEC48606.2020.9185577"},{"key":"4630_CR41","doi-asserted-by":"publisher","DOI":"10.1109\/TNNLS.2021.3105937","author":"Y Shao","year":"2021","unstructured":"Shao Y, Lin JCW, Srivastava G et al (2021) Multi-Objective Neural Evolutionary Algorithm for Combinatorial Optimization Problems. IEEE Trans Neural Netw Learn Syst. https:\/\/doi.org\/10.1109\/TNNLS.2021.3105937","journal-title":"IEEE Trans Neural Netw Learn Syst"},{"key":"4630_CR42","doi-asserted-by":"publisher","unstructured":"Shinde SS, Thangavelu S, Jeyakumar G (2019a) Evolutionary computing approaches for solving multi-objective and many-objective optimization problems: A review. Proceedings - 2019a 5th International Conference on Computing, Communication Control and Automation, ICCUBEA 2019a. https:\/\/doi.org\/10.1109\/ICCUBEA47591.2019.9129081","DOI":"10.1109\/ICCUBEA47591.2019.9129081"},{"key":"4630_CR43","doi-asserted-by":"publisher","unstructured":"Shinde SS, Thangavelu S, Jeyakumar G (2019b) Evolutionary computing approaches for solving multi-objective and many-objective optimization problems: A review. Proceedings - 2019b 5th International Conference on Computing, Communication Control and Automation, ICCUBEA 2019b. https:\/\/doi.org\/10.1109\/ICCUBEA47591.2019.9129081","DOI":"10.1109\/ICCUBEA47591.2019.9129081"},{"key":"4630_CR44","doi-asserted-by":"publisher","first-page":"1841","DOI":"10.1007\/S12652-018-0777-4\/TABLES\/4","volume":"10","author":"SM Sombolestan","year":"2019","unstructured":"Sombolestan SM, Rasooli A, Khodaygan S (2019) Optimal path-planning for mobile robots to find a hidden target in an unknown environment based on machine learning. J Ambient Intell Humaniz Comput 10:1841\u20131850. https:\/\/doi.org\/10.1007\/S12652-018-0777-4\/TABLES\/4","journal-title":"J Ambient Intell Humaniz Comput"},{"key":"4630_CR45","doi-asserted-by":"publisher","unstructured":"Srinivasan S, Ramakrishnan S (2011) Evolutionary multi objective optimization for rule mining: a review. Artif Intell Rev 2011 36:3 36:205\u2013248. https:\/\/doi.org\/10.1007\/S10462-011-9212-3","DOI":"10.1007\/S10462-011-9212-3"},{"key":"4630_CR46","doi-asserted-by":"publisher","unstructured":"Sun Y, Zhang C, Gao L, Wang X (2010) Multi-objective optimization algorithms for flow shop scheduling problem: a review and prospects. Int J Adv Manuf Technol 55:723\u2013739. https:\/\/doi.org\/10.1007\/S00170-010-3094-4","DOI":"10.1007\/S00170-010-3094-4"},{"key":"4630_CR47","unstructured":"Sutton RS, Barto AG (2018) Reinforcement Learning: An Introduction, Second Edition. The MIT Press"},{"key":"4630_CR48","doi-asserted-by":"publisher","first-page":"4951","DOI":"10.1007\/S12652-020-01768-8\/FIGURES\/7","volume":"11","author":"FM Talaat","year":"2020","unstructured":"Talaat FM, Saraya MS, Saleh AI et al (2020) A load balancing and optimization strategy (LBOS) using reinforcement learning in fog computing environment. J Ambient Intell Humaniz Comput 11:4951\u20134966. https:\/\/doi.org\/10.1007\/S12652-020-01768-8\/FIGURES\/7","journal-title":"J Ambient Intell Humaniz Comput"},{"key":"4630_CR49","doi-asserted-by":"publisher","first-page":"73","DOI":"10.1109\/MCI.2017.2742868","volume":"12","author":"Y Tian","year":"2017","unstructured":"Tian Y, Cheng R, Zhang X, Jin Y (2017) PlatEMO: a MATLAB platform for evolutionary multi-objective optimization [Educational Forum]. IEEE Comput Intell Mag 12:73\u201387. https:\/\/doi.org\/10.1109\/MCI.2017.2742868","journal-title":"IEEE Comput Intell Mag"},{"key":"4630_CR51","doi-asserted-by":"publisher","unstructured":"Vamplew P, Yearwood J, Dazeley R, Berry A (2008) On the limitations of scalarisation for multi-objective reinforcement learning of pareto fronts. Lecture Notes in Computer Science (including subseries Lecture Notes in Artificial Intelligence and Lecture Notes in Bioinformatics) 5360 LNAI: 372\u2013378. https:\/\/doi.org\/10.1007\/978-3-540-89378-3_37\/COVER","DOI":"10.1007\/978-3-540-89378-3_37\/COVER"},{"key":"4630_CR50","doi-asserted-by":"publisher","unstructured":"Vamplew P, Dazeley R, Berry A, et al (2010) Empirical evaluation methods for multiobjective reinforcement learning algorithms. Mach Learn 84: 1 84:51\u201380. https:\/\/doi.org\/10.1007\/S10994-010-5232-5","DOI":"10.1007\/S10994-010-5232-5"},{"key":"4630_CR34","doi-asserted-by":"publisher","first-page":"3483","DOI":"10.5555\/2627435","volume":"15","author":"K van Moffaert","year":"2014","unstructured":"van Moffaert K, Now\u00e9 A (2014) Multi-objective reinforcement learning using sets of pareto dominating policies. J Mach Learn Res 15:3483\u20133512. https:\/\/doi.org\/10.5555\/2627435","journal-title":"J Mach Learn Res"},{"key":"4630_CR52","doi-asserted-by":"crossref","unstructured":"van Veldhuizen DA (1999) Multiobjective Evolutionary Algorithms: classifications, analyses, and new innovations. Storming Media","DOI":"10.1145\/298151.298382"},{"key":"4630_CR53","doi-asserted-by":"publisher","unstructured":"Vesikar Y, Deb K, Blank J (2019) Reference point based NSGA-III for preferred solutions. Proceedings of the 2018 IEEE Symposium Series on Computational Intelligence, SSCI 2018 1587\u20131594. https:\/\/doi.org\/10.1109\/SSCI.2018.8628819","DOI":"10.1109\/SSCI.2018.8628819"},{"key":"4630_CR54","doi-asserted-by":"publisher","first-page":"107526","DOI":"10.1016\/J.KNOSYS.2021.107526","volume":"233","author":"Q Wang","year":"2021","unstructured":"Wang Q, Tang C (2021) Deep reinforcement learning for transportation network combinatorial optimization: a survey. Knowl Based Syst 233:107526. https:\/\/doi.org\/10.1016\/J.KNOSYS.2021.107526","journal-title":"Knowl Based Syst"},{"key":"4630_CR55","doi-asserted-by":"publisher","first-page":"712","DOI":"10.1109\/TEVC.2007.892759","volume":"11","author":"Q Zhang","year":"2007","unstructured":"Zhang Q, Li H (2007) MOEA\/D: a multiobjective evolutionary algorithm based on decomposition. IEEE Trans Evol Comput 11:712\u2013731. https:\/\/doi.org\/10.1109\/TEVC.2007.892759","journal-title":"IEEE Trans Evol Comput"},{"key":"4630_CR56","doi-asserted-by":"publisher","first-page":"418","DOI":"10.1016\/J.EJOR.2021.10.032","volume":"300","author":"Y Zhang","year":"2022","unstructured":"Zhang Y, Bai R, Qu R et al (2022) A deep reinforcement learning based hyper-heuristic for combinatorial optimisation with uncertainties. Eur J Oper Res 300:418\u2013427. https:\/\/doi.org\/10.1016\/J.EJOR.2021.10.032","journal-title":"Eur J Oper Res"},{"key":"4630_CR57","doi-asserted-by":"publisher","first-page":"1030","DOI":"10.1016\/J.INS.2020.08.084","volume":"546","author":"C Zhao","year":"2021","unstructured":"Zhao C, Zhou Y, Chen Z (2021) Decomposition-based evolutionary algorithm with automatic estimation to handle many-objective optimization problem. Inf Sci 546:1030\u20131046. https:\/\/doi.org\/10.1016\/J.INS.2020.08.084","journal-title":"Inf Sci"},{"key":"4630_CR58","doi-asserted-by":"publisher","first-page":"133","DOI":"10.1016\/J.INS.2021.04.050","volume":"571","author":"J Zhou","year":"2021","unstructured":"Zhou J, Zou J, Yang S et al (2021) Niche-based and angle-based selection strategies for many-objective evolutionary optimization. Inf Sci 571:133\u2013153. https:\/\/doi.org\/10.1016\/J.INS.2021.04.050","journal-title":"Inf Sci"},{"key":"4630_CR59","doi-asserted-by":"publisher","first-page":"815","DOI":"10.1016\/J.INS.2020.08.101","volume":"546","author":"F Zou","year":"2021","unstructured":"Zou F, Yen GG, Tang L, Wang C (2021) A reinforcement learning approach for dynamic multi-objective optimization. Inf Sci 546:815\u2013834. https:\/\/doi.org\/10.1016\/J.INS.2020.08.101","journal-title":"Inf Sci"}],"container-title":["Journal of Ambient Intelligence and Humanized Computing"],"original-title":[],"language":"en","link":[{"URL":"https:\/\/link.springer.com\/content\/pdf\/10.1007\/s12652-023-04630-9.pdf","content-type":"application\/pdf","content-version":"vor","intended-application":"text-mining"},{"URL":"https:\/\/link.springer.com\/article\/10.1007\/s12652-023-04630-9\/fulltext.html","content-type":"text\/html","content-version":"vor","intended-application":"text-mining"},{"URL":"https:\/\/link.springer.com\/content\/pdf\/10.1007\/s12652-023-04630-9.pdf","content-type":"application\/pdf","content-version":"vor","intended-application":"similarity-checking"}],"deposited":{"date-parts":[[2023,6,6]],"date-time":"2023-06-06T22:07:18Z","timestamp":1686089238000},"score":1,"resource":{"primary":{"URL":"https:\/\/link.springer.com\/10.1007\/s12652-023-04630-9"}},"subtitle":[],"short-title":[],"issued":{"date-parts":[[2023,5,15]]},"references-count":59,"journal-issue":{"issue":"7","published-print":{"date-parts":[[2023,7]]}},"alternative-id":["4630"],"URL":"https:\/\/doi.org\/10.1007\/s12652-023-04630-9","relation":{},"ISSN":["1868-5137","1868-5145"],"issn-type":[{"value":"1868-5137","type":"print"},{"value":"1868-5145","type":"electronic"}],"subject":[],"published":{"date-parts":[[2023,5,15]]},"assertion":[{"value":"16 June 2022","order":1,"name":"received","label":"Received","group":{"name":"ArticleHistory","label":"Article History"}},{"value":"2 May 2023","order":2,"name":"accepted","label":"Accepted","group":{"name":"ArticleHistory","label":"Article History"}},{"value":"15 May 2023","order":3,"name":"first_online","label":"First Online","group":{"name":"ArticleHistory","label":"Article History"}}]}}