{"status":"ok","message-type":"work","message-version":"1.0.0","message":{"indexed":{"date-parts":[[2026,6,20]],"date-time":"2026-06-20T16:29:37Z","timestamp":1781972977409,"version":"3.54.5"},"reference-count":189,"publisher":"Informa UK Limited","issue":"20","license":[{"start":{"date-parts":[[2022,11,3]],"date-time":"2022-11-03T00:00:00Z","timestamp":1667433600000},"content-version":"vor","delay-in-days":0,"URL":"http:\/\/creativecommons.org\/licenses\/by-nc-nd\/4.0\/"}],"content-domain":{"domain":["www.tandfonline.com"],"crossmark-restriction":true},"short-container-title":["International Journal of Production Research"],"published-print":{"date-parts":[[2023,10,18]]},"DOI":"10.1080\/00207543.2022.2140221","type":"journal-article","created":{"date-parts":[[2022,11,3]],"date-time":"2022-11-03T13:43:45Z","timestamp":1667483025000},"page":"7151-7179","update-policy":"https:\/\/doi.org\/10.1080\/tandf_crossmark_01","source":"Crossref","is-referenced-by-count":277,"title":["A review on reinforcement learning algorithms and applications in supply chain management"],"prefix":"10.1080","volume":"61","author":[{"ORCID":"https:\/\/orcid.org\/0000-0002-5454-8894","authenticated-orcid":false,"given":"Benjamin","family":"Rolf","sequence":"first","affiliation":[{"name":"Otto-von-Guericke-University Magdeburg","place":["Magdeburg, Germany"]}],"role":[{"vocabulary":"crossref","role":"author"}]},{"ORCID":"https:\/\/orcid.org\/0000-0002-7457-6040","authenticated-orcid":false,"given":"Ilya","family":"Jackson","sequence":"additional","affiliation":[{"name":"Center for Transportation & Logistics","place":["Cambridge, USA"]}],"role":[{"vocabulary":"crossref","role":"author"}]},{"ORCID":"https:\/\/orcid.org\/0000-0001-9865-7331","authenticated-orcid":false,"given":"Marcel","family":"M\u00fcller","sequence":"additional","affiliation":[{"name":"Otto-von-Guericke-University Magdeburg","place":["Magdeburg, Germany"]}],"role":[{"vocabulary":"crossref","role":"author"}]},{"ORCID":"https:\/\/orcid.org\/0000-0003-3397-1551","authenticated-orcid":false,"given":"Sebastian","family":"Lang","sequence":"additional","affiliation":[{"name":"Fraunhofer Institute for Factory Operation and Automation IFF","place":["Magdeburg, Germany"]}],"role":[{"vocabulary":"crossref","role":"author"}]},{"ORCID":"https:\/\/orcid.org\/0000-0003-3001-9821","authenticated-orcid":false,"given":"Tobias","family":"Reggelin","sequence":"additional","affiliation":[{"name":"Otto-von-Guericke-University Magdeburg","place":["Magdeburg, Germany"]}],"role":[{"vocabulary":"crossref","role":"author"}]},{"given":"Dmitry","family":"Ivanov","sequence":"additional","affiliation":[{"name":"Berlin School of Economics and Law","place":["Berlin, Germany"]}],"role":[{"vocabulary":"crossref","role":"author"}]}],"member":"301","published-online":{"date-parts":[[2022,11,3]]},"reference":[{"key":"e_1_3_3_2_1","doi-asserted-by":"publisher","DOI":"10.1016\/j.future.2021.08.004"},{"key":"e_1_3_3_3_1","unstructured":"Achiam J. 2018. \u201cOpenAI Spinning up. GitHub Repository.\u201d Accessed 16 February 2022. https:\/\/spinningup.openai.com\/."},{"key":"e_1_3_3_4_1","doi-asserted-by":"publisher","DOI":"10.3390\/pr9101728"},{"key":"e_1_3_3_5_1","unstructured":"Adi T. N. Y. A. Iskandar H. Bae and Y. Choi. 2020. \u201cReduction of Number of Empty-Truck Trips in Inter-Terminal Transportation Using Multi-agent Q-learning.\u201d In Interconnected Supply Chains in An Era of Innovation \u2013 Proceedings of the 8th International Conference on Information Systems Logistics and Supply Chain ILS 2020 Austin TX USA 167\u2013172."},{"issue":"6","key":"e_1_3_3_6_1","first-page":"3780","article-title":"Simulation-Based Optimization of a Stochastic Supply Chain Considering Supplier Disruption: Agent-Based Modeling and Reinforcement Learning","volume":"26","author":"Aghaie A.","year":"2019","unstructured":"Aghaie, A., and M. H. Heidary. 2019. \u201cSimulation-Based Optimization of a Stochastic Supply Chain Considering Supplier Disruption: Agent-Based Modeling and Reinforcement Learning.\u201d Scientia Iranica26 (6): 3780\u20133795.","journal-title":"Scientia Iranica"},{"key":"e_1_3_3_7_1","doi-asserted-by":"publisher","DOI":"10.1007\/s10845-011-0580-y"},{"key":"e_1_3_3_8_1","doi-asserted-by":"crossref","unstructured":"Alves J. C. and G. R. Mateus. 2020. \u201cDeep Reinforcement Learning and Optimization Approach for Multi-echelon Supply Chain with Uncertain Demands.\u201d Lecture Notes in Computer Science (Including Subseries Lecture Notes in Artificial Intelligence and Lecture Notes in Bioinformatics) 12433 LNCS 584\u2013599. Berlin Heidelberg: Springer.","DOI":"10.1007\/978-3-030-59747-4_38"},{"key":"e_1_3_3_9_1","doi-asserted-by":"crossref","unstructured":"Back J.-G. C. O. Kim and I.-H. Kwon. 2006. \u201cAn Adaptive Inventory Control Model for a Supply Chain with Nonstationary Customer Demands.\u201d Lecture Notes in Computer Science (including Subseries Lecture Notes in Artificial Intelligence and Lecture Notes in Bioinformatics) 4099 LNAI 895\u2013900. Berlin Heidelberg: Springer.","DOI":"10.1007\/978-3-540-36668-3_102"},{"key":"e_1_3_3_10_1","doi-asserted-by":"publisher","DOI":"10.1016\/b978-1-55860-377-6.50013-x"},{"key":"e_1_3_3_11_1","unstructured":"Barat S. H. Khadilkar H. Meisheri V. Kulkarni V. Baniwal P. Kumar and M. Gajrani. 2019. \u201cActor Based Simulation for Closed Loop Control of Supply Chain Using Reinforcement Learning.\u201d In Proceedings of the International Joint Conference on Autonomous Agents and Multiagent Systems AAMAS Montreal QC Canada 1802\u20131804. Vol. 3."},{"key":"e_1_3_3_12_1","doi-asserted-by":"crossref","unstructured":"Barat S. P. Kumar M. Gajrani H. Khadilkar H. Meisheri V. Baniwal and V. Kulkarni. 2020. \"Reinforcement Learning of Supply Chain Control Policy Using Closed Loop Multi-agent Simulation.\u201d Lecture Notes in Computer Science (Including Subseries Lecture Notes in Artificial Intelligence and Lecture Notes in Bioinformatics) 12025 LNAI 26\u201338. Cham: Springer.","DOI":"10.1007\/978-3-030-60843-9_3"},{"key":"e_1_3_3_13_1","unstructured":"Bengio Yoshua. 2016. Deep Learning. Adaptive Computation and Machine Learning Series. London England: MIT Press."},{"key":"e_1_3_3_14_1","doi-asserted-by":"crossref","unstructured":"Bharti S. D. S. Kurian and V. M. Pillai. 2020. \u201cReinforcement Learning for Inventory Management.\u201d Lecture Notes in Mechanical Engineering 877\u2013885. Singapore: Springer.","DOI":"10.1007\/978-981-15-2696-1_85"},{"key":"e_1_3_3_15_1","doi-asserted-by":"publisher","DOI":"10.1016\/j.ejor.2021.07.016"},{"key":"e_1_3_3_16_1","unstructured":"Braunschweig Katrin Julian Eberius Maik Thiele and Wolfgang Lehner. 2012. \u201cThe State of Open Data \u2013 Limits of Current Open Data Platforms.\u201d In WWW '12: Proceedings of the 21st International Conference on World Wide Web Lyon France."},{"key":"e_1_3_3_17_1","unstructured":"Bretas A. A. Mendes S. Chalup M. Jackson R. Clement and C. Sanhueza. 2019. \u201cModelling Railway Traffic Management Through Multi-agent Systems and Reinforcement Learning.\u201d In 23rd International Congress on Modelling and Simulation \u2013 Supporting Evidence-Based Decision Making: The Role of Modelling and Simulation MODSIM 2019 Canberra Australia 291\u2013297."},{"key":"e_1_3_3_18_1","doi-asserted-by":"publisher","DOI":"10.1057\/s11369-021-00224-5"},{"key":"e_1_3_3_19_1","first-page":"31","article-title":"Effect of Reinforcement Learning on Coordination of Multiagent Systems","volume":"4208","author":"Bukkapatnam S.","year":"2000","unstructured":"Bukkapatnam, S., and G. Gao. 2000. \u201cEffect of Reinforcement Learning on Coordination of Multiagent Systems.\u201d Proceedings of SPIE \u2013 The International Society for Optical Engineering 4208: 31\u201341.","journal-title":"Proceedings of SPIE \u2013 The International Society for Optical Engineering"},{"key":"e_1_3_3_20_1","doi-asserted-by":"publisher","DOI":"10.1016\/j.tre.2021.102412"},{"key":"e_1_3_3_21_1","doi-asserted-by":"crossref","unstructured":"Cao H. H. Xi and S. F. Smith. 2003. \u201cA Reinforcement Learning Approach to Production Planning in the Fabrication\/fulfillment Manufacturing Process.\u201d In Winter Simulation Conference Proceedings New Orleans LA USA 1417\u20131423. Vol. 2.","DOI":"10.1109\/WSC.2003.1261584"},{"key":"e_1_3_3_22_1","doi-asserted-by":"publisher","DOI":"10.1016\/j.ijinfomgt.2019.03.004"},{"key":"e_1_3_3_23_1","doi-asserted-by":"publisher","DOI":"10.1016\/j.dss.2008.03.007"},{"key":"e_1_3_3_24_1","doi-asserted-by":"publisher","DOI":"10.1007\/978-3-642-40864-9_2"},{"key":"e_1_3_3_25_1","doi-asserted-by":"publisher","DOI":"10.1109\/ACCESS.2021.3062410"},{"key":"e_1_3_3_26_1","doi-asserted-by":"publisher","DOI":"10.1080\/00207543.2020.1733125"},{"key":"e_1_3_3_27_1","doi-asserted-by":"publisher","DOI":"10.1007\/978-3-642-19931-8_11"},{"key":"e_1_3_3_28_1","doi-asserted-by":"publisher","DOI":"10.1007\/s10479-022-04536-3"},{"key":"e_1_3_3_29_1","volume-title":"Supply Chain Management: Strategy, Planning, and Operation","author":"Chopra Sunil","year":"2013","unstructured":"Chopra, Sunil, and P. Meindl. 2013. Supply Chain Management: Strategy, Planning, and Operation. 5th ed. Boston: Pearson Education.","edition":"5"},{"issue":"1","key":"e_1_3_3_30_1","first-page":"53","article-title":"Managing Risk to Avoid Supply-Chain Breakdown","volume":"46","author":"Chopra Sunil","year":"2004","unstructured":"Chopra, Sunil, and Man Mohan S. Sodhi. 2004. \u201cManaging Risk to Avoid Supply-Chain Breakdown.\u201d MIT Sloan Management Review 46 (1): 53\u201361.","journal-title":"MIT Sloan Management Review"},{"key":"e_1_3_3_31_1","unstructured":"Collins John Raghu Arunachalam Norman Sadeh Joakim Eriksson Niclas Finne and Sverker Janson. 2006. \u201cThe Supply Chain Management Game for the 2007 Trading Agent Competition.\u201d http:\/\/reports-archive.adm.cs.cmu.edu\/anon\/isri2007\/CMU-ISRI-07-100.pdf."},{"key":"e_1_3_3_32_1","unstructured":"Craven T. J. and C. C. Krejci. 2016. \u201cAssessing Management Strategies for Intermediated Regional Food Supply Networks.\u201d In 2016 International Annual Conference of the American Society for Engineering Management ASEM 2016 Charlotte North Carolina USA 21\u201348."},{"key":"e_1_3_3_33_1","unstructured":"Craven T. J. and C. C. Krejci. 2017. \u201cAn Agent-Based Model of Regional Food Supply Chain Disintermediation.\u201d In ADS '17: Proceedings of the Agent-Directed Simulation Symposium Virginia Beach Virginia USA 83\u201392. Vol. 49."},{"key":"e_1_3_3_34_1","doi-asserted-by":"crossref","unstructured":"Dahlem D. and W. Harrison. 2010. \u201cCollaborative Function Approximation in Social Multiagent Systems.\u201d In Proceedings \u2013 2010 IEEE\/WIC\/ACM International Conference on Intelligent Agent Technology IAT 2010 Washington DC USA 48\u201355. Vol. 2.","DOI":"10.1109\/WI-IAT.2010.276"},{"key":"e_1_3_3_35_1","doi-asserted-by":"crossref","unstructured":"Dangelmaier W. T. Rust A. D\u00f6ring and B. Kl\u00f6pper. 2006. \u201cA Reinforcement Learning Approach for Learning Coordination Rules in Production Networks.\u201d In CIMCA 2006: International Conference on Computational Intelligence for Modelling Control and Automation Jointly with IAWTIC 2006: International Conference on Intelligent Agents Web Technologies Sydney Australia 84.","DOI":"10.1109\/CIMCA.2006.25"},{"key":"e_1_3_3_36_1","doi-asserted-by":"publisher","DOI":"10.1287\/mnsc.45.4.560"},{"key":"e_1_3_3_37_1","doi-asserted-by":"publisher","DOI":"10.1162\/neco.1997.9.2.271"},{"key":"e_1_3_3_38_1","doi-asserted-by":"publisher","DOI":"10.1016\/j.knosys.2016.03.019"},{"key":"e_1_3_3_39_1","unstructured":"DispoWeb. 2004. \u201cDispositive Supply Web Coordination with Multi-Agent Systems.\u201d https:\/\/www.aot.tu-berlin.de\/index.php?id=1764&L=1."},{"key":"e_1_3_3_40_1","doi-asserted-by":"publisher","DOI":"10.1111\/exsy.12054"},{"key":"e_1_3_3_41_1","doi-asserted-by":"publisher","DOI":"10.1080\/00207543.2021.2002969"},{"key":"e_1_3_3_42_1","doi-asserted-by":"publisher","DOI":"10.1080\/00207543.2019.1627438"},{"key":"e_1_3_3_43_1","doi-asserted-by":"publisher","DOI":"10.1080\/00207543.2020.1774679"},{"key":"e_1_3_3_44_1","doi-asserted-by":"publisher","DOI":"10.1109\/ACCESS.2019.2911620"},{"key":"e_1_3_3_45_1","doi-asserted-by":"publisher","DOI":"10.1142\/S021962201950038X"},{"key":"e_1_3_3_46_1","doi-asserted-by":"publisher","DOI":"10.1016\/j.ejor.2008.11.007"},{"key":"e_1_3_3_47_1","doi-asserted-by":"crossref","unstructured":"Filatova D. C. El-Nouty and R. V. Fedorenko. 2021. \u201cSome Theoretical Backgrounds for Reinforcement Learning Model of Supply Chain Management Under Stochastic Demand.\u201d In International Conference on Information and Digital Technologies 2021 IDT 2021 Zilina Slovakia 24\u201330.","DOI":"10.1109\/IDT52577.2021.9497569"},{"key":"e_1_3_3_48_1","doi-asserted-by":"crossref","unstructured":"Fleischmann Bernhard Herbert Meyr and Michael Wagner. 2008. \u201cAdvanced Planning.\u201d In Supply Chain Management and Advanced Planning edited by Hartmut Stadtler and Christoph Kilger 81\u2013106. Berlin Heidelberg: Springer.","DOI":"10.1007\/3-540-24814-5_5"},{"key":"e_1_3_3_49_1","doi-asserted-by":"crossref","unstructured":"Ganesan V. K. D. Sundararaj and A. P. Srinivas. 2021. \u201cAdaptive Inventory Replenishment for Dynamic Supply Chains with Uncertain Market Demand.\u201d Lecture Notes in Mechanical Engineering 325\u2013335. Singapore: Springer.","DOI":"10.1007\/978-981-15-5689-0_28"},{"key":"e_1_3_3_50_1","doi-asserted-by":"crossref","unstructured":"Gang Z. and S. Ruoying. 2006. \u201cPolicy Transition of Reinforcement Learning for An Agent Based SCM System.\u201d In 2006 IEEE International Conference on Industrial Informatics INDIN'06 Singapore 793\u2013798.","DOI":"10.1109\/INDIN.2006.275663"},{"key":"e_1_3_3_51_1","doi-asserted-by":"publisher","DOI":"10.1007\/s12599-019-00583-6"},{"key":"e_1_3_3_52_1","doi-asserted-by":"publisher","DOI":"10.1561\/2200000049"},{"key":"e_1_3_3_53_1","doi-asserted-by":"publisher","DOI":"10.1016\/j.ifacol.2015.06.224"},{"key":"e_1_3_3_54_1","doi-asserted-by":"publisher","DOI":"10.1016\/S0925-5273(00)00156-0"},{"key":"e_1_3_3_55_1","doi-asserted-by":"publisher","DOI":"10.1287\/mnsc.41.2.263"},{"key":"e_1_3_3_56_1","doi-asserted-by":"publisher","DOI":"10.1016\/j.rser.2019.06.015"},{"key":"e_1_3_3_57_1","doi-asserted-by":"crossref","unstructured":"Gu Shixiang Ethan Holly Timothy Lillicrap and Sergey Levine. May 2017. \u201cDeep Reinforcement Learning for Robotic Manipulation with Asynchronous Off-policy Updates.\u201d In 2017 IEEE International Conference on Robotics and Automation (ICRA). IEEE.","DOI":"10.1109\/ICRA.2017.7989385"},{"key":"e_1_3_3_58_1","doi-asserted-by":"publisher","DOI":"10.3390\/su13116230"},{"key":"e_1_3_3_59_1","doi-asserted-by":"crossref","unstructured":"Habib A. M. I. Khan and J. Uddin. 2017. \u201cOptimal Route Selection in Complex Multi-Stage Supply Chain Networks Using SARSA(\u03bb).\u201d In 19th International Conference on Computer and Information Technology ICCIT 2016 Dhaka Bangladesh 170\u2013175.","DOI":"10.1109\/ICCITECHN.2016.7860190"},{"key":"e_1_3_3_60_1","doi-asserted-by":"crossref","unstructured":"Hachaichi Y. Y. Chemingui and M. Affes. 2020. \u201cA Policy Gradient Based Reinforcement Learning Method for Supply Chain Management.\u201d In Proceedings of the International Conference on Advanced Systems and Emergent Technologies IC_ASET 2020 Tunis Tunisia 135\u2013140.","DOI":"10.1109\/IC_ASET49463.2020.9318258"},{"key":"e_1_3_3_61_1","volume-title":"Production and Inventory Management","author":"Hax Arnoldo C.","year":"1984","unstructured":"Hax, Arnoldo C., and Dan Candea. 1984. Production and Inventory Management. Englewood Cliffs: Prentice-Hall."},{"key":"e_1_3_3_62_1","doi-asserted-by":"crossref","unstructured":"Hirano M. H. Matsushima K. Izumi and T. Mukai. 2021. \u201cSimulation of Unintentional Collusion Caused by Auto Pricing in Supply Chain Markets.\u201d Lecture Notes in Computer Science (Including Subseries Lecture Notes in Artificial Intelligence and Lecture Notes in Bioinformatics) 12568 LNAI 352\u2013359. Cham: Springer.","DOI":"10.1007\/978-3-030-69322-0_24"},{"key":"e_1_3_3_63_1","doi-asserted-by":"publisher","DOI":"10.1080\/00207543.2021.1953180"},{"key":"e_1_3_3_64_1","doi-asserted-by":"publisher","DOI":"10.1155\/2021\/9919399"},{"key":"e_1_3_3_65_1","doi-asserted-by":"publisher","DOI":"10.1016\/B978-0-444-64235-6.50063-2"},{"key":"e_1_3_3_66_1","volume-title":"Forecasting: Principles and Practice","author":"Hyndman Rob J.","year":"2018","unstructured":"Hyndman, Rob J., and George Athanasopoulos. 2018. Forecasting: Principles and Practice. 2nd ed. Melbourne: OTexts.","edition":"2"},{"key":"e_1_3_3_67_1","unstructured":"Instacart. 2017. \u201cInstacart Market Basket Analysis.\u201d https:\/\/www.kaggle.com\/competitions\/instacart-market-basket-analysis\/overview."},{"key":"e_1_3_3_68_1","doi-asserted-by":"crossref","unstructured":"Isele David Reza Rahimi Akansel Cosgun Kaushik Subramanian and Kikuo Fujimura. May 2018. \u201cNavigating Occluded Intersections with Autonomous Vehicles Using Deep Reinforcement Learning.\u201d In 2018 IEEE International Conference on Robotics and Automation (ICRA). IEEE.","DOI":"10.1109\/ICRA.2018.8461233"},{"key":"e_1_3_3_69_1","doi-asserted-by":"publisher","DOI":"10.1080\/00207543.2019.1634850"},{"key":"e_1_3_3_70_1","doi-asserted-by":"publisher","DOI":"10.1016\/j.tre.2020.101922"},{"key":"e_1_3_3_71_1","first-page":"1","article-title":"Viable Supply Chain Model: Integrating Agility, Resilience and Sustainability Perspectives\u2013lessons From and Thinking Beyond the COVID-19 Pandemic","author":"Ivanov Dmitry.","year":"2020","unstructured":"Ivanov, Dmitry. 2020c. \u201cViable Supply Chain Model: Integrating Agility, Resilience and Sustainability Perspectives\u2013lessons From and Thinking Beyond the COVID-19 Pandemic.\u201d Annals of Operations Research 1\u201321.","journal-title":"Annals of Operations Research"},{"key":"e_1_3_3_72_1","doi-asserted-by":"publisher","DOI":"10.1109\/TEM.2021.3095193"},{"key":"e_1_3_3_73_1","doi-asserted-by":"publisher","DOI":"10.1007\/978-3-030-70490-2"},{"key":"e_1_3_3_74_1","first-page":"1","article-title":"Blackout and Supply Chains: Cross-Structural Ripple Effect, Performance, Resilience and Viability Impact Analysis","author":"Ivanov Dmitry.","year":"2022","unstructured":"Ivanov, Dmitry. 2022a. \u201cBlackout and Supply Chains: Cross-Structural Ripple Effect, Performance, Resilience and Viability Impact Analysis.\u201d Annals of Operations Research 1\u201317.","journal-title":"Annals of Operations Research"},{"key":"e_1_3_3_75_1","doi-asserted-by":"publisher","DOI":"10.1080\/00207543.2022.2118892"},{"key":"e_1_3_3_76_1","doi-asserted-by":"publisher","DOI":"10.1504\/IJISM.2022.125995"},{"key":"e_1_3_3_77_1","doi-asserted-by":"publisher","DOI":"10.1080\/09537287.2020.1768450"},{"key":"e_1_3_3_78_1","doi-asserted-by":"publisher","DOI":"10.1080\/00207543.2022.2118889"},{"key":"e_1_3_3_79_1","doi-asserted-by":"publisher","DOI":"10.1016\/j.arcontrol.2012.03.006"},{"key":"e_1_3_3_80_1","doi-asserted-by":"publisher","DOI":"10.1016\/j.tre.2022.102676"},{"key":"e_1_3_3_81_1","doi-asserted-by":"publisher","DOI":"10.1016\/j.ejor.2012.08.021"},{"key":"e_1_3_3_82_1","doi-asserted-by":"publisher","DOI":"10.1080\/00207543.2020.1798035"},{"key":"e_1_3_3_83_1","doi-asserted-by":"crossref","unstructured":"Jackson Ilya. 2020. \u201cNeuroevolutionary Approach to Metamodeling of Production-Inventory Systems with Lost-Sales and Markovian Demand.\u201d In Lecture Notes in Networks and Systems 90\u201399. Cham: Springer International Publishing.","DOI":"10.1007\/978-3-030-44610-9_10"},{"key":"e_1_3_3_84_1","doi-asserted-by":"crossref","unstructured":"Jiang C.. 2008. \u201cTwo-dimensional Learning Mechanisms for Alliance Members in Multi-agent Supply Chains.\u201d In Proceedings of the International Conference on Information Management Innovation Management and Industrial Engineering ICIII 2008 Taipei Taiwan 524\u2013527. Vol. 2.","DOI":"10.1109\/ICIII.2008.86"},{"key":"e_1_3_3_85_1","doi-asserted-by":"publisher","DOI":"10.1016\/j.eswa.2008.07.036"},{"key":"e_1_3_3_86_1","doi-asserted-by":"publisher","DOI":"10.1504\/IJMTM.2008.017729"},{"key":"e_1_3_3_87_1","doi-asserted-by":"publisher","DOI":"10.3390\/a14080240"},{"key":"e_1_3_3_88_1","unstructured":"Khan Saif M. Alexander Mann and Dahlia Peterson. 2021. The Semiconductor Supply Chain: Assessing National Competitiveness. Technical Report. Center for Security and Emerging Technology. Accessed 27 December 2021. https:\/\/cset.georgetown.edu\/publication\/the-semiconductor-supply-chain\/."},{"key":"e_1_3_3_89_1","doi-asserted-by":"publisher","DOI":"10.1504\/IJSOI.2008.021340"},{"key":"e_1_3_3_90_1","doi-asserted-by":"publisher","DOI":"10.1007\/s00170-004-2069-8"},{"key":"e_1_3_3_91_1","doi-asserted-by":"publisher","DOI":"10.1007\/s10489-007-0038-2"},{"key":"e_1_3_3_92_1","doi-asserted-by":"publisher","DOI":"10.1016\/j.eswa.2010.07.077"},{"key":"e_1_3_3_93_1","doi-asserted-by":"publisher","DOI":"10.1145\/2949662"},{"key":"e_1_3_3_94_1","doi-asserted-by":"publisher","DOI":"10.1016\/j.eswa.2007.07.002"},{"key":"e_1_3_3_95_1","doi-asserted-by":"publisher","DOI":"10.1007\/978-1-4614-5885-2_18"},{"key":"e_1_3_3_96_1","doi-asserted-by":"publisher","DOI":"10.1007\/s10257-018-0378-y"},{"key":"e_1_3_3_97_1","doi-asserted-by":"crossref","unstructured":"Li J. P. Guo and Z. Zuo. 2008. \u201cInventory Control Model for Mobile Supply Chain Management.\u201d In Proceedings \u2013 The 2008 International Conference on Embedded Software and Systems Symposia ICESS Symposia Chengdu China 459\u2013463.","DOI":"10.1109\/ICESS.Symposia.2008.85"},{"key":"e_1_3_3_98_1","doi-asserted-by":"crossref","unstructured":"Li X. W. Luo M. Yuan J. Wang J. Lu J. Wang J. Lu and J. Zeng. 2021. \u201cLearning to Optimize Industry-Scale Dynamic Pickup and Delivery Problems.\u201d In Proceedings \u2013 International Conference on Data Engineering Chania Greece 2511\u20132522","DOI":"10.1109\/ICDE51399.2021.00283"},{"key":"e_1_3_3_99_1","doi-asserted-by":"crossref","unstructured":"Li H. T. Pang Y. Wu and G. Jiang. 2014. \u201cConflict Resolution of Production-marketing Collaborative Planning Based on Multi-agent Self-adaptation Negotiation.\u201d In ICAART 2014 \u2013 Proceedings of the 6th International Conference on Agents and Artificial Intelligence Angers France 209\u2013214. Vol. 2.","DOI":"10.5220\/0004830602090214"},{"key":"e_1_3_3_100_1","doi-asserted-by":"crossref","unstructured":"Li Y. and J.-M. Zhao. 2006. \u201cApplying Adaptive Multi-agent Modeling in Agile Supply Chain Simulation.\u201d In Proceedings of the 2006 International Conference on Machine Learning and Cybernetics Dalian China 4191\u20134196.","DOI":"10.1109\/ICMLC.2006.258941"},{"key":"e_1_3_3_101_1","doi-asserted-by":"crossref","unstructured":"Li C. Y. S. H. Zhao T. W. Zhang and X. T. Wang. 2015. \u201cReinforcement Learning of Fuzzy Joint Replenishment Problem in Supply Chain.\u201d In Electronic Engineering and Information Science \u2013 Proceedings of the 2015 International Conference on Electronic Engineering and Information Science ICEEIS 2015 Harbin China 779\u2013782.","DOI":"10.1201\/b18471-185"},{"key":"e_1_3_3_102_1","doi-asserted-by":"publisher","DOI":"10.1109\/3468.844361"},{"key":"e_1_3_3_103_1","doi-asserted-by":"crossref","unstructured":"Liu C. 2020. \u201cOutsourcing Strategies for Manufacturers Facing Reputation Oriented Consumers.\u201d In Proceedings \u2013 2020 Chinese Automation Congress CAC 2020 Shanghai China 1980\u20131985.","DOI":"10.1109\/CAC51589.2020.9327763"},{"key":"e_1_3_3_104_1","doi-asserted-by":"crossref","unstructured":"Liu H. E. Howley and J. Duggan. 2011. \u201cAn Agent-Based Simulation of the Effects of Consumer Behavior on Market Price Dynamics.\u201d In Proceedings of the IASTED International Conference on Applied Simulation and Modelling ASM 2011 Crete Greece 316\u2013325.","DOI":"10.2316\/P.2011.715-003"},{"key":"e_1_3_3_105_1","doi-asserted-by":"crossref","unstructured":"Lu W. H. Tan X. Yan and C. Lv. 2021. \u201cSupply Chain Scheduling Using Double Deep Time-Series Differential Neural Network.\u201d In 5th International Workshop on Advances in Energy Science and Environment Engineering (AESEE 2021) E3S Web of Conferences 257 Xiamen China.","DOI":"10.1051\/e3sconf\/202125703038"},{"key":"e_1_3_3_106_1","doi-asserted-by":"publisher","DOI":"10.1016\/B978-0-323-91614-1.00001-0"},{"key":"e_1_3_3_107_1","doi-asserted-by":"publisher","DOI":"10.1016\/B978-0-323-91614-1.00001-0"},{"key":"e_1_3_3_108_1","doi-asserted-by":"crossref","unstructured":"Mahapatra Bandana and Srikanta Patnaik. 2018. \u201cAnt Colony Optimization.\u201d In Advances in Swarm Intelligence for Optimizing Problems in Computer Science 79\u2013114. 1st ed. Boca Raton FL: CRC Press\/Taylor & Francis Group [2019]: Chapman and Hall\/CRC.","DOI":"10.1201\/9780429445927-4"},{"key":"e_1_3_3_109_1","doi-asserted-by":"crossref","unstructured":"Makridis G. P. Mavrepis D. Kyriazis I. Polychronou and S. Kaloudis. 2020. \u201cEnhanced Food Safety Through Deep Learning for Food Recalls Prediction.\u201d Lecture Notes in Computer Science (Including Subseries Lecture Notes in Artificial Intelligence and Lecture Notes in Bioinformatics) 12323 LNAI 566\u2013580 Cham: Springer.","DOI":"10.1007\/978-3-030-61527-7_37"},{"key":"e_1_3_3_110_1","doi-asserted-by":"publisher","DOI":"10.1016\/j.cie.2019.04.032"},{"key":"e_1_3_3_111_1","doi-asserted-by":"crossref","unstructured":"Mehta D. and D. Yamparala. 2014. \u201cPolicy Gradient Reinforcement Learning for Solving Supply-chain Management Problems.\u201d In I-CARE 2014: Proceedings of the 6th IBM Collaborative Academia Research Exchange Conference (I-CARE) Bangalore India 1-4.","DOI":"10.1145\/2662117.2662129"},{"key":"e_1_3_3_112_1","doi-asserted-by":"publisher","DOI":"10.1007\/s00521-021-06129-w"},{"key":"e_1_3_3_113_1","doi-asserted-by":"crossref","unstructured":"Mezouar H. and A. El Afia. 2019. \u201cA 4-level Reference for Self-adaptive Processes Based on SCOR and Integrating Q-Learning.\u201d In BDIoT'19: Proceedings of the 4th International Conference on Big Data and Internet of Things Rabat Morocco 1\u20135.","DOI":"10.1145\/3372938.3372953"},{"key":"e_1_3_3_114_1","unstructured":"Michie Donald and R. A. Chambers. 1968. \u201cBOXES: An Experiment in Adaptive Control.\u201d In Machine Intelligence edited by E. Dale and D. Michie. Edinburgh UK: Oliver and Boyd."},{"key":"e_1_3_3_115_1","doi-asserted-by":"publisher","DOI":"10.1109\/JRPROC.1961.287775"},{"key":"e_1_3_3_116_1","unstructured":"Mnih Volodymyr Adri\u00e0 Puigdom\u00e8nech Badia Mehdi Mirza Alex Graves Tim Harley Timothy P. Lillicrap David Silver and Koray Kavukcuoglu. 2016. \u201cAsynchronous Methods for Deep Reinforcement Learning.\u201d In Proceedings of the 33rd International Conference on International Conference on Machine Learning \u2013 Volume 48 ICML'16 1928\u20131937. JMLR.org."},{"key":"e_1_3_3_117_1","unstructured":"Mnih Volodymyr Koray Kavukcuoglu David Silver Alex Graves Ioannis Antonoglou Daan Wierstra and Martin Riedmiller. 2013. \u201cPlaying Atari with Deep Reinforcement Learning.\u201d."},{"key":"e_1_3_3_118_1","doi-asserted-by":"publisher","DOI":"10.1080\/00207543.2017.1401233"},{"key":"e_1_3_3_119_1","doi-asserted-by":"publisher","DOI":"10.1007\/s11192-015-1765-5"},{"key":"e_1_3_3_120_1","doi-asserted-by":"publisher","DOI":"10.1613\/jair.613"},{"key":"e_1_3_3_121_1","doi-asserted-by":"publisher","DOI":"10.1016\/j.engappai.2014.09.004"},{"key":"e_1_3_3_122_1","doi-asserted-by":"publisher","DOI":"10.1016\/j.apenergy.2013.04.033"},{"key":"e_1_3_3_123_1","doi-asserted-by":"crossref","unstructured":"Peng Z. Y. Zhang Y. Feng T. Zhang Z. Wu and H. Su. 2019. \u201cDeep Reinforcement Learning Approach for Capacitated Supply Chain Optimization Under Demand Uncertainty.\u201d In Proceedings \u2013 2019 Chinese Automation Congress CAC 2019 Hangzhou China 3512\u20133517.","DOI":"10.1109\/CAC48633.2019.8997498"},{"key":"e_1_3_3_124_1","doi-asserted-by":"publisher","DOI":"10.3390\/pr9010102"},{"key":"e_1_3_3_125_1","doi-asserted-by":"publisher","DOI":"10.1080\/00207540110118640"},{"key":"e_1_3_3_126_1","doi-asserted-by":"publisher","DOI":"10.1186\/s12544-020-00437-3"},{"key":"e_1_3_3_127_1","doi-asserted-by":"publisher","DOI":"10.1080\/00207720310001640755"},{"key":"e_1_3_3_128_1","doi-asserted-by":"publisher","DOI":"10.1080\/07408170490278698"},{"key":"e_1_3_3_129_1","doi-asserted-by":"crossref","unstructured":"Reeder J. G. Sukthankar M. Georgiopoulos and G. Anagnostopoulos. 2008. \u201cIntelligent Trading Agents for Massively Multi-player Game Economies.\u201d In Proceedings of the 4th Artificial Intelligence and Interactive Digital Entertainment Conference AIIDE 2008 Stanford California 102\u2013107.","DOI":"10.1609\/aiide.v4i1.18680"},{"key":"e_1_3_3_130_1","doi-asserted-by":"crossref","unstructured":"Reindorp M. J. and M. C. Fu. 2011. \u201cDynamic Lead Time Promising.\u201d In IEEE SSCI 2011: Symposium Series on Computational Intelligence \u2013 ADPRL 2011: 2011 IEEE Symposium on Adaptive Dynamic Programming and Reinforcement Learning Paris France 176\u2013183.","DOI":"10.1109\/ADPRL.2011.5967376"},{"key":"e_1_3_3_131_1","unstructured":"Ren C. Y. Chai and Y. Liu. 2002. \u201cAgile Supply Chain Simulation Using Adaptive Multi-agent Modeling.\u201d In Proceedings of Asian Simulation Conference; System Simulation and Scientific Computing Shanghai China 752\u2013756. Vol. 2."},{"key":"e_1_3_3_132_1","first-page":"1","article-title":"Supply Chain Viability: Conceptualization, Measurement, and Nomological Validation","author":"Ruel Salom\u00e9e","year":"2021","unstructured":"Ruel, Salom\u00e9e, Jamal El Baz, Dmitry Ivanov, and Ajay Das. 2021. \u201cSupply Chain Viability: Conceptualization, Measurement, and Nomological Validation.\u201d Annals of Operations Research1\u201330.","journal-title":"Annals of Operations Research"},{"key":"e_1_3_3_133_1","unstructured":"Rummery Gavin Adrian and Mahesan Niranjan. 1994. \u201cOn-line Q-learning Using Connectionist Systems.\u201d."},{"key":"e_1_3_3_134_1","doi-asserted-by":"crossref","unstructured":"Saitoh F. and A. Utani. 2013. \u201cCoordinated Rule Acquisition of Decision Making on Supply Chain by Exploitation-oriented Reinforcement Learning.\u201d Lecture Notes in Computer Science (including Subseries Lecture Notes in Artificial Intelligence and Lecture Notes in Bioinformatics) 8131 LNCS 537\u2013544. Berlin Heidelberg: Springer.","DOI":"10.1007\/978-3-642-40728-4_67"},{"key":"e_1_3_3_135_1","doi-asserted-by":"crossref","unstructured":"Sakurai Yoshitaka Kouhei Takada Takashi Kawabe and Setsuo Tsuruta. 2010. \u201cA Method to Control Parameters of Evolutionary Algorithms by Using Reinforcement Learning.\u201d In 2010 Sixth International Conference on Signal-image Technology and Internet Based Systems 74\u201379. IEEE.","DOI":"10.1109\/SITIS.2010.22"},{"key":"e_1_3_3_136_1","doi-asserted-by":"publisher","DOI":"10.1007\/978-3-658-33480-2_1"},{"key":"e_1_3_3_137_1","unstructured":"Schulman John Filip Wolski Prafulla Dhariwal Alec Radford and Oleg Klimov. 2017. \u201cProximal Policy Optimization Algorithms.\u201d."},{"key":"e_1_3_3_138_1","doi-asserted-by":"publisher","DOI":"10.1007\/978-3-030-78288-7_10"},{"key":"e_1_3_3_139_1","volume-title":"The New (ab)normal: Reshaping Business and Supply Chain Strategy Beyond Covid-19","author":"Sheffi Yosef.","year":"2020","unstructured":"Sheffi, Yosef. 2020. The New (ab)normal: Reshaping Business and Supply Chain Strategy Beyond Covid-19. Cambridge (Mass.): MIT CTL Media. OCLC: 1258319911."},{"key":"e_1_3_3_140_1","volume-title":"A Shot in the Arm: How Science, Engineering, and Supply Chains Converged to Vaccinate the World","author":"Sheffi Yossi.","year":"2021","unstructured":"Sheffi, Yossi. 2021. A Shot in the Arm: How Science, Engineering, and Supply Chains Converged to Vaccinate the World. Cambridge: MIT CTL Media."},{"key":"e_1_3_3_141_1","doi-asserted-by":"crossref","unstructured":"Sheremetov L. and L. Rocha-Mier. 2004. \u201cCollective Intelligence As a Framework for Supply Chain Management.\u201d In 2004 2nd International IEEE Conference 'Intelligent Systems' \u2013 Proceedings Varna Bulgaria 417\u2013422. Vol. 2.","DOI":"10.1109\/IS.2004.1344783"},{"key":"e_1_3_3_142_1","doi-asserted-by":"publisher","DOI":"10.3233\/HSM-2008-27104"},{"key":"e_1_3_3_143_1","doi-asserted-by":"crossref","unstructured":"Sheremetov L. L. Rocha-Mier and I. Batyrshin. 2005. \u201cTowards a Multi-agent Dynamic Supply Chain Simulator for Analysis and Decision Support.\u201d In Annual Conference of the North American Fuzzy Information Processing Society \u2013 NAFIPS Detroit Michigan USA 263\u2013268.","DOI":"10.1109\/NAFIPS.2005.1548545"},{"key":"e_1_3_3_144_1","doi-asserted-by":"publisher","DOI":"10.3390\/inventions4010008"},{"key":"e_1_3_3_145_1","unstructured":"Silver David Thomas Hubert Julian Schrittwieser Ioannis Antonoglou Matthew Lai Arthur Guez and Marc Lanctot et\u00a0al. 2017. \u201cMastering Chess and Shogi by Self-Play with a General Reinforcement Learning Algorithm.\u201d."},{"key":"e_1_3_3_146_1","doi-asserted-by":"crossref","unstructured":"Simsek B. S. Albayrak and A. Korth. 2004. \u201cReinforcement Learning for Procurement Agents of the Factory of the Future.\u201d In Proceedings of the 2004 Congress on Evolutionary Computation CEC2004 Portland Oregon USA 1331\u20131337. Vol. 2.","DOI":"10.1109\/CEC.2004.1331051"},{"key":"e_1_3_3_147_1","doi-asserted-by":"crossref","unstructured":"Singi S. S. Gopal S. Auti and R. Chaurasia. 2020. \u201cReinforcement Learning for Inventory Management.\u201d In Proceedings of International Conference on Intelligent Manufacturing and Automation Lecture Notes in Mechanical Engineering 317\u2013326. Singapore: Springer.","DOI":"10.1007\/978-981-15-4485-9_33"},{"key":"e_1_3_3_148_1","doi-asserted-by":"publisher","DOI":"10.1016\/j.jbusres.2019.07.039"},{"issue":"3","key":"e_1_3_3_149_1","first-page":"40","article-title":"Teaching Takes Off","volume":"35","author":"Sterman John D.","year":"1992","unstructured":"Sterman, John D. 1992. \u201cTeaching Takes Off.\u201d OR\/MS Today 35 (3): 40\u201344.","journal-title":"OR\/MS Today"},{"key":"e_1_3_3_150_1","doi-asserted-by":"publisher","DOI":"10.1080\/10429247.2010.11431878"},{"key":"e_1_3_3_151_1","doi-asserted-by":"crossref","unstructured":"Sun R. and G. Zhao. 2012. \u201cAnalyses About Efficiency of Reinforcement Learning to Supply Chain Ordering Management.\u201d In IEEE International Conference on Industrial Informatics (INDIN) Beijing China 124\u2013127.","DOI":"10.1109\/INDIN.2012.6301163"},{"key":"e_1_3_3_152_1","doi-asserted-by":"crossref","unstructured":"Sun R. G. Zhao C. Li and S. Tatsumi. 2006. \u201cThe Improvement on Reinforcement Learning for SCM by the Agent Policy Mapping.\u201d In IECON Proceedings (Industrial Electronics Conference) Paris France 3585\u20133590.","DOI":"10.1109\/IECON.2006.347360"},{"key":"e_1_3_3_153_1","doi-asserted-by":"crossref","unstructured":"Sun R. G. Zhao and C. Yin. 2010. \u201cA Multi-agent Coordination of a Supply Chain Ordering Management with Multiple Members Using Reinforcement Learning.\u201d In IEEE International Conference on Industrial Informatics (INDIN) Osaka Japan 612\u2013616.","DOI":"10.1109\/INDIN.2010.5549671"},{"key":"e_1_3_3_154_1","unstructured":"Sutton Richard S. and Andrew G. Barto. 2018. Reinforcement Learning: An Introduction. 2nd ed. Adaptive Computation and Machine Learning Series. Cambridge MA: The MIT Press."},{"key":"e_1_3_3_155_1","unstructured":"Sutton Richard S. David McAllester Satinder Singh and Yishay Mansour. 1999. \u201cPolicy Gradient Methods for Reinforcement Learning with Function Approximation.\u201d In Proceedings of the 12th International Conference on Neural Information Processing Systems NIPS'99 1057\u20131063. Cambridge MA USA: MIT Press."},{"key":"e_1_3_3_156_1","doi-asserted-by":"crossref","unstructured":"Tae I. K. R. U. Bilsel and S. R. T. Kumara. 2007. \u201cA Reinforcement Learning Approach for Dynamic Supplier Selection.\u201d In 2007 IEEE International Conference on Service Operations and Logistics and Informatics SOLI Philadelphia Pennsylvania USA 1-6.","DOI":"10.1109\/SOLI.2007.4383959"},{"key":"e_1_3_3_157_1","unstructured":"Tang K. and S. R. T. Kumara. 2005. \u201cCooperation in a Multi-Stage Game for Modeling Distributed Task Delegation in a Supply Chain Procurement Problem.\u201d In Proceedings of the 2005 IEEE Conference on Automation Science and Engineering IEEE-CASE 2005 Edmonton Alberta Canada 93\u201398."},{"key":"e_1_3_3_158_1","doi-asserted-by":"crossref","unstructured":"Tariq Afridi M. S. Nieto-Isaza H. Ehm T. Ponsignon and A. Hamed. 2020. \u201cA Deep Reinforcement Learning Approach for Optimal Replenishment Policy in A Vendor Managed Inventory Setting for Semiconductors.\u201d In Proceedings \u2013 Winter Simulation Conference Orlando Florida USA 1753\u20131764.","DOI":"10.1109\/WSC48552.2020.9384048"},{"key":"e_1_3_3_159_1","doi-asserted-by":"publisher","DOI":"10.1037\/h0092987"},{"key":"e_1_3_3_160_1","unstructured":"UNO. 2008. \u201cInternational Standard Industrial Classification of All Economic Activities (ISIC) Rev.4.\u201d."},{"key":"e_1_3_3_161_1","doi-asserted-by":"publisher","DOI":"10.1142\/S0129065709002063"},{"key":"e_1_3_3_162_1","doi-asserted-by":"publisher","DOI":"10.1007\/s11192-009-0146-3"},{"key":"e_1_3_3_163_1","doi-asserted-by":"crossref","unstructured":"Van Tongeren T. U. Kaymak D. Naso and E. Van Asperen. 2007. \u201cQ-learning in a Competitive Supply Chain.\u201d In Conference Proceedings \u2013 IEEE International Conference on Systems Man and Cybernetics Montreal Quebec Canada 1211\u20131216.","DOI":"10.1109\/ICSMC.2007.4414132"},{"key":"e_1_3_3_164_1","doi-asserted-by":"publisher","DOI":"10.1016\/j.compind.2020.103239"},{"key":"e_1_3_3_165_1","unstructured":"Vinitsky Eugene Nathan Lichtle Kanaad Parvate and Alexandre Bayen. 2020. \u201cOptimizing Mixed Autonomy Traffic Flow with Decentralized Autonomous Vehicles and Multi-agent RL.\u201d."},{"key":"e_1_3_3_166_1","doi-asserted-by":"publisher","DOI":"10.1016\/j.ejor.2015.07.022"},{"key":"e_1_3_3_167_1","doi-asserted-by":"publisher","DOI":"10.1016\/j.cie.2021.107312"},{"key":"e_1_3_3_168_1","doi-asserted-by":"publisher","DOI":"10.1080\/00207543.2021.2020927"},{"key":"e_1_3_3_169_1","unstructured":"Ware Mark and Michael Mabe. 2015. The STM Report: An Overview of Scientific and Scholarly Journal Publishing. Technical Report. International Association of Scientific Technical and Medical Publishers."},{"key":"e_1_3_3_170_1","doi-asserted-by":"publisher","DOI":"10.1007\/BF00992698"},{"key":"e_1_3_3_171_1","doi-asserted-by":"publisher","DOI":"10.1186\/1741-7015-11-20"},{"key":"e_1_3_3_172_1","doi-asserted-by":"publisher","DOI":"10.1016\/j.energy.2020.118597"},{"key":"e_1_3_3_173_1","doi-asserted-by":"crossref","unstructured":"Xu J. J. Zhang and Y. Liu. 2009. \u201cAn Adaptive Inventory Control for a Supply Chain.\u201d In 2009 Chinese Control and Decision Conference CCDC 2009 Guilin China 5714\u20135719.","DOI":"10.1109\/CCDC.2009.5195218"},{"key":"e_1_3_3_174_1","doi-asserted-by":"crossref","unstructured":"Yang S. Y. Ogawa K. Ikeuchi Y. Akiyama and R. Shibasaki. 2019. \u201cFirm-level Behavior Control After Large-Scale Urban Flooding Using Multi-agent Deep Reinforcement Learning.\u201d In Proceedings of the 2nd ACM SIGSPATIAL International Workshop on GeoSpatial Simulation GeoSim 2019 Chicago Illinois USA 24\u201327.","DOI":"10.1145\/3356470.3365529"},{"key":"e_1_3_3_175_1","doi-asserted-by":"crossref","unstructured":"Yang S. and J. Zhang. 2015. \u201cAdaptive Inventory Control and Bullwhip Effect Analysis for Supply Chains with Non-Stationary Demand.\u201d In Proceedings of the 2015 27th Chinese Control and Decision Conference CCDC 2015 Qingdao China 3903\u20133908.","DOI":"10.1109\/CCDC.2015.7162605"},{"key":"e_1_3_3_176_1","doi-asserted-by":"publisher","DOI":"10.1007\/s00170-012-4195-z"},{"key":"e_1_3_3_177_1","doi-asserted-by":"publisher","DOI":"10.1080\/17517570701275390"},{"key":"e_1_3_3_178_1","doi-asserted-by":"publisher","DOI":"10.1016\/B978-0-323-91614-1.00005-8"},{"key":"e_1_3_3_179_1","unstructured":"Zhang Daniel Saurabh Mishra Erik Brynjolfsson John Etchemendy Deep Ganguli Barbara Grosz and Terah Lyons et\u00a0al. 2021. \u201cThe AI Index 2021 Annual Report.\u201d."},{"key":"e_1_3_3_180_1","doi-asserted-by":"crossref","unstructured":"Zhang K. J. Xu and J. Zhang. 2013. \u201cA New Adaptive Inventory Control Method for Supply Chains with Non-Stationary Demand.\u201d In 2013 25th Chinese Control and Decision Conference CCDC 2013 Guiyang China 1034\u20131038.","DOI":"10.1109\/CCDC.2013.6561076"},{"key":"e_1_3_3_181_1","unstructured":"Zhang L. Y. Yin L. Feng and H. Fan. 2019. \u201cUnsalable Risk Prediction of Fruit and Vegetable Agricultural Products Based on Markov Decision Process.\u201d In Proceedings of the 8th International Conference on Logistics and Systems Engineering 2018 Changsha City China 206\u2013217."},{"key":"e_1_3_3_182_1","doi-asserted-by":"crossref","unstructured":"Zhanguo X. 2008. \u201cResearch on Refining the Distributed Supply Chain Procurement Plans Based on CRL.\u201d In Proceedings \u2013 International Symposium on Information Processing ISIP 2008 and International Pacific Workshop on Web Mining and Web-Based Application WMWA 2008 Moscow Russia 119\u2013122.","DOI":"10.1109\/ISIP.2008.53"},{"key":"e_1_3_3_183_1","doi-asserted-by":"crossref","unstructured":"Zhao Y. E. Hemberg N. Derbinsky G. Mata and U.-M. O'Reilly. 2021a. \u201cSimulating a Logistics Enterprise Using An Asymmetrical Wargame Simulation with Soar Reinforcement Learning and Coevolutionary Algorithms.\u201d In GECCO 2021 Companion \u2013 Proceedings of the 2021 Genetic and Evolutionary Computation Conference Companion Lille France 1907\u20131915.","DOI":"10.1145\/3449726.3463172"},{"issue":"4","key":"e_1_3_3_184_1","first-page":"667","article-title":"Coordinating Supply Chain of Stackelberg Game Model Based on Evolutionary Game with GA-RL","volume":"30","author":"Zhao H.-P.","year":"2010","unstructured":"Zhao, H.-P., J.-D. Jiang, and Y.-C. Feng. 2010. \u201cCoordinating Supply Chain of Stackelberg Game Model Based on Evolutionary Game with GA-RL.\u201d Xitong Gongcheng Lilun yu Shijian\/System Engineering Theory and Practice 30 (4): 667\u2013672.","journal-title":"Xitong Gongcheng Lilun yu Shijian\/System Engineering Theory and Practice"},{"key":"e_1_3_3_185_1","unstructured":"Zhao Long and Zemin Liu. 1996. \u201cA Genetic Algorithm for Reinforcement Learning.\u201d In Proceedings of International Conference on Neural Networks (ICNN'96) Washington DC USA. 1056-1060."},{"key":"e_1_3_3_186_1","doi-asserted-by":"publisher","DOI":"10.1016\/j.cie.2020.107082"},{"key":"e_1_3_3_187_1","doi-asserted-by":"crossref","unstructured":"Zhou J. M. Purvis and Y. Muhammad. 2016. \u201cA Combined Modelling Approach for Multi-Agent Collaborative Planning in Global Supply Chains.\u201d In Proceedings \u2013 2015 8th International Symposium on Computational Intelligence and Design ISCID 2015 Hangzhou China 592\u2013597. Vol. 1.","DOI":"10.1109\/ISCID.2015.13"},{"key":"e_1_3_3_188_1","doi-asserted-by":"crossref","unstructured":"Zhou J. and X. Zhou. 2019. \u201cMulti-Echelon Inventory Optimizations for Divergent Networks by Combining Deep Reinforcement Learning and Heuristics Improvement.\u201d In Proceedings \u2013 2019 12th International Symposium on Computational Intelligence and Design ISCID 2019 Hangzhou China 69\u201373. Vol. 1.","DOI":"10.1109\/ISCID.2019.00023"},{"key":"e_1_3_3_189_1","doi-asserted-by":"publisher","DOI":"10.1016\/j.trb.2021.06.014"},{"key":"e_1_3_3_190_1","doi-asserted-by":"publisher","DOI":"10.3390\/app11062726"}],"container-title":["International Journal of Production Research"],"original-title":[],"language":"en","link":[{"URL":"https:\/\/www.tandfonline.com\/doi\/pdf\/10.1080\/00207543.2022.2140221","content-type":"unspecified","content-version":"vor","intended-application":"similarity-checking"}],"deposited":{"date-parts":[[2025,9,5]],"date-time":"2025-09-05T00:08:54Z","timestamp":1757030934000},"score":1,"resource":{"primary":{"URL":"https:\/\/www.tandfonline.com\/doi\/full\/10.1080\/00207543.2022.2140221"}},"subtitle":[],"short-title":[],"issued":{"date-parts":[[2022,11,3]]},"references-count":189,"journal-issue":{"issue":"20","published-print":{"date-parts":[[2023,10,18]]}},"alternative-id":["10.1080\/00207543.2022.2140221"],"URL":"https:\/\/doi.org\/10.1080\/00207543.2022.2140221","relation":{},"ISSN":["0020-7543","1366-588X"],"issn-type":[{"value":"0020-7543","type":"print"},{"value":"1366-588X","type":"electronic"}],"subject":[],"published":{"date-parts":[[2022,11,3]]},"assertion":[{"value":"The publishing and review policy for this title is described in its Aims & Scope.","order":1,"name":"peerreview_statement","label":"Peer Review Statement"},{"value":"http:\/\/www.tandfonline.com\/action\/journalInformation?show=aimsScope&journalCode=tprs20","URL":"http:\/\/www.tandfonline.com\/action\/journalInformation?show=aimsScope&journalCode=tprs20","order":2,"name":"aims_and_scope_url","label":"Aim & Scope"},{"value":"2022-06-17","order":0,"name":"received","label":"Received","group":{"name":"publication_history","label":"Publication History"}},{"value":"2022-10-13","order":2,"name":"accepted","label":"Accepted","group":{"name":"publication_history","label":"Publication History"}},{"value":"2022-11-03","order":3,"name":"published","label":"Published","group":{"name":"publication_history","label":"Publication History"}}]}}