{"status":"ok","message-type":"work","message-version":"1.0.0","message":{"indexed":{"date-parts":[[2026,1,2]],"date-time":"2026-01-02T07:11:24Z","timestamp":1767337884235,"version":"3.40.3"},"publisher-location":"Cham","reference-count":42,"publisher":"Springer Nature Switzerland","isbn-type":[{"type":"print","value":"9783031824807"},{"type":"electronic","value":"9783031824814"}],"license":[{"start":{"date-parts":[[2025,1,1]],"date-time":"2025-01-01T00:00:00Z","timestamp":1735689600000},"content-version":"tdm","delay-in-days":0,"URL":"https:\/\/www.springernature.com\/gp\/researchers\/text-and-data-mining"},{"start":{"date-parts":[[2025,1,1]],"date-time":"2025-01-01T00:00:00Z","timestamp":1735689600000},"content-version":"vor","delay-in-days":0,"URL":"https:\/\/www.springernature.com\/gp\/researchers\/text-and-data-mining"}],"content-domain":{"domain":["link.springer.com"],"crossmark-restriction":false},"short-container-title":[],"published-print":{"date-parts":[[2025]]},"DOI":"10.1007\/978-3-031-82481-4_22","type":"book-chapter","created":{"date-parts":[[2025,3,3]],"date-time":"2025-03-03T15:45:35Z","timestamp":1741016735000},"page":"317-332","update-policy":"https:\/\/doi.org\/10.1007\/springer_crossmark_policy","source":"Crossref","is-referenced-by-count":1,"title":["Generative Reward Machine for\u00a0Reinforcement Learning for\u00a0Physical Internet Distribution Centre"],"prefix":"10.1007","author":[{"given":"Saeid","family":"Rezaei","sequence":"first","affiliation":[],"role":[{"role":"author","vocabulary":"crossref"}]},{"ORCID":"https:\/\/orcid.org\/0000-0002-2662-6875","authenticated-orcid":false,"given":"Kenneth","family":"N. Brown","sequence":"additional","affiliation":[],"role":[{"role":"author","vocabulary":"crossref"}]}],"member":"297","published-online":{"date-parts":[[2025,3,4]]},"reference":[{"key":"22_CR1","unstructured":"Alliance for Logistics Innovation through Collaboration in Europe (ALICE). Roadmap to the Physical Internet - executive version. http:\/\/etp-alice.eu. Accessed 30 Mar 2024"},{"key":"22_CR2","unstructured":"Bahrami-Bidoni Z., Montreuil B.: Predictive demand modeling for new services in hyperconnected urban parcel logistics. In: 7th International Physical Internet Conference (2021)"},{"key":"22_CR3","unstructured":"Ban S., DAN A., Guinet F., Portanguen J., Srang S., Lauras M.: Assessing the potentialities of physical internet for developing countries last mile deliveries. In: 7th International Physical Internet Conference (2021)"},{"key":"22_CR4","doi-asserted-by":"crossref","unstructured":"Belsare, S., Badilla, E. D., and Dehghanimohammadabadi, M.: Reinforcement Learning with Discrete Event Simulation: The Premise, Reality, and Promise. In: 2022 Winter Simulation Conference (WSC), (pp. 2724\u20132735). IEEE","DOI":"10.1109\/WSC57314.2022.10015503"},{"key":"22_CR5","unstructured":"Bisschop, J. (2006). AIMMS optimization modeling. Lulu.com"},{"key":"22_CR6","unstructured":"Boerger J., Montreuil B.: Data-driven analytics-based capacity management for hyperconnected third-party logistics providers. In: 7th International Physical Internet Conference (2020)"},{"key":"22_CR7","unstructured":"Campos M., Derhami S., McGinnis L., Montreuil B., Barenji A.V.: Digital twin design requirements for durable goods distribution in physical internet. In: 7th International Physical Internet Conference (2021)"},{"key":"22_CR8","unstructured":"Cipres D., Capella A., Polo L., Ramon J.L.: GPICS a framework to create a digital twin for the Physical Internet. In: 7th International Physical Internet Conference (2021)D"},{"key":"22_CR9","doi-asserted-by":"crossref","unstructured":"Devanga, A., Badilla, E. D., Dehghanimohammadabadi, M.: Applied Reinforcement Learning for Decision Making in Industrial Simulation Environments. In: 2022 Winter Simulation Conference (WSC), (pp. 2819\u20132829). IEEE","DOI":"10.1109\/WSC57314.2022.10015282"},{"key":"22_CR10","unstructured":"Dulac-Arnold, G., et al.: An empirical investigation of the challenges of real-world reinforcement learning. arXiv preprint arXiv:2003.11881. (2020)"},{"key":"22_CR11","unstructured":"Garnier C., Simon E., Costa J.P., Pitsikas L., Lacalle I., Palau C.E.: Port digitalization through an activities scenario model as a first step for a digital twin of port. In: 7th International Physical Internet Conference (2021)"},{"key":"22_CR12","unstructured":"Gosch L., Prandtstetter M., Doerner K.F.: On modelling and solving green collaborative tactical transportation planning. In: 7th International Physical Internet Conference (2021)"},{"key":"22_CR13","unstructured":"Hubbs, C.D., Perez, H.D., Sarwar,O., Sahinidis, N.V., Grossmann, I.E., Wassick, J.M.: Or-gym: A reinforcement learning library for operations research problems. arXiv preprint arXiv:2008.06319 (2020)"},{"key":"22_CR14","doi-asserted-by":"publisher","first-page":"173","DOI":"10.1613\/jair.1.12440","volume":"73","author":"RT Icarte","year":"2022","unstructured":"Icarte, R.T., Klassen, T.Q., Valenzano, R., McIlraith, S.A.: Reward machines: exploiting reward function structure in reinforcement learning. J. Artif. Intell. Res. 73, 173\u2013208 (2022)","journal-title":"J. Artif. Intell. Res."},{"key":"22_CR15","unstructured":"International Transport Forum (2019) ITF Transport Outlook 2019. OECD Publishing. https:\/\/play.google.com\/store\/books\/details?id=p8SZDwAAQBAJ"},{"key":"22_CR16","unstructured":"Kaboudvand S., Montreuil B.: Dynamic containerized consolidation in physical internet enabled parcel logistics. In: 7th International Physical Internet Conference (2021)"},{"key":"22_CR17","unstructured":"Kaboudvand S., Campos, M., Montreuil, B.: Enabling scientific assessment of large scale hyperconnected urban parcel logistics: agent-based simulator design. In: Proceedings of 2021 IISE Annual Conference, Virtual, May 22\u201325 (2021)"},{"key":"22_CR18","unstructured":"Kim N., Montreuil B., Klibi W.: Modularization of delivery and transportation. In: 7th International Physical Internet Conference (2021)"},{"key":"22_CR19","doi-asserted-by":"crossref","unstructured":"Lang, L., Chwif, L., Pereira, W.: Decision-making impacts of originating picking waves process for a distribution center using discrete-event simulation. In: 2022 Winter Simulation Conference (WSC), (pp. 1509\u20131520). IEEE (2022)","DOI":"10.1109\/WSC57314.2022.10015343"},{"key":"22_CR20","doi-asserted-by":"crossref","unstructured":"Liu, K., et al.: Automated feature selection, A reinforcement learning perspective. IEEE Transactions on Knowledge and Data Engineering (2021)","DOI":"10.1109\/TKDE.2021.3115477"},{"key":"22_CR21","unstructured":"Lischke A., Kirsten S., Bremeersch T., Jessberger C.: Impact of high capacity vehicles on the future developments in the logistics sector. In: 7th International Physical Internet Conference (2021)"},{"key":"22_CR22","doi-asserted-by":"publisher","DOI":"10.1016\/j.eswa.2023.119883","volume":"224","author":"M Mussi","year":"2023","unstructured":"Mussi, M., Lombarda, D., Metelli, A.M., Trov\u00f2, F., Restelli, M.: ARLO: a framework for automated reinforcement learning. Expert Syst. Appl. 224, 119883 (2023)","journal-title":"Expert Syst. Appl."},{"key":"22_CR23","unstructured":"Muthukrishnan P., Faug\u00e8re L., Montreuil B.: Potential access hub network design optimization in hyperconnected urban logistics. In: 7th International Physical Internet Conference (2021)"},{"key":"22_CR24","unstructured":"Pan X., Pothen A., Boerger J., Wang H., Montreuil B.: Enhancing logistics demand prediction accuracy through client\u2013vendor hyperconnected data ensembles. In: 7th International Physical Internet Conference (2021)"},{"key":"22_CR25","doi-asserted-by":"publisher","first-page":"517","DOI":"10.1613\/jair.1.13596","volume":"74","author":"J Parker-Holder","year":"2022","unstructured":"Parker-Holder, J., et al.: Automated reinforcement learning (autorl): A survey and open problems. J. Artif. Intell. Res. 74, 517\u2013568 (2022)","journal-title":"J. Artif. Intell. Res."},{"key":"22_CR26","unstructured":"Patrick B., Farzaneh D., Taha F., Chibuzor U.: Improving demand prediction and reducing out-of-stock application of advanced data analytics in retail supply chains. In: 7th International Physical Internet Conference (2021)"},{"issue":"3","key":"22_CR27","doi-asserted-by":"publisher","first-page":"553","DOI":"10.1287\/ijoc.2016.0696","volume":"28","author":"K Postek","year":"2016","unstructured":"Postek, K., Hertog, D.D.: Multistage adjustable robust mixed-integer optimization via iterative splitting of the uncertainty set. INFORMS J. Comput. 28(3), 553\u2013574 (2016)","journal-title":"INFORMS J. Comput."},{"key":"22_CR28","doi-asserted-by":"crossref","unstructured":"Powell, W.B.: Reinforcement Learning and Stochastic Optimization: A Unified Framework for Sequential Decisions. Wiley and Sons (2022)","DOI":"10.1002\/9781119815068"},{"key":"22_CR29","volume-title":"Markov decision processes: discrete stochastic dynamic programming","author":"ML Puterman","year":"2014","unstructured":"Puterman, M.L.: Markov decision processes: discrete stochastic dynamic programming. John Wiley and Sons (2014)"},{"key":"22_CR30","unstructured":"Quak H., Kempen E.V., Vries J.D.: Towards a self-organizing logistics system: identifying the value of SOLs for different stakeholders and transition-phases. In: 7th International Physical Internet Conference, (2021)"},{"key":"22_CR31","doi-asserted-by":"crossref","unstructured":"Rezaei S., Toffano F., Brown K.N.: Gym-DC: a distribution centre reinforcement learning environment. In: 2nd International Workshop on Industrial Machine Learning (2022)","DOI":"10.1007\/978-3-031-37742-6_53"},{"key":"22_CR32","unstructured":"Shaikh S.J., Montreuil B., Moussa Hodjat-Shamami M., Ashish Gupta A.: Introducing services and protocols for inter-hub transportation in the physical internet. In: 7th International Physical Internet Conference (2021)"},{"key":"22_CR33","doi-asserted-by":"crossref","unstructured":"Silver, D., et al.: Mastering the game of Go with deep neural networks and tree search. Nature 529(7587), 484\u2013489 (2016)","DOI":"10.1038\/nature16961"},{"key":"22_CR34","unstructured":"Sutton, R.S., Barto, A.G.: Reinforcement learning: An introduction. MIT press (2018)"},{"key":"22_CR35","doi-asserted-by":"crossref","unstructured":"Xie, S., Zhang, T., Rose, O.: Real-time scheduling based on simulation and deep reinforcement learning with featured action space. In: 2022 Winter Simulation Conference (WSC) (pp. 1731-1739). IEEE (2022)","DOI":"10.1109\/WSC57314.2022.10015423"},{"key":"22_CR36","doi-asserted-by":"publisher","DOI":"10.1016\/j.tre.2022.102712","volume":"162","author":"Y Yan","year":"2022","unstructured":"Yan, Y., Chow, A.H., Ho, C.P., Kuo, Y.H., Wu, Q., Ying, C.: Reinforcement learning for logistics and supply chain management: Methodologies, state of the art, and future opportunities. Transport. Res. Part E: Logist. Transport. Rev. 162, 102712 (2022)","journal-title":"Transport. Res. Part E: Logist. Transport. Rev."},{"key":"22_CR37","unstructured":"Zavitsas K., Kouloumbis M.: Towards PI implementation: interoperability and robustness of pi layers functionality illustrated through multi-context implementation. In: 7th International Physical Internet Conference (2021)"},{"key":"22_CR38","unstructured":"Zhang J., Thompson R.G. (2021): Optimising Product Swaps in Urban Retail Networks. In: 7th International Physical Internet Conference, 2021"},{"key":"22_CR39","unstructured":"Lillicrap, T.P., et al.: Continuous control with deep reinforcement learning. arXiv preprint arXiv:1509.02971 (2015)"},{"key":"22_CR40","unstructured":"Author, A., Another, B.: Towards explainable topsis: visual insights into the effects of weights and aggregations on rankings. J. Decision Making (2023)"},{"key":"22_CR41","doi-asserted-by":"crossref","unstructured":"Rezaei, S., Toffano, F., Brown, K.N.: Gym-DC: a distribution centre reinforcement learning environment. In: International Conference on Pattern Recognition, pp. 687\u2013699 (2022)","DOI":"10.1007\/978-3-031-37742-6_53"},{"key":"22_CR42","first-page":"151","volume-title":"Physical Internet Foundations","author":"B Montreuil","year":"2013","unstructured":"Montreuil, B., Meller, R.D., Ballot, E.: Physical Internet Foundations, pp. 151\u2013166. Springer, Berlin Heidelberg (2013)"}],"container-title":["Lecture Notes in Computer Science","Machine Learning, Optimization, and Data Science"],"original-title":[],"language":"en","link":[{"URL":"https:\/\/link.springer.com\/content\/pdf\/10.1007\/978-3-031-82481-4_22","content-type":"unspecified","content-version":"vor","intended-application":"similarity-checking"}],"deposited":{"date-parts":[[2025,3,3]],"date-time":"2025-03-03T15:45:49Z","timestamp":1741016749000},"score":1,"resource":{"primary":{"URL":"https:\/\/link.springer.com\/10.1007\/978-3-031-82481-4_22"}},"subtitle":[],"short-title":[],"issued":{"date-parts":[[2025]]},"ISBN":["9783031824807","9783031824814"],"references-count":42,"URL":"https:\/\/doi.org\/10.1007\/978-3-031-82481-4_22","relation":{},"ISSN":["0302-9743","1611-3349"],"issn-type":[{"type":"print","value":"0302-9743"},{"type":"electronic","value":"1611-3349"}],"subject":[],"published":{"date-parts":[[2025]]},"assertion":[{"value":"4 March 2025","order":1,"name":"first_online","label":"First Online","group":{"name":"ChapterHistory","label":"Chapter History"}}]}}