{"status":"ok","message-type":"work","message-version":"1.0.0","message":{"indexed":{"date-parts":[[2026,2,16]],"date-time":"2026-02-16T16:48:36Z","timestamp":1771260516990,"version":"3.50.1"},"publisher-location":"Cham","reference-count":31,"publisher":"Springer International Publishing","isbn-type":[{"value":"9783030143466","type":"print"},{"value":"9783030143473","type":"electronic"}],"license":[{"start":{"date-parts":[[2019,3,21]],"date-time":"2019-03-21T00:00:00Z","timestamp":1553126400000},"content-version":"tdm","delay-in-days":0,"URL":"http:\/\/www.springer.com\/tdm"}],"content-domain":{"domain":["link.springer.com"],"crossmark-restriction":false},"short-container-title":[],"published-print":{"date-parts":[[2020]]},"DOI":"10.1007\/978-3-030-14347-3_34","type":"book-chapter","created":{"date-parts":[[2019,3,20]],"date-time":"2019-03-20T08:08:34Z","timestamp":1553069314000},"page":"350-359","update-policy":"https:\/\/doi.org\/10.1007\/springer_crossmark_policy","source":"Crossref","is-referenced-by-count":53,"title":["Deep Reinforcement Learning as a Job Shop Scheduling Solver: A Literature Review"],"prefix":"10.1007","author":[{"given":"Bruno","family":"Cunha","sequence":"first","affiliation":[]},{"given":"Ana M.","family":"Madureira","sequence":"additional","affiliation":[]},{"given":"Benjamim","family":"Fonseca","sequence":"additional","affiliation":[]},{"given":"Duarte","family":"Coelho","sequence":"additional","affiliation":[]}],"member":"297","published-online":{"date-parts":[[2019,3,21]]},"reference":[{"issue":"2","key":"34_CR1","doi-asserted-by":"publisher","first-page":"141","DOI":"10.1109\/32.4634","volume":"14","author":"TL Casavant","year":"1988","unstructured":"Casavant, T.L., Kuhl, J.G.: A taxonomy of scheduling in general-purpose distributed computing systems. IEEE Trans. Softw. Eng. 14(2), 141\u2013154 (1988)","journal-title":"IEEE Trans. Softw. Eng."},{"issue":"4","key":"34_CR2","doi-asserted-by":"publisher","first-page":"833","DOI":"10.1111\/j.1540-5915.2000.tb00945.x","volume":"31","author":"S Ahire","year":"2000","unstructured":"Ahire, S., Greenwood, G., et al.: Workforce-constrained preventive maintenance scheduling using evolution strategies. Decis. Sci. 31(4), 833\u2013859 (2000)","journal-title":"Decis. Sci."},{"issue":"8","key":"34_CR3","doi-asserted-by":"publisher","first-page":"2269","DOI":"10.1080\/002075498192896","volume":"36","author":"AI Sonmez","year":"1998","unstructured":"Sonmez, A.I., Baykasoglu, A.: A new dynamic programming formulation of (n x m) flowshop sequencing problems with due dates. Int. J. Prod. Res. 36(8), 2269\u20132283 (1998)","journal-title":"Int. J. Prod. Res."},{"key":"34_CR4","doi-asserted-by":"crossref","unstructured":"Yamada, T., Yamada, T., Nakano, R.: Genetic algorithms for job-shop scheduling problems. In: Modern Heuristic for Decision Support, pp. 474\u2013479 (1997)","DOI":"10.1049\/PBCE055E_ch7"},{"issue":"4","key":"34_CR5","doi-asserted-by":"publisher","first-page":"84","DOI":"10.1287\/inte.18.4.84","volume":"18","author":"KN McKay","year":"1988","unstructured":"McKay, K.N., Safayeni, F.R., Buzacott, J.A.: Job-shop scheduling theory: what is relevant? Interfaces 18(4), 84\u201390 (1988)","journal-title":"Interfaces"},{"key":"34_CR6","first-page":"445","volume":"4","author":"EL Lawler","year":"1993","unstructured":"Lawler, E.L., Lenstra, J.K., et al.: Sequencing and scheduling: algorithms and complexity. Handb. Oper. Res. Manag. Sci. 4, 445\u2013522 (1993)","journal-title":"Handb. Oper. Res. Manag. Sci."},{"issue":"7553","key":"34_CR7","doi-asserted-by":"publisher","first-page":"436","DOI":"10.1038\/nature14539","volume":"521","author":"Y LeCun","year":"2015","unstructured":"LeCun, Y., Bengio, Y., Hinton, G.: Deep learning. Nature 521(7553), 436 (2015)","journal-title":"Nature"},{"key":"34_CR8","unstructured":"Knight, W.: Reinforcement Learning: 10 Breakthrough Technologies 2017 - MIT Technology Review (2017)"},{"key":"34_CR9","volume-title":"Scheduling: Theory, Algorithms, and Systems","author":"ML Pinedo","year":"2008","unstructured":"Pinedo, M.L.: Scheduling: Theory, Algorithms, and Systems, 4th edn. Springer, New York (2008)","edition":"4"},{"key":"34_CR10","unstructured":"Madureira, A., Pereira, I., Falc\u00e3o, D.: Dynamic adaptation for scheduling under rush manufacturing orders with case-based reasoning. In: International Conference on Algebraic and Symbolic Computation (2013)"},{"key":"34_CR11","doi-asserted-by":"publisher","first-page":"471","DOI":"10.1023\/A:1025753309346","volume":"14","author":"YH Lee","year":"2003","unstructured":"Lee, Y.H., Kumara, S.R.T., Chatterjee, K.: Multiagent based dynamic resource scheduling for distributed multiple projects using a market mechanism. J. Intell. Manuf. 14, 471\u2013484 (2003)","journal-title":"J. Intell. Manuf."},{"key":"34_CR12","unstructured":"Ouelhadj, D., Cowling, P., Petrovic, S.: Utility and stability measures for agent-based dynamic scheduling of steel continuous casting. In: 2003 IEEE International Conference on Robotics and Automation, vol. 1 (2003)"},{"key":"34_CR13","doi-asserted-by":"publisher","first-page":"26","DOI":"10.1002\/nav.20488","volume":"59","author":"S Goren","year":"2012","unstructured":"Goren, S., Sabuncuoglu, I., Koc, U.: Optimization of schedule stability and efficiency under processing time variability and random machine breakdowns in a job shop environment. Naval Res. Logistics 59, 26\u201338 (2012)","journal-title":"Naval Res. Logistics"},{"key":"34_CR14","doi-asserted-by":"publisher","first-page":"229","DOI":"10.1016\/j.cie.2016.07.020","volume":"99","author":"M Dios","year":"2016","unstructured":"Dios, M., Framinan, J.M.: A review and classification of computer-based manufacturing scheduling tools. Comput. Industr. Eng. 99, 229\u2013249 (2016)","journal-title":"Comput. Industr. Eng."},{"key":"34_CR15","doi-asserted-by":"crossref","unstructured":"Cunha, B., Madureira, A., et\u00a0al.: Evaluating the effectiveness of Bayesian and neural networks for adaptive scheduling systems. In: 2016 IEEE Symposium Series on Computational Intelligence (SSCI), pp. 1\u20136. IEEE, December 2016","DOI":"10.1109\/SSCI.2016.7849997"},{"key":"34_CR16","doi-asserted-by":"crossref","unstructured":"Madureira, A., Gomes, S., et\u00a0al.: Prototype of an adaptive decision support system for interactive scheduling with metacognition and user modeling experience. In: Sixth World Congress on Nature and Biologically Inspired Computing (NaBIC) (2014)","DOI":"10.1109\/NaBIC.2014.6921869"},{"key":"34_CR17","doi-asserted-by":"publisher","first-page":"771","DOI":"10.1007\/978-3-319-53480-0_76","volume-title":"ISDA 2016","author":"A Madureira","year":"2017","unstructured":"Madureira, A., Pereira, I., Cunha, B.: Specification of an architecture for self-organizing scheduling systems. In: Madureira, A., Abraham, A., Gamboa, D., Novais, P. (eds.) ISDA 2016, vol. 557, pp. 771\u2013780. Springer, Heidelberg (2017). https:\/\/doi.org\/10.1007\/978-3-319-53480-0_76"},{"key":"34_CR18","doi-asserted-by":"publisher","DOI":"10.1002\/9780470496916","volume-title":"Metaheuristics: From Design to Implementation","author":"EG Talbi","year":"2009","unstructured":"Talbi, E.G.: Metaheuristics: From Design to Implementation. Wiley, Hoboken (2009)"},{"key":"34_CR19","doi-asserted-by":"publisher","DOI":"10.1201\/9781420010749","volume-title":"Handbook of Approximation Algorithms and Metaheuristics","author":"T Gonzalez","year":"2007","unstructured":"Gonzalez, T.: Handbook of Approximation Algorithms and Metaheuristics. Chapman & Hall, London (2007)"},{"issue":"5","key":"34_CR20","doi-asserted-by":"publisher","first-page":"533","DOI":"10.1016\/0305-0548(86)90048-1","volume":"13","author":"F Glover","year":"1986","unstructured":"Glover, F.: Future paths for integer programming and links to artificial intelligence. Comput. Oper. Res. 13(5), 533\u2013549 (1986)","journal-title":"Comput. Oper. Res."},{"key":"34_CR21","unstructured":"Holland, J.H.: Adaptation in Natural and Artificial Systems, p. 183. University of Michigan Press, Ann Arbor (1975)"},{"issue":"4","key":"34_CR22","first-page":"393","volume":"12","author":"RMA Rangel-Merino","year":"2005","unstructured":"Rangel-Merino, R.M.A., L\u00f3pez-Bonilla, J.L.: Optimization Method Based on Genetic Algorithms. Apeiron 12(4), 393\u2013408 (2005)","journal-title":"Apeiron"},{"key":"34_CR23","doi-asserted-by":"crossref","unstructured":"Ludvig, E.A., Bellemare, M.G., Pearson, K.G.: A primer on reinforcement learning in the brain: psychological, computational, and neural perspectives. In: Computational Neuroscience for Advancing Artificial Intelligence: Models, Methods and Applications, pp. 111\u2013144. IGI Global (2011)","DOI":"10.4018\/978-1-60960-021-1.ch006"},{"key":"34_CR24","doi-asserted-by":"crossref","unstructured":"Degris, T., Pilarski, P., Sutton, R.: Model-free reinforcement learning with continuous action in practice. In: 2012 American Control Conference (ACC), pp. 2177\u20132182. IEEE (2012)","DOI":"10.1109\/ACC.2012.6315022"},{"issue":"3\u20134","key":"34_CR25","first-page":"279","volume":"8","author":"CJCH Watkins","year":"1992","unstructured":"Watkins, C.J.C.H., Dayan, P.: Q-learning. Mach. Learn. 8(3\u20134), 279\u2013292 (1992)","journal-title":"Mach. Learn."},{"key":"34_CR26","doi-asserted-by":"publisher","first-page":"237","DOI":"10.1613\/jair.301","volume":"4","author":"LP Kaelbling","year":"1996","unstructured":"Kaelbling, L.P., Littman, M.L., Moore, A.W.: Reinforcement learning: a survey. J. Artif. Intell. Res. 4, 237\u2013285 (1996)","journal-title":"J. Artif. Intell. Res."},{"key":"34_CR27","unstructured":"Mnih, V., Kavukcuoglu, K., et\u00a0al.: Playing Atari with Deep Reinforcement Learning. ArXiv e-prints, no. 1312.5602 (2013)"},{"key":"34_CR28","unstructured":"Lillicrap, T.P., Hunt, J.J., et\u00a0al.: Continuous control with deep reinforcement learning, September 2015"},{"key":"34_CR29","unstructured":"Plappert, M., Houthooft, R., et\u00a0al.: Parameter Space Noise for Exploration (2017)"},{"issue":"11","key":"34_CR30","doi-asserted-by":"publisher","first-page":"1069","DOI":"10.1057\/jors.1990.166","volume":"41","author":"JE Beasley","year":"1990","unstructured":"Beasley, J.E.: OR-Library: distributing test problems by electronic mail. J. Oper. Res. Soc. 41(11), 1069\u20131072 (1990)","journal-title":"J. Oper. Res. Soc."},{"issue":"2","key":"34_CR31","doi-asserted-by":"publisher","first-page":"278","DOI":"10.1016\/0377-2217(93)90182-M","volume":"64","author":"E Taillard","year":"1993","unstructured":"Taillard, E.: Benchmarks for basic scheduling problems. Eur. J. Oper. Res. 64(2), 278\u2013285 (1993)","journal-title":"Eur. J. Oper. Res."}],"container-title":["Advances in Intelligent Systems and Computing","Hybrid Intelligent Systems"],"original-title":[],"language":"en","link":[{"URL":"http:\/\/link.springer.com\/content\/pdf\/10.1007\/978-3-030-14347-3_34","content-type":"unspecified","content-version":"vor","intended-application":"similarity-checking"}],"deposited":{"date-parts":[[2022,9,14]],"date-time":"2022-09-14T01:21:12Z","timestamp":1663118472000},"score":1,"resource":{"primary":{"URL":"http:\/\/link.springer.com\/10.1007\/978-3-030-14347-3_34"}},"subtitle":[],"short-title":[],"issued":{"date-parts":[[2019,3,21]]},"ISBN":["9783030143466","9783030143473"],"references-count":31,"URL":"https:\/\/doi.org\/10.1007\/978-3-030-14347-3_34","relation":{},"ISSN":["2194-5357","2194-5365"],"issn-type":[{"value":"2194-5357","type":"print"},{"value":"2194-5365","type":"electronic"}],"subject":[],"published":{"date-parts":[[2019,3,21]]},"assertion":[{"value":"21 March 2019","order":1,"name":"first_online","label":"First Online","group":{"name":"ChapterHistory","label":"Chapter History"}},{"value":"HIS","order":1,"name":"conference_acronym","label":"Conference Acronym","group":{"name":"ConferenceInfo","label":"Conference Information"}},{"value":"International Conference on Hybrid Intelligent Systems","order":2,"name":"conference_name","label":"Conference Name","group":{"name":"ConferenceInfo","label":"Conference Information"}},{"value":"Porto","order":3,"name":"conference_city","label":"Conference City","group":{"name":"ConferenceInfo","label":"Conference Information"}},{"value":"Portugal","order":4,"name":"conference_country","label":"Conference Country","group":{"name":"ConferenceInfo","label":"Conference Information"}},{"value":"2018","order":5,"name":"conference_year","label":"Conference Year","group":{"name":"ConferenceInfo","label":"Conference Information"}},{"value":"13 December 2018","order":7,"name":"conference_start_date","label":"Conference Start Date","group":{"name":"ConferenceInfo","label":"Conference Information"}},{"value":"15 December 2018","order":8,"name":"conference_end_date","label":"Conference End Date","group":{"name":"ConferenceInfo","label":"Conference Information"}},{"value":"18","order":9,"name":"conference_number","label":"Conference Number","group":{"name":"ConferenceInfo","label":"Conference Information"}},{"value":"his2018","order":10,"name":"conference_id","label":"Conference ID","group":{"name":"ConferenceInfo","label":"Conference Information"}},{"value":"http:\/\/www.mirlabs.net\/his18\/","order":11,"name":"conference_url","label":"Conference URL","group":{"name":"ConferenceInfo","label":"Conference Information"}}]}}