{"status":"ok","message-type":"work","message-version":"1.0.0","message":{"indexed":{"date-parts":[[2024,5,1]],"date-time":"2024-05-01T00:22:03Z","timestamp":1714522923624},"reference-count":54,"publisher":"Elsevier BV","license":[{"start":{"date-parts":[[2024,4,1]],"date-time":"2024-04-01T00:00:00Z","timestamp":1711929600000},"content-version":"tdm","delay-in-days":0,"URL":"https:\/\/www.elsevier.com\/tdm\/userlicense\/1.0\/"},{"start":{"date-parts":[[2024,4,1]],"date-time":"2024-04-01T00:00:00Z","timestamp":1711929600000},"content-version":"tdm","delay-in-days":0,"URL":"https:\/\/www.elsevier.com\/legal\/tdmrep-license"},{"start":{"date-parts":[[2024,4,29]],"date-time":"2024-04-29T00:00:00Z","timestamp":1714348800000},"content-version":"vor","delay-in-days":28,"URL":"http:\/\/creativecommons.org\/licenses\/by\/4.0\/"}],"content-domain":{"domain":["elsevier.com","sciencedirect.com"],"crossmark-restriction":true},"short-container-title":["Computers &amp; Industrial Engineering"],"published-print":{"date-parts":[[2024,4]]},"DOI":"10.1016\/j.cie.2024.110044","type":"journal-article","created":{"date-parts":[[2024,3,6]],"date-time":"2024-03-06T17:21:40Z","timestamp":1709745700000},"page":"110044","update-policy":"http:\/\/dx.doi.org\/10.1016\/elsevier_cm_policy","source":"Crossref","is-referenced-by-count":0,"title":["Reinforcement Learning for Disassembly Task Control"],"prefix":"10.1016","volume":"190","author":[{"given":"Sachini","family":"Weerasekara","sequence":"first","affiliation":[]},{"ORCID":"http:\/\/orcid.org\/0009-0001-0131-4955","authenticated-orcid":false,"given":"Wei","family":"Li","sequence":"additional","affiliation":[]},{"given":"Jacqueline","family":"Isaacs","sequence":"additional","affiliation":[]},{"ORCID":"http:\/\/orcid.org\/0000-0001-5845-7714","authenticated-orcid":false,"given":"Sagar","family":"Kamarthi","sequence":"additional","affiliation":[]}],"member":"78","reference":[{"key":"10.1016\/j.cie.2024.110044_b1","series-title":"E-waste statistics","author":"Alianza Recycling & Recovery","year":"2023"},{"key":"10.1016\/j.cie.2024.110044_b2","doi-asserted-by":"crossref","DOI":"10.1016\/j.ijpe.2022.108673","article-title":"Hybridizations in line balancing problems: A comprehensive review on new trends and formulations","author":"Batta\u00efa","year":"2022","journal-title":"International Journal of Production Economics"},{"key":"10.1016\/j.cie.2024.110044_b3","series-title":"2022 IEEE international conference on systems, man, and cybernetics","first-page":"3216","article-title":"A Q-learning-based selective disassembly sequence planning method","author":"Bi","year":"2022"},{"key":"10.1016\/j.cie.2024.110044_b4","doi-asserted-by":"crossref","first-page":"684","DOI":"10.1016\/j.procir.2023.02.115","article-title":"Disassembly sequence planning for target parts of end-of-life smartphones using Q-learning algorithm","volume":"116","author":"Chen","year":"2023","journal-title":"Procedia CIRP"},{"key":"10.1016\/j.cie.2024.110044_b5","doi-asserted-by":"crossref","DOI":"10.1177\/09544054221136526","article-title":"Disassembly leveling and lot-sizing for multiple product types with uncertain component demands","author":"Choi","year":"2023","journal-title":"Proceedings of the Institution of Mechanical Engineers, Part B (Management and Engineering Manufacture)"},{"key":"10.1016\/j.cie.2024.110044_b6","article-title":"Disassembly leveling and lot-sizing for multiple product types with uncertain component demands","author":"Choi","year":"2024","journal-title":"Proceedings of the Institution of Mechanical Engineers, Part B (Management and Engineering Manufacture)"},{"key":"10.1016\/j.cie.2024.110044_b7","series-title":"High-end displays to be a third of TV displays in 2025","author":"Compound Semiconductor","year":"2021"},{"issue":"1","key":"10.1016\/j.cie.2024.110044_b8","doi-asserted-by":"crossref","DOI":"10.1049\/cim2.12074","article-title":"Robotic disassembly sequence planning considering parts failure features","volume":"5","author":"Cui","year":"2023","journal-title":"IET Collaborative Intelligent Manufacturing"},{"key":"10.1016\/j.cie.2024.110044_b9","series-title":"The global commitment 2022","author":"Ellen MacArthur Foundation","year":"2022"},{"key":"10.1016\/j.cie.2024.110044_b10","series-title":"The global market for nanotechnology and engineered nanomaterials (ENM) to 2033 markets, applications, production and producers","author":"Future Markets Inc","year":"2022"},{"key":"10.1016\/j.cie.2024.110044_b11","series-title":"2015 international conference on industrial engineering and systems management","first-page":"1329","article-title":"Metaheuristic based optimization for capacitated disassembly lot sizing problem with lost sales","author":"Godichaud","year":"2015"},{"key":"10.1016\/j.cie.2024.110044_b12","first-page":"1","article-title":"Reinforcement learning for disassembly system optimization problems: A survey","author":"Guo","year":"2023","journal-title":"International Journal of Network Dynamics and Intelligence"},{"issue":"2","key":"10.1016\/j.cie.2024.110044_b13","doi-asserted-by":"crossref","first-page":"165","DOI":"10.1289\/ehp.8284","article-title":"A toxicologic review of quantum dots: toxicity depends on physicochemical and environmental factors","volume":"114","author":"Hardman","year":"2006","journal-title":"Environmental Health Perspectives"},{"issue":"1","key":"10.1016\/j.cie.2024.110044_b14","doi-asserted-by":"crossref","first-page":"11","DOI":"10.1109\/TITS.2020.3008612","article-title":"Deep reinforcement learning for intelligent transportation systems: A survey","volume":"23","author":"Haydari","year":"2022","journal-title":"IEEE Transactions on Intelligent Transportation Systems"},{"issue":"4","key":"10.1016\/j.cie.2024.110044_b15","doi-asserted-by":"crossref","first-page":"1225","DOI":"10.1080\/00207543.2015.1058536","article-title":"Capacitated disassembly scheduling with parts commonality and start-up cost and its industrial application","volume":"54","author":"Ji","year":"2016","journal-title":"International Journal of Production Research"},{"key":"10.1016\/j.cie.2024.110044_b16","doi-asserted-by":"crossref","first-page":"1463","DOI":"10.1007\/s00170-012-4570-9","article-title":"Disassembly leveling and lot sizing for multiple product types: a basic model and its extension","volume":"82","author":"Kang","year":"2016","journal-title":"International Journal of Advanced Manufacturing Technology"},{"issue":"5","key":"10.1016\/j.cie.2024.110044_b17","doi-asserted-by":"crossref","first-page":"867","DOI":"10.1177\/0954405416661001","article-title":"Multi-period disassembly levelling and lot-sizing for multiple product types with parts commonality","volume":"232","author":"Kim","year":"2018","journal-title":"Proceedings of the Institution of Mechanical Engineers, Part B (Management and Engineering Manufacture)"},{"key":"10.1016\/j.cie.2024.110044_b18","doi-asserted-by":"crossref","first-page":"225","DOI":"10.1016\/j.promfg.2020.01.030","article-title":"Towards a robot simulation framework for e-waste disassembly using reinforcement learning","volume":"38","author":"Kristensen","year":"2019","journal-title":"Procedia Manufacturing"},{"key":"10.1016\/j.cie.2024.110044_b19","doi-asserted-by":"crossref","first-page":"75","DOI":"10.1016\/j.cirpj.2022.11.003","article-title":"Deep reinforcement learning in smart manufacturing: A review and prospects","volume":"40","author":"Li","year":"2023","journal-title":"CIRP Journal of Manufacturing Science and Technology"},{"key":"10.1016\/j.cie.2024.110044_b20","series-title":"Continuous control with deep reinforcement learning","author":"Lillicrap","year":"2015"},{"issue":"11\u201312","key":"10.1016\/j.cie.2024.110044_b21","doi-asserted-by":"crossref","first-page":"3533","DOI":"10.1007\/s00170-021-07265-2","article-title":"Task-level decision-making for dynamic and stochastic human-robot collaboration based on dual agents deep reinforcement learning","volume":"115","author":"Liu","year":"2021","journal-title":"International Journal of Advanced Manufacturing Technology"},{"issue":"12","key":"10.1016\/j.cie.2024.110044_b22","doi-asserted-by":"crossref","first-page":"4027","DOI":"10.1080\/00207543.2019.1578906","article-title":"Human-robot collaboration in disassembly for sustainable manufacturing","volume":"57","author":"Liu","year":"2019","journal-title":"International Journal of Production Research"},{"issue":"1","key":"10.1016\/j.cie.2024.110044_b23","doi-asserted-by":"crossref","first-page":"244","DOI":"10.1016\/j.ejor.2017.08.032","article-title":"Capacitated disassembly scheduling under stochastic yield and demand","volume":"269","author":"Liu","year":"2018","journal-title":"European Journal of Operational Research"},{"key":"10.1016\/j.cie.2024.110044_b24","series-title":"2022 IEEE international conference on systems, man, and cybernetics","first-page":"568","article-title":"An improved Q-learning algorithm for human-robot collaboration two-sided disassembly line balancing problems","author":"Liu","year":"2022"},{"key":"10.1016\/j.cie.2024.110044_b25","first-page":"1","article-title":"Adaptive disassembly sequence planning for VR maintenance training via deep reinforcement learning","author":"Mao","year":"2021","journal-title":"International Journal of Advanced Manufacturing Technology"},{"key":"10.1016\/j.cie.2024.110044_b26","series-title":"2021 international conference on information technology","first-page":"424","article-title":"A reinforcement learning approach for disassembly line balancing problem","author":"Mete","year":"2021"},{"issue":"7540","key":"10.1016\/j.cie.2024.110044_b27","doi-asserted-by":"crossref","first-page":"529","DOI":"10.1038\/nature14236","article-title":"Human-level control through deep reinforcement learning","volume":"518","author":"Mnih","year":"2015","journal-title":"Nature"},{"key":"10.1016\/j.cie.2024.110044_b28","series-title":"Monthly global climate report for annual 2021","author":"NOAA National Centers for Environmental Information","year":"2022"},{"issue":"2","key":"10.1016\/j.cie.2024.110044_b29","doi-asserted-by":"crossref","first-page":"10682","DOI":"10.1016\/j.ifacol.2020.12.2840","article-title":"Disassembly lot sizing problem with disposal decisions for multiple product types with parts commonality","volume":"53","author":"Pour-Massahian-Tafti","year":"2020","journal-title":"IFAC-PapersOnLine"},{"issue":"22","key":"10.1016\/j.cie.2024.110044_b30","doi-asserted-by":"crossref","first-page":"6898","DOI":"10.1080\/00207543.2020.1829148","article-title":"New models and efficient methods for single-product disassembly lot-sizing problem with surplus inventory decisions","volume":"59","author":"Pour-Massahian-Tafti","year":"2021","journal-title":"International Journal of Production Research"},{"key":"10.1016\/j.cie.2024.110044_b31","series-title":"Stable baselines3","author":"Raffin","year":"2019"},{"key":"10.1016\/j.cie.2024.110044_b32","doi-asserted-by":"crossref","DOI":"10.1016\/j.engappai.2022.105676","article-title":"Integrated lot-sizing and scheduling: Mitigation of uncertainty in demand and processing time by machine learning","volume":"118","author":"Rohaninejad","year":"2023","journal-title":"Engineering Applications of Artificial Intelligence"},{"key":"10.1016\/j.cie.2024.110044_b33","series-title":"International conference on machine learning","first-page":"1889","article-title":"Trust region policy optimization","author":"Schulman","year":"2015"},{"key":"10.1016\/j.cie.2024.110044_b34","series-title":"Proximal policy optimization algorithms","author":"Schulman","year":"2017"},{"issue":"2","key":"10.1016\/j.cie.2024.110044_b35","doi-asserted-by":"crossref","DOI":"10.1016\/j.jjimei.2022.100094","article-title":"How are reinforcement learning and deep learning algorithms used for big data based decision making in financial industries\u2013A review and research agenda","volume":"2","author":"Singh","year":"2022","journal-title":"International Journal of Information Management Data Insights"},{"key":"10.1016\/j.cie.2024.110044_b36","doi-asserted-by":"crossref","first-page":"50","DOI":"10.1016\/j.jmsy.2020.05.002","article-title":"New mixed integer approach to solve a multi-level capacitated disassembly lot-sizing problem with defective items and backlogging","volume":"56","author":"Slama","year":"2020","journal-title":"Journal of Manufacturing Systems"},{"key":"10.1016\/j.cie.2024.110044_b37","doi-asserted-by":"crossref","DOI":"10.1016\/j.cie.2021.107468","article-title":"Genetic algorithm and Monte Carlo simulation for a stochastic capacitated disassembly lot-sizing problem under random lead times","volume":"159","author":"Slama","year":"2021","journal-title":"Computers & Industrial Engineering"},{"issue":"13","key":"10.1016\/j.cie.2024.110044_b38","doi-asserted-by":"crossref","first-page":"595","DOI":"10.1016\/j.ifacol.2019.11.224","article-title":"Scenario-based stochastic linear programming model for multi-period disassembly lot-sizing problems under random lead time","volume":"52","author":"Slama","year":"2019","journal-title":"IFAC-PapersOnLine"},{"issue":"3","key":"10.1016\/j.cie.2024.110044_b39","doi-asserted-by":"crossref","first-page":"1183","DOI":"10.1016\/j.ejor.2022.03.025","article-title":"Stochastic program for disassembly lot-sizing under uncertain component refurbishing lead times","volume":"303","author":"Slama","year":"2022","journal-title":"European Journal of Operational Research"},{"key":"10.1016\/j.cie.2024.110044_b40","series-title":"Reinforcement learning: An introduction","author":"Sutton","year":"2018"},{"key":"10.1016\/j.cie.2024.110044_b41","series-title":"2019 IEEE 6th international conference on industrial engineering and applications","first-page":"135","article-title":"Single product disassembly lot sizing problem with disposal","author":"Tafti","year":"2019"},{"key":"10.1016\/j.cie.2024.110044_b42","series-title":"Proc. int. conf. ind. engine","first-page":"1866","article-title":"Inventory management in multi-product multi-demand disassembly line using reinforcement learning","author":"Tuncel","year":"2012"},{"key":"10.1016\/j.cie.2024.110044_b43","doi-asserted-by":"crossref","first-page":"647","DOI":"10.1007\/s10845-012-0711-0","article-title":"Solving large scale disassembly line balancing problem with uncertainty using reinforcement learning","volume":"25","author":"Tuncel","year":"2014","journal-title":"Journal of Intelligent Manufacturing"},{"key":"10.1016\/j.cie.2024.110044_b44","first-page":"30","article-title":"Multi-kanban mechanism for appliance disassembly","volume":"vol. 5997","author":"Udomsawat","year":"2005"},{"key":"10.1016\/j.cie.2024.110044_b45","first-page":"42","article-title":"Controlling disassembly line with multi-kanban system","volume":"vol. 6385","author":"Udomsawat","year":"2006"},{"key":"10.1016\/j.cie.2024.110044_b46","first-page":"85","article-title":"Multikanban model for disassembly line with demand fluctuation","volume":"vol. 5262","author":"Udomsawat","year":"2004"},{"issue":"20","key":"10.1016\/j.cie.2024.110044_b47","doi-asserted-by":"crossref","first-page":"6209","DOI":"10.1080\/00207543.2013.825406","article-title":"Flexible disassembly planning considering product conditions","volume":"51","author":"Ullerich","year":"2013","journal-title":"International Journal of Production Research"},{"key":"10.1016\/j.cie.2024.110044_b48","series-title":"Cleaning up electronic waste (E-Waste)","author":"United States Environmental Protection Agency","year":"2022"},{"key":"10.1016\/j.cie.2024.110044_b49","series-title":"2022 Final list of critical minerals","author":"U.S. Geological Survey Department of the Interior","year":"2022"},{"issue":"2","key":"10.1016\/j.cie.2024.110044_b50","doi-asserted-by":"crossref","first-page":"575","DOI":"10.1007\/s10845-021-01863-3","article-title":"Modelling and condition-based control of a flexible and hybrid disassembly system with manual and autonomous workstations using reinforcement learning","volume":"33","author":"Wurster","year":"2022","journal-title":"Journal of Intelligent Manufacturing"},{"key":"10.1016\/j.cie.2024.110044_b51","first-page":"1","article-title":"Multi-agent reinforcement learning method for disassembly sequential task optimization based on human-robot collaborative disassembly in electric vehicle battery recycling","author":"Xiao","year":"2023","journal-title":"Journal of Manufacturing Science and Engineering"},{"issue":"1","key":"10.1016\/j.cie.2024.110044_b52","doi-asserted-by":"crossref","first-page":"1","DOI":"10.1145\/3477600","article-title":"Reinforcement learning in healthcare: A survey","volume":"55","author":"Yu","year":"2021","journal-title":"ACM Computing Surveys"},{"key":"10.1016\/j.cie.2024.110044_b53","series-title":"2022 IEEE international conference on systems, man, and cybernetics","first-page":"872","article-title":"An improved Q-learning algorithm for solving disassembly line balancing problem considering carbon emission","author":"Zhang","year":"2022"},{"issue":"4","key":"10.1016\/j.cie.2024.110044_b54","doi-asserted-by":"crossref","first-page":"7807","DOI":"10.1109\/LRA.2021.3098248","article-title":"Reinforcement learning-based selective disassembly sequence planning for the end-of-life products with structure uncertainty","volume":"6","author":"Zhao","year":"2021","journal-title":"IEEE Robotics and Automation Letters"}],"container-title":["Computers &amp; Industrial Engineering"],"original-title":[],"language":"en","link":[{"URL":"https:\/\/api.elsevier.com\/content\/article\/PII:S0360835224001657?httpAccept=text\/xml","content-type":"text\/xml","content-version":"vor","intended-application":"text-mining"},{"URL":"https:\/\/api.elsevier.com\/content\/article\/PII:S0360835224001657?httpAccept=text\/plain","content-type":"text\/plain","content-version":"vor","intended-application":"text-mining"}],"deposited":{"date-parts":[[2024,4,30]],"date-time":"2024-04-30T05:23:18Z","timestamp":1714454598000},"score":1,"resource":{"primary":{"URL":"https:\/\/linkinghub.elsevier.com\/retrieve\/pii\/S0360835224001657"}},"subtitle":[],"short-title":[],"issued":{"date-parts":[[2024,4]]},"references-count":54,"alternative-id":["S0360835224001657"],"URL":"http:\/\/dx.doi.org\/10.1016\/j.cie.2024.110044","relation":{},"ISSN":["0360-8352"],"issn-type":[{"value":"0360-8352","type":"print"}],"subject":[],"published":{"date-parts":[[2024,4]]},"assertion":[{"value":"Elsevier","name":"publisher","label":"This article is maintained by"},{"value":"Reinforcement Learning for Disassembly Task Control","name":"articletitle","label":"Article Title"},{"value":"Computers & Industrial Engineering","name":"journaltitle","label":"Journal Title"},{"value":"https:\/\/doi.org\/10.1016\/j.cie.2024.110044","name":"articlelink","label":"CrossRef DOI link to publisher maintained version"},{"value":"article","name":"content_type","label":"Content Type"},{"value":"\u00a9 2024 The Authors. Published by Elsevier Ltd.","name":"copyright","label":"Copyright"}],"article-number":"110044"}}