{"status":"ok","message-type":"work","message-version":"1.0.0","message":{"indexed":{"date-parts":[[2025,9,11]],"date-time":"2025-09-11T19:32:16Z","timestamp":1757619136145,"version":"3.44.0"},"publisher-location":"Singapore","reference-count":33,"publisher":"Springer Nature Singapore","isbn-type":[{"type":"print","value":"9789819698172"},{"type":"electronic","value":"9789819698189"}],"license":[{"start":{"date-parts":[[2025,1,1]],"date-time":"2025-01-01T00:00:00Z","timestamp":1735689600000},"content-version":"tdm","delay-in-days":0,"URL":"https:\/\/www.springernature.com\/gp\/researchers\/text-and-data-mining"},{"start":{"date-parts":[[2025,1,1]],"date-time":"2025-01-01T00:00:00Z","timestamp":1735689600000},"content-version":"vor","delay-in-days":0,"URL":"https:\/\/www.springernature.com\/gp\/researchers\/text-and-data-mining"}],"content-domain":{"domain":["link.springer.com"],"crossmark-restriction":false},"short-container-title":[],"published-print":{"date-parts":[[2025]]},"DOI":"10.1007\/978-981-96-9818-9_39","type":"book-chapter","created":{"date-parts":[[2025,7,19]],"date-time":"2025-07-19T12:24:29Z","timestamp":1752927869000},"page":"461-479","update-policy":"https:\/\/doi.org\/10.1007\/springer_crossmark_policy","source":"Crossref","is-referenced-by-count":0,"title":["Think4CPP: Reinforcement Learning by Thinking with Latent World Model for Safe Coverage Path Planning"],"prefix":"10.1007","author":[{"given":"Zhentang","family":"Liao","sequence":"first","affiliation":[]},{"given":"Meng","family":"Li","sequence":"additional","affiliation":[]},{"given":"Zhongxue","family":"Gan","sequence":"additional","affiliation":[]},{"given":"Lihua","family":"Zhang","sequence":"additional","affiliation":[]},{"given":"Zhiyan","family":"Dong","sequence":"additional","affiliation":[]}],"member":"297","published-online":{"date-parts":[[2025,7,20]]},"reference":[{"key":"39_CR1","doi-asserted-by":"crossref","unstructured":"Santos, L.C., Santos, F.N., Pires, E.S., Valente, A., Costa, P., Magalhaes, S.: Path planning for ground robots in agriculture: a short review. In: 2020 IEEE International Conference on Autonomous Robot Systems and Competitions (ICARSC), pp. 61\u201366. IEEE, New York (2020)","DOI":"10.1109\/ICARSC49921.2020.9096177"},{"key":"39_CR2","doi-asserted-by":"crossref","unstructured":"Bormann, R., Jordan, F., Hampp, J., H\u00e4gele, M.: Indoor coverage path planning: survey, implementation, analysis. In: 2018 IEEE International Conference on Robotics and Automation (ICRA), pp. 1718\u20131725. IEEE, New York (2018)","DOI":"10.1109\/ICRA.2018.8460566"},{"issue":"12","key":"39_CR3","doi-asserted-by":"publisher","first-page":"1258","DOI":"10.1016\/j.robot.2013.09.004","volume":"61","author":"E Galceran","year":"2013","unstructured":"Galceran, E., Carreras, M.: A survey on coverage path planning for robotics. Robot. Autonom. Syst. 61(12), 1258\u20131276 (2013)","journal-title":"Robot. Autonom. Syst."},{"issue":"1\u20132","key":"39_CR4","doi-asserted-by":"publisher","first-page":"25","DOI":"10.1016\/S0925-7721(00)00015-8","volume":"17","author":"EM Arkin","year":"2000","unstructured":"Arkin, E.M., Fekete, S.P., Mitchell, J.S.: Approximation algorithms for lawn mowing and milling. Comput. Geometry 17(1\u20132), 25\u201350 (2000)","journal-title":"Comput. Geometry"},{"issue":"2","key":"39_CR5","doi-asserted-by":"publisher","first-page":"5445","DOI":"10.1109\/LRA.2022.3154006","volume":"7","author":"P Maini","year":"2022","unstructured":"Maini, P., Gonultas, B.M., Isler, V.: Online coverage planning for an autonomous weed mowing robot with curvature constraints. IEEE Robot. Autom. Lett. 7(2), 5445\u20135452 (2022)","journal-title":"IEEE Robot. Autom. Lett."},{"key":"39_CR6","doi-asserted-by":"crossref","unstructured":"Jing, W., Deng, D., Xiao, Z., Liu, Y., Shimada, K.: Coverage path planning using path primitive sampling and primitive coverage graph for visual inspection. In: 2019 IEEE\/RSJ International Conference on Intelligent Robots and Systems (IROS), pp. 1472\u20131479. IEEE, New York (2019)","DOI":"10.1109\/IROS40897.2019.8967969"},{"key":"39_CR7","doi-asserted-by":"publisher","DOI":"10.1016\/j.cie.2021.107612","volume":"161","author":"SW Cho","year":"2021","unstructured":"Cho, S.W., Park, H.J., Lee, H., Shim, D.H., Kim, S.Y.: Coverage path planning for multiple unmanned aerial vehicles in maritime search and rescue operations. Comput. Industr. Eng. 161, 107612 (2021)","journal-title":"Comput. Industr. Eng."},{"issue":"6","key":"39_CR8","doi-asserted-by":"publisher","first-page":"904","DOI":"10.1017\/S0263574718000139","volume":"36","author":"SM Ahmadi","year":"2018","unstructured":"Ahmadi, S.M., Kebriaei, H., Moradi, H.: Constrained coverage path planning: evolutionary and classical approaches. Robotica 36(6), 904\u2013924 (2018)","journal-title":"Robotica"},{"key":"39_CR9","doi-asserted-by":"crossref","unstructured":"Umari, H., Mukhopadhyay, S.: Autonomous robotic exploration based on multiple rapidly-exploring randomized trees. In: 2017 IEEE\/RSJ International Conference on Intelligent Robots and Systems (IROS), pp. 1396\u20131402. IEEE, New York (2017)","DOI":"10.1109\/IROS.2017.8202319"},{"key":"39_CR10","doi-asserted-by":"crossref","unstructured":"Yu, J., Tong, J., Xu, Y., Xu, Z., Dong, H., Yang, T., Wang, Y.: SMMR-Explore: Submap-based multi-robot exploration system with multi-robot multi-target potential field exploration method. In: 2021 IEEE International Conference on Robotics and Automation (ICRA), pp. 8779\u20138785. IEEE, New York (2021)","DOI":"10.1109\/ICRA48506.2021.9561328"},{"issue":"3","key":"39_CR11","doi-asserted-by":"publisher","first-page":"1441","DOI":"10.1109\/TPAMI.2023.3261387","volume":"46","author":"S Baik","year":"2023","unstructured":"Baik, S., Choi, M., Choi, J., Kim, H., Lee, K.M.: Learning to learn task-adaptive hyperparameters for few-shot learning. IEEE Trans. Pattern Analys. Machine Intell. 46(3), 1441\u20131454 (2023)","journal-title":"IEEE Trans. Pattern Analys. Machine Intell."},{"key":"39_CR12","unstructured":"Rothfuss, J., Koenig, C., Rupenyan, A., Krause, A.: Meta-learning priors for safe Bayesian optimization. In: Conference on Robot Learning (CoRL), pp. 237\u2013265. PMLR (2023)"},{"key":"39_CR13","doi-asserted-by":"publisher","first-page":"297","DOI":"10.1007\/s10846-019-01073-3","volume":"98","author":"C Yan","year":"2020","unstructured":"Yan, C., Xiang, X., Wang, C.: Towards real-time path planning through deep reinforcement learning for a UAV in dynamic environments. J. Intell. Robot. Syst. 98, 297\u2013309 (2020)","journal-title":"J. Intell. Robot. Syst."},{"key":"39_CR14","doi-asserted-by":"crossref","unstructured":"Smith, L., Cao, Y., Levine, S.: Grow your limits: Continuous improvement with real-world RL for robotic locomotion. In: 2024 IEEE International Conference on Robotics and Automation (ICRA), pp. 10829\u201310836. IEEE, New York (2024)","DOI":"10.1109\/ICRA57147.2024.10610485"},{"key":"39_CR15","unstructured":"Stachowicz, K., Shah, D., Bhorkar, A., Kostrikov, I., Levine, S.: FastRLAP: A system for learning high-speed driving via deep RL and autonomous practicing. In: Conference on Robot Learning (CoRL), pp. 3100\u20133111. PMLR (2023)"},{"key":"39_CR16","doi-asserted-by":"crossref","unstructured":"Theile, M., Bayerlein, H., Nai, R., Gesbert, D., Caccamo, M.: UAV coverage path planning under varying power constraints using deep reinforcement learning. In: 2020 IEEE\/RSJ International Conference on Intelligent Robots and Systems (IROS), pp. 1444\u20131449. IEEE, New York (2020)","DOI":"10.1109\/IROS45743.2020.9340934"},{"key":"39_CR17","unstructured":"Han, K., Xiao, A., Wu, E., Guo, J., Xu, C., Wang, Y.: Transformer in transformer. In: Proceedings of the 34th Conference on Neural Information Processing Systems (NeurIPS 2021), pp. 15908\u201315919 (2021)"},{"key":"39_CR18","doi-asserted-by":"crossref","unstructured":"Choset, H., Pignon, P.: Coverage path planning: The boustrophedon cellular decomposition. In: Field and Service Robotics, pp. 203\u2013209. Springer, London (1998)","DOI":"10.1007\/978-1-4471-1273-0_32"},{"issue":"4","key":"39_CR19","doi-asserted-by":"publisher","first-page":"331","DOI":"10.1177\/027836402320556359","volume":"21","author":"EU Acar","year":"2002","unstructured":"Acar, E.U., Choset, H., Rizzi, A.A., Atkar, P.N., Hull, D.: Morse decompositions for coverage tasks. Int. J. Robot. Res. 21(4), 331\u2013344 (2002)","journal-title":"Int. J. Robot. Res."},{"key":"39_CR20","doi-asserted-by":"crossref","unstructured":"Gabriely, Y., Rimon, E.: Spiral-STC: An on-line coverage algorithm of grid environments by a mobile robot. In: Proceedings of the 2002 IEEE International Conference on Robotics and Automation (ICRA), vol. 1, pp. 954\u2013960. IEEE, New York (2002)","DOI":"10.1109\/ROBOT.2002.1013479"},{"key":"39_CR21","doi-asserted-by":"crossref","unstructured":"Gonzalez, E., Alvarez, O., Diaz, Y., Parra, C., Bustacara, C.: BSA: A complete coverage algorithm. In: Proceedings of the 2005 IEEE International Conference on Robotics and Automation (ICRA), pp. 2040\u20132044. IEEE, New York (2005)","DOI":"10.1109\/ROBOT.2005.1570413"},{"key":"39_CR22","unstructured":"Zelinsky, A., Jarvis, R.A., Byrne, J.C., Yuta, S.: Planning paths of complete coverage of an unstructured environment by a mobile robot. In: Proceedings of the 13th International Conference on Advanced Robotics (ICAR), vol. 13, pp. 533\u2013538. Citeseer (1993)"},{"issue":"3","key":"39_CR23","doi-asserted-by":"publisher","first-page":"718","DOI":"10.1109\/TIE.2004.825197","volume":"51","author":"JS Oh","year":"2004","unstructured":"Oh, J.S., Choi, Y.H., Park, J.B., Zheng, Y.F.: Complete coverage navigation of cleaning robots using triangular-cell-based map. IEEE Trans. Industr. Electron. 51(3), 718\u2013726 (2004)","journal-title":"IEEE Trans. Industr. Electron."},{"key":"39_CR24","unstructured":"Yamauchi, B.: A frontier-based approach for autonomous exploration. In: Proceedings of the 1997 IEEE International Symposium on Computational Intelligence in Robotics and Automation (CIRA), pp. 146\u2013151. IEEE, New York (1997)"},{"key":"39_CR25","doi-asserted-by":"crossref","unstructured":"Chen, X., Tucker, T.M., Kurfess, T.R., Vuduc, R.: Adaptive deep path: Efficient coverage of a known environment under various configurations. In: 2019 IEEE\/RSJ International Conference on Intelligent Robots and Systems (IROS), pp. 3549\u20133556. IEEE, New York (2019)","DOI":"10.1109\/IROS40897.2019.8967793"},{"key":"39_CR26","doi-asserted-by":"crossref","unstructured":"Piardi, L., Lima, J., Pereira, A.I., Costa, P.: Coverage path planning optimization based on Q-learning algorithm. In: AIP Conference Proceedings, vol. 2116, no. 1. AIP Publishing, Melville (2019)","DOI":"10.1063\/1.5114220"},{"key":"39_CR27","doi-asserted-by":"publisher","first-page":"225945","DOI":"10.1109\/ACCESS.2020.3045027","volume":"8","author":"PT Kyaw","year":"2020","unstructured":"Kyaw, P.T., Paing, A., Thu, T.T., Mohan, R.E., Le, A.V., Veerajagadheswar, P.: Coverage path planning for decomposition reconfigurable grid-maps using deep reinforcement learning based travelling salesman problem. IEEE Access 8, 225945\u2013225956 (2020)","journal-title":"IEEE Access"},{"key":"39_CR28","unstructured":"Jonnarth, A., Zhao, J., Felsberg, M.: Learning coverage paths in unknown environments with deep reinforcement learning. In: International Conference on Machine Learning (ICML), pp. 22491\u201322508. PMLR (2024)"},{"key":"39_CR29","unstructured":"Haarnoja, T., Zhou, A., Abbeel, P., Levine, S.: Soft actor-critic: Off-policy maximum entropy deep reinforcement learning with a stochastic actor. In: International Conference on Machine Learning (ICML), pp. 1861\u20131870. PMLR (2018)"},{"issue":"2","key":"39_CR30","doi-asserted-by":"publisher","first-page":"610","DOI":"10.1109\/LRA.2019.2891991","volume":"4","author":"F Niroui","year":"2019","unstructured":"Niroui, F., Zhang, K., Kashino, Z., Nejat, G.: Deep reinforcement learning robot for search and rescue applications: Exploration in unknown cluttered environments. IEEE Robot. Autom. Lett. 4(2), 610\u2013617 (2019)","journal-title":"IEEE Robot. Autom. Lett."},{"issue":"12","key":"39_CR31","doi-asserted-by":"publisher","first-page":"14413","DOI":"10.1109\/TVT.2020.3034800","volume":"69","author":"J Hu","year":"2020","unstructured":"Hu, J., Niu, H., Carrasco, J., Lennox, B., Arvin, F.: Voronoi-based multi-robot autonomous exploration in unknown environments via deep reinforcement learning. IEEE Trans. Vehicular Technol. 69(12), 14413\u201314423 (2020)","journal-title":"IEEE Trans. Vehicular Technol."},{"key":"39_CR32","doi-asserted-by":"crossref","unstructured":"Xu, Y., Yu, J., Tang, J., Qiu, J., Wang, J., Shen, Y., Wang, Y., Yang, H.: Explore-Bench: Data sets, metrics and evaluations for frontier-based and deep-reinforcement-learning-based autonomous exploration. In: 2022 IEEE International Conference on Robotics and Automation (ICRA), pp. 6225\u20136231. IEEE, New York (2022)","DOI":"10.1109\/ICRA46639.2022.9812344"},{"key":"39_CR33","doi-asserted-by":"crossref","unstructured":"Klamt, T., Behnke, S.: Planning hybrid driving-stepping locomotion on multiple levels of abstraction. In: 2018 IEEE International Conference on Robotics and Automation (ICRA), pp. 1695\u20131702. IEEE, New York (2018)","DOI":"10.1109\/ICRA.2018.8461054"}],"container-title":["Lecture Notes in Computer Science","Advanced Intelligent Computing Technology and Applications"],"original-title":[],"language":"en","link":[{"URL":"https:\/\/link.springer.com\/content\/pdf\/10.1007\/978-981-96-9818-9_39","content-type":"unspecified","content-version":"vor","intended-application":"similarity-checking"}],"deposited":{"date-parts":[[2025,9,7]],"date-time":"2025-09-07T14:55:50Z","timestamp":1757256950000},"score":1,"resource":{"primary":{"URL":"https:\/\/link.springer.com\/10.1007\/978-981-96-9818-9_39"}},"subtitle":[],"short-title":[],"issued":{"date-parts":[[2025]]},"ISBN":["9789819698172","9789819698189"],"references-count":33,"URL":"https:\/\/doi.org\/10.1007\/978-981-96-9818-9_39","relation":{},"ISSN":["0302-9743","1611-3349"],"issn-type":[{"type":"print","value":"0302-9743"},{"type":"electronic","value":"1611-3349"}],"subject":[],"published":{"date-parts":[[2025]]},"assertion":[{"value":"20 July 2025","order":1,"name":"first_online","label":"First Online","group":{"name":"ChapterHistory","label":"Chapter History"}},{"value":"The authors have no competing interests to declare that are relevant to the content of this article.","order":1,"name":"Ethics","group":{"name":"EthicsHeading","label":"Disclosure of Interests"}},{"value":"ICIC","order":1,"name":"conference_acronym","label":"Conference Acronym","group":{"name":"ConferenceInfo","label":"Conference Information"}},{"value":"International Conference on Intelligent Computing","order":2,"name":"conference_name","label":"Conference Name","group":{"name":"ConferenceInfo","label":"Conference Information"}},{"value":"Ningbo","order":3,"name":"conference_city","label":"Conference City","group":{"name":"ConferenceInfo","label":"Conference Information"}},{"value":"China","order":4,"name":"conference_country","label":"Conference Country","group":{"name":"ConferenceInfo","label":"Conference Information"}},{"value":"2025","order":5,"name":"conference_year","label":"Conference Year","group":{"name":"ConferenceInfo","label":"Conference Information"}},{"value":"26 July 2025","order":7,"name":"conference_start_date","label":"Conference Start Date","group":{"name":"ConferenceInfo","label":"Conference Information"}},{"value":"29 July 2025","order":8,"name":"conference_end_date","label":"Conference End Date","group":{"name":"ConferenceInfo","label":"Conference Information"}},{"value":"21","order":9,"name":"conference_number","label":"Conference Number","group":{"name":"ConferenceInfo","label":"Conference Information"}},{"value":"icic2025","order":10,"name":"conference_id","label":"Conference ID","group":{"name":"ConferenceInfo","label":"Conference Information"}},{"value":"http:\/\/www.ic-icc.cn\/icg\/","order":11,"name":"conference_url","label":"Conference URL","group":{"name":"ConferenceInfo","label":"Conference Information"}}]}}