{"status":"ok","message-type":"work","message-version":"1.0.0","message":{"indexed":{"date-parts":[[2026,6,16]],"date-time":"2026-06-16T14:49:43Z","timestamp":1781621383258,"version":"3.54.5"},"reference-count":46,"publisher":"Informa UK Limited","issue":"8","funder":[{"DOI":"10.13039\/501100003472","name":"Harbin Institute of Technology","doi-asserted-by":"publisher","id":[{"id":"10.13039\/501100003472","id-type":"DOI","asserted-by":"publisher"}]},{"DOI":"10.13039\/501100001809","name":"National Natural Science Foundation of China","doi-asserted-by":"publisher","award":["62188101, 62303135"],"award-info":[{"award-number":["62188101, 62303135"]}],"id":[{"id":"10.13039\/501100001809","id-type":"DOI","asserted-by":"publisher"}]},{"DOI":"10.13039\/501100001809","name":"National Natural Science Foundation of China","doi-asserted-by":"publisher","award":["62320106001"],"award-info":[{"award-number":["62320106001"]}],"id":[{"id":"10.13039\/501100001809","id-type":"DOI","asserted-by":"publisher"}]}],"content-domain":{"domain":["www.tandfonline.com"],"crossmark-restriction":true},"short-container-title":["International Journal of Systems Science"],"published-print":{"date-parts":[[2026,6,11]]},"DOI":"10.1080\/00207721.2025.2558132","type":"journal-article","created":{"date-parts":[[2025,10,14]],"date-time":"2025-10-14T01:30:35Z","timestamp":1760405435000},"page":"2360-2375","update-policy":"https:\/\/doi.org\/10.1080\/tandf_crossmark_01","source":"Crossref","is-referenced-by-count":1,"title":["An improved Q-learning algorithm for search and rescue UGV path planning in unknown environments"],"prefix":"10.1080","volume":"57","author":[{"given":"Shanfan","family":"Zhang","sequence":"first","affiliation":[{"name":"Harbin Institute of Technology","place":["Harbin, People's Republic of China"]}],"role":[{"vocabulary":"crossref","role":"author"}]},{"given":"Qingshuang","family":"Zeng","sequence":"additional","affiliation":[{"name":"Harbin Institute of Technology","place":["Harbin, People's Republic of China"]}],"role":[{"vocabulary":"crossref","role":"author"}]},{"given":"Yi","family":"Zeng","sequence":"additional","affiliation":[{"name":"Harbin Institute of Technology","place":["Harbin, People's Republic of China"]}],"role":[{"vocabulary":"crossref","role":"author"}]}],"member":"301","published-online":{"date-parts":[[2025,10,13]]},"reference":[{"key":"e_1_3_5_2_1","doi-asserted-by":"publisher","DOI":"10.1109\/TRO.2018.2838556"},{"key":"e_1_3_5_3_1","doi-asserted-by":"publisher","DOI":"10.1108\/GS-11-2019-0050"},{"key":"e_1_3_5_4_1","doi-asserted-by":"publisher","DOI":"10.1109\/OJCOMS.2021.3081996"},{"key":"e_1_3_5_5_1","doi-asserted-by":"publisher","DOI":"10.1109\/LRA.2024.3379804"},{"key":"e_1_3_5_6_1","doi-asserted-by":"publisher","DOI":"10.1007\/s11633-024-1512-6"},{"key":"e_1_3_5_7_1","doi-asserted-by":"publisher","DOI":"10.1016\/jproeng.2014.12.098"},{"key":"e_1_3_5_8_1","doi-asserted-by":"publisher","DOI":"10.1016\/j.eswa.2024.123978"},{"key":"e_1_3_5_9_1","doi-asserted-by":"publisher","DOI":"10.1108\/GS-10-2015-0073"},{"key":"e_1_3_5_10_1","doi-asserted-by":"publisher","DOI":"10.1016\/j.oceaneng.2023.113632"},{"key":"e_1_3_5_11_1","doi-asserted-by":"publisher","DOI":"10.1109\/CCDC.2015.7161932"},{"key":"e_1_3_5_12_1","doi-asserted-by":"publisher","DOI":"10.1016\/j.eswa.2021.114898"},{"key":"e_1_3_5_13_1","doi-asserted-by":"publisher","DOI":"10.1109\/TASE.2021.3062810"},{"issue":"2","key":"e_1_3_5_14_1","first-page":"112","article-title":"A novel grey decision making model and its numerical simulation","volume":"29","author":"Jie C.","year":"2012","unstructured":"Jie, C., Sifeng, L., & Naiming, X. (2012). A novel grey decision making model and its numerical simulation. Transactions of Nanjing University of Aeronautics and Astronautics, 29(2), 112\u2013117.","journal-title":"Transactions of Nanjing University of Aeronautics and Astronautics"},{"key":"e_1_3_5_15_1","unstructured":"Jonnarth A. Zhao J. & Felsberg M. (2023). End-to-end reinforcement learning for online coverage path planning in unknown environments. ArXiv abs\/2306.16978."},{"key":"e_1_3_5_16_1","unstructured":"Jonnarth A. Zhao J. & Felsberg M. (2024). Learning coverage paths in unknown environments with deep reinforcement learning. In Proceedings of the 41st International Conference on Machine Learning (ICML'24). 903. https:\/\/openreview.net\/forum?id=nCZYRBK1J4."},{"key":"e_1_3_5_17_1","doi-asserted-by":"publisher","DOI":"10.1016\/S0167-6911(82)80025-X"},{"key":"e_1_3_5_18_1","doi-asserted-by":"publisher","DOI":"10.1109\/TSMCA.2012.2227719"},{"key":"e_1_3_5_19_1","doi-asserted-by":"publisher","DOI":"10.1016\/j.cie.2007.12.002"},{"key":"e_1_3_5_20_1","doi-asserted-by":"publisher","DOI":"10.1109\/GSIS.2015.7301887"},{"key":"e_1_3_5_21_1","doi-asserted-by":"publisher","DOI":"10.1109\/ICMA.2014.6885732"},{"key":"e_1_3_5_22_1","doi-asserted-by":"publisher","DOI":"10.1109\/CHICC.2006.4346989"},{"issue":"2","key":"e_1_3_5_23_1","first-page":"178","article-title":"The three axioms of buffer operator and their application","volume":"1","author":"Liu S.","year":"1991","unstructured":"Liu, S. (1991). The three axioms of buffer operator and their application. The Journal of Grey System, 1(2), 178\u2013185.","journal-title":"The Journal of Grey System"},{"key":"e_1_3_5_24_1","doi-asserted-by":"publisher","DOI":"10.1109\/CCDC58219.2023.10326951"},{"key":"e_1_3_5_25_1","doi-asserted-by":"publisher","DOI":"10.1109\/GSIS.2015.7301810"},{"issue":"1","key":"e_1_3_5_26_1","first-page":"1","article-title":"On uniform effect measure functions and a weighted multi-attribute grey target decision model","volume":"25","author":"Liu S.","year":"2013","unstructured":"Liu, S., Xu, B., Forrest, J., Chen, Y., & Yang, Y. (2013). On uniform effect measure functions and a weighted multi-attribute grey target decision model. Journal of Grey System, 25(1), 1\u201311.","journal-title":"Journal of Grey System"},{"issue":"8","key":"e_1_3_5_27_1","first-page":"1159","article-title":"Multi-attribute intelligent grey target decision model","volume":"25","author":"Liu S.","year":"2010","unstructured":"Liu, S., Yuan, W., & Sheng, K. (2010). Multi-attribute intelligent grey target decision model. Control and Decision, 25(8), 1159\u20131163.","journal-title":"Control and Decision"},{"key":"e_1_3_5_28_1","doi-asserted-by":"publisher","DOI":"10.1109\/LRA.2024.3379840"},{"key":"e_1_3_5_29_1","doi-asserted-by":"publisher","DOI":"10.3390\/rs15133266"},{"key":"e_1_3_5_30_1","doi-asserted-by":"publisher","DOI":"10.1177\/0278364918772024"},{"key":"e_1_3_5_31_1","doi-asserted-by":"publisher","DOI":"10.4108\/airo.v2i1.3056"},{"key":"e_1_3_5_32_1","doi-asserted-by":"publisher","DOI":"10.64820\/AEPJRR.11.7.14.122024"},{"issue":"1","key":"e_1_3_5_33_1","first-page":"93","article-title":"Discrete GM(1,1) and mechanism of grey forecasting model","volume":"25","author":"Naiming X.","year":"2005","unstructured":"Naiming, X., & Sifeng, L. (2005). Discrete GM(1,1) and mechanism of grey forecasting model. System Engineering Theory and Practice, 25(1), 93\u201399.","journal-title":"System Engineering Theory and Practice"},{"key":"e_1_3_5_34_1","doi-asserted-by":"publisher","DOI":"10.1109\/LRA.2019.2903261"},{"key":"e_1_3_5_35_1","doi-asserted-by":"publisher","DOI":"10.1016\/j.aei.2025.103124"},{"key":"e_1_3_5_36_1","doi-asserted-by":"publisher","DOI":"10.1109\/JSYST.2020.3027585"},{"key":"e_1_3_5_37_1","doi-asserted-by":"publisher","DOI":"10.1109\/ICECTT.2015.65"},{"key":"e_1_3_5_38_1","doi-asserted-by":"publisher","DOI":"10.1109\/LRA.2024.3382530"},{"key":"e_1_3_5_39_1","doi-asserted-by":"publisher","DOI":"10.1108\/GS-04-2017-0010"},{"key":"e_1_3_5_40_1","doi-asserted-by":"publisher","DOI":"10.1108\/20439371111163783"},{"key":"e_1_3_5_41_1","doi-asserted-by":"publisher","DOI":"10.1109\/TITS.2020.3031962"},{"key":"e_1_3_5_42_1","doi-asserted-by":"publisher","DOI":"10.1016\/j.cnsns.2012.11.017"},{"key":"e_1_3_5_43_1","doi-asserted-by":"publisher","DOI":"10.3390\/s21041076"},{"key":"e_1_3_5_44_1","doi-asserted-by":"publisher","DOI":"10.1108\/GS-10-2016-0040"},{"key":"e_1_3_5_45_1","doi-asserted-by":"publisher","DOI":"10.1109\/ICCECE58074.2023.10135199"},{"key":"e_1_3_5_46_1","doi-asserted-by":"publisher","DOI":"10.3390\/app14199127"},{"key":"e_1_3_5_47_1","doi-asserted-by":"publisher","DOI":"10.1007\/s40430-023-04570-7"}],"container-title":["International Journal of Systems Science"],"original-title":[],"language":"en","link":[{"URL":"https:\/\/www.tandfonline.com\/doi\/pdf\/10.1080\/00207721.2025.2558132","content-type":"unspecified","content-version":"vor","intended-application":"similarity-checking"}],"deposited":{"date-parts":[[2026,5,18]],"date-time":"2026-05-18T15:19:51Z","timestamp":1779117591000},"score":1,"resource":{"primary":{"URL":"https:\/\/www.tandfonline.com\/doi\/full\/10.1080\/00207721.2025.2558132"}},"subtitle":[],"short-title":[],"issued":{"date-parts":[[2025,10,13]]},"references-count":46,"journal-issue":{"issue":"8","published-print":{"date-parts":[[2026,6,11]]}},"alternative-id":["10.1080\/00207721.2025.2558132"],"URL":"https:\/\/doi.org\/10.1080\/00207721.2025.2558132","relation":{},"ISSN":["0020-7721","1464-5319"],"issn-type":[{"value":"0020-7721","type":"print"},{"value":"1464-5319","type":"electronic"}],"subject":[],"published":{"date-parts":[[2025,10,13]]},"assertion":[{"value":"The publishing and review policy for this title is described in its Aims & Scope.","order":1,"name":"peerreview_statement","label":"Peer Review Statement"},{"value":"http:\/\/www.tandfonline.com\/action\/journalInformation?show=aimsScope&journalCode=tsys20","URL":"http:\/\/www.tandfonline.com\/action\/journalInformation?show=aimsScope&journalCode=tsys20","order":2,"name":"aims_and_scope_url","label":"Aim & Scope"},{"value":"2025-04-15","order":0,"name":"received","label":"Received","group":{"name":"publication_history","label":"Publication History"}},{"value":"2025-08-30","order":2,"name":"accepted","label":"Accepted","group":{"name":"publication_history","label":"Publication History"}},{"value":"2025-10-13","order":3,"name":"published","label":"Published","group":{"name":"publication_history","label":"Publication History"}}]}}