{"status":"ok","message-type":"work","message-version":"1.0.0","message":{"indexed":{"date-parts":[[2026,1,27]],"date-time":"2026-01-27T23:28:41Z","timestamp":1769556521456,"version":"3.49.0"},"publisher-location":"Cham","reference-count":21,"publisher":"Springer International Publishing","isbn-type":[{"value":"9783319938172","type":"print"},{"value":"9783319938189","type":"electronic"}],"license":[{"start":{"date-parts":[[2018,1,1]],"date-time":"2018-01-01T00:00:00Z","timestamp":1514764800000},"content-version":"tdm","delay-in-days":0,"URL":"http:\/\/www.springer.com\/tdm"}],"content-domain":{"domain":["link.springer.com"],"crossmark-restriction":false},"short-container-title":[],"published-print":{"date-parts":[[2018]]},"DOI":"10.1007\/978-3-319-93818-9_10","type":"book-chapter","created":{"date-parts":[[2018,6,15]],"date-time":"2018-06-15T18:47:06Z","timestamp":1529088426000},"page":"102-111","update-policy":"https:\/\/doi.org\/10.1007\/springer_crossmark_policy","source":"Crossref","is-referenced-by-count":27,"title":["Deep-Sarsa Based Multi-UAV Path Planning and Obstacle Avoidance in a Dynamic Environment"],"prefix":"10.1007","author":[{"given":"Wei","family":"Luo","sequence":"first","affiliation":[],"role":[{"role":"author","vocabulary":"crossref"}]},{"given":"Qirong","family":"Tang","sequence":"additional","affiliation":[],"role":[{"role":"author","vocabulary":"crossref"}]},{"given":"Changhong","family":"Fu","sequence":"additional","affiliation":[],"role":[{"role":"author","vocabulary":"crossref"}]},{"given":"Peter","family":"Eberhard","sequence":"additional","affiliation":[],"role":[{"role":"author","vocabulary":"crossref"}]}],"member":"297","published-online":{"date-parts":[[2018,6,16]]},"reference":[{"key":"10_CR1","doi-asserted-by":"crossref","unstructured":"Gan, S.K., Sukkarieh, S.: Multi-UAV target search using explicit decentralized gradient-based negotiation. In: IEEE International Conference on Robotics and Automation (ICRA), Shanghai, China, pp. 751\u2013756 (2011)","DOI":"10.1109\/ICRA.2011.5979704"},{"key":"10_CR2","doi-asserted-by":"crossref","unstructured":"Fu, C., Carrio, A., Campoy, P.: Efficient visual odometry and mapping for unmanned aerial vehicle using ARM-based stereo vision pre-processing system. In: International Conference on Unmanned Aircraft Systems (ICUAS), Colorado, USA, pp. 957\u2013962 (2015)","DOI":"10.1109\/ICUAS.2015.7152384"},{"issue":"1","key":"10_CR3","first-page":"417","volume":"57","author":"I Maza","year":"2009","unstructured":"Maza, I., Kondak, K., Bernard, M., Ollero, A.: Multi-UAV cooperation and control for load transportation and deployment. J. Intell. Robot. Syst. 57(1), 417\u2013449 (2009)","journal-title":"J. Intell. Robot. Syst."},{"key":"10_CR4","doi-asserted-by":"crossref","unstructured":"Fu, C., Carrio, A., Olivares-Mendez, M.A., Suarez-Fernandez, R., Campoy, P.: Robust real-time vision-based aircraft tracking from unmanned aerial vehicles. In: IEEE International Conference on Robotics and Automation (ICRA) (2014)","DOI":"10.1109\/ICRA.2014.6907659"},{"key":"10_CR5","doi-asserted-by":"crossref","unstructured":"Hayat, S., Yanmaz, E., Brown, T.X., Bettstetter, C.: Multi-objective UAV path planning for search and rescue. In: IEEE International Conference on Robotics and Automation (ICRA), Singapore, pp. 5569\u20135574 (2017)","DOI":"10.1109\/ICRA.2017.7989656"},{"issue":"3","key":"10_CR6","doi-asserted-by":"publisher","first-page":"257","DOI":"10.1007\/s10700-008-9035-0","volume":"7","author":"BM Sathyaraj","year":"2008","unstructured":"Sathyaraj, B.M., Jain, L.C., Finn, A., Drake, S.: Multiple UAVs path planning algorithms: a comparative study. Fuzzy Optim. Decis. Mak. 7(3), 257\u2013267 (2008)","journal-title":"Fuzzy Optim. Decis. Mak."},{"key":"10_CR7","doi-asserted-by":"crossref","unstructured":"Hrabar, S.: 3D path planning and stereo-based obstacle avoidance for rotorcraft UAVs. In: IEEE\/RSJ International Conference on Intelligent Robots and Systems, Nice, France, pp. 807\u2013814 (2008)","DOI":"10.1109\/IROS.2008.4650775"},{"key":"10_CR8","doi-asserted-by":"crossref","unstructured":"Bounini, F., Gingras, D., Pollart, H., Gruyer, D.: Modified artificial potential field method for online path planning applications. In: IEEE Intelligent Vehicles Symposium (IV), Los Angeles, USA, pp. 180\u2013185 (2017)","DOI":"10.1109\/IVS.2017.7995717"},{"issue":"12","key":"10_CR9","doi-asserted-by":"publisher","first-page":"1258","DOI":"10.1016\/j.robot.2013.09.004","volume":"61","author":"E Galceran","year":"2013","unstructured":"Galceran, E., Carreras, M.: A survey on coverage path planning for robotics. Robot. Auton. Syst. 61(12), 1258\u20131276 (2013)","journal-title":"Robot. Auton. Syst."},{"key":"10_CR10","doi-asserted-by":"crossref","unstructured":"Zhao, Y., Zheng, Z., Zhang, X., Liu, Y.: Q learning algorithm based UAV path learning and obstacle avoidence approach. In: 36th Chinese Control Conference (CCC), Dalian, China, pp. 3397\u20133402 (2017)","DOI":"10.23919\/ChiCC.2017.8027884"},{"key":"10_CR11","doi-asserted-by":"crossref","unstructured":"Imanberdiyev, N., Fu, C., Kayacan, E., Chen, I.-M.: Autonomous navigation of UAV by using real-time model-based reinforcement learning. In: 14th International Conference on Control, Automation, Robotics and Vision, Phuket, Thailand, pp. 1\u20136 (2016)","DOI":"10.1109\/ICARCV.2016.7838739"},{"key":"10_CR12","doi-asserted-by":"publisher","first-page":"331","DOI":"10.1007\/978-3-319-63913-0_17","volume-title":"An Introduction to Machine Learning","author":"Miroslav Kubat","year":"2017","unstructured":"Kubat, M.: Reinforcement learning. In: An Introduction to Machine Learning, pp. 331\u2013339 (2017)"},{"key":"10_CR13","doi-asserted-by":"crossref","unstructured":"Zhao, D., Wang, H., Shao, K., Zhu, Y.: Deep reinforcement learning with experience replay based on SARSA. In: IEEE Symposium Series on Computational Intelligence (SSCI) (2016)","DOI":"10.1109\/SSCI.2016.7849837"},{"key":"10_CR14","unstructured":"Quigley, M., Conley, K., Gerkey, B., Faust, J., Foote, T., Leibs, J., Wheeler, R., Ng, A.Y.: ROS: an open-source robot operating system. In: ICRA Workshop on Open Source Software, Kobe, Japan, pp. 1\u20136 (2009)"},{"key":"10_CR15","doi-asserted-by":"crossref","unstructured":"Koenig, N., Howard, A.: Design and use paradigms for Gazebo, an open-source multi-robot simulator. In: IEEE\/RSJ International Conference on Intelligent Robots and Systems, Sendai, Japan, vol. 3, pp. 2149\u20132154 (2004)","DOI":"10.1109\/IROS.2004.1389727"},{"issue":"11","key":"10_CR16","doi-asserted-by":"publisher","first-page":"1238","DOI":"10.1177\/0278364913495721","volume":"32","author":"J Kober","year":"2013","unstructured":"Kober, J., Bagnell, J.A., Peters, J.: Reinforcement learning in robotics: a survey. Int. J. Robot. Res. 32(11), 1238\u20131274 (2013)","journal-title":"Int. J. Robot. Res."},{"issue":"3","key":"10_CR17","doi-asserted-by":"publisher","first-page":"287","DOI":"10.1007\/978-981-10-7515-5_11","volume":"38","author":"S Singh","year":"2000","unstructured":"Singh, S., Jaakkola, T., Littman, M.L., Szepesv\u00e1ri, C.: Convergence results for single-step on-policy reinforcement-learning algorithms. Mach. Learn. 38(3), 287\u2013308 (2000). https:\/\/doi.org\/10.1007\/978-981-10-7515-5_11","journal-title":"Mach. Learn."},{"key":"10_CR18","unstructured":"Sutton, R.S.: Generalization in reinforcement learning: successful examples using sparse coarse coding. In: Touretzky, D.S., Mozer, M.C., Hasselmo, M.E. (eds.) Advances in Neural Information Processing Systems, pp. 1038\u20131044. MIT Press (1996)"},{"issue":"7540","key":"10_CR19","doi-asserted-by":"publisher","first-page":"529","DOI":"10.1038\/nature14236","volume":"518","author":"V Mnih","year":"2015","unstructured":"Mnih, V., Kavukcuoglu, K., Silver, D., Rusu, A.A., Veness, J., Bellemare, M.G., Graves, A., Riedmiller, M., Fidjeland, A.K., Ostrovski, G., Petersen, S., Beattie, C., Sadik, A., Antonoglou, I., King, H., Kumaran, D., Wierstra, D., Legg, S., Hassabis, D.: Human-level control through deep reinforcement learning. Nature 518(7540), 529\u2013533 (2015)","journal-title":"Nature"},{"key":"10_CR20","doi-asserted-by":"publisher","first-page":"97","DOI":"10.1007\/978-1-4842-2766-4_7","volume-title":"Deep Learning with Python","author":"Nikhil Ketkar","year":"2017","unstructured":"Ketkar, N.: Introduction to keras. In: Deep Learning with Python, pp. 97\u2013111 (2017)"},{"key":"10_CR21","doi-asserted-by":"crossref","unstructured":"Huang, A.S., Olson, E., Moore, D.C.: LCM: lightweight communications and marshalling. In: IEEE\/RSJ International Conference on Intelligent Robots and Systems, Taipei, Taiwan, pp. 4057\u20134062 (2010)","DOI":"10.1109\/IROS.2010.5649358"}],"container-title":["Lecture Notes in Computer Science","Advances in Swarm Intelligence"],"original-title":[],"language":"en","link":[{"URL":"http:\/\/link.springer.com\/content\/pdf\/10.1007\/978-3-319-93818-9_10","content-type":"unspecified","content-version":"vor","intended-application":"similarity-checking"}],"deposited":{"date-parts":[[2025,7,5]],"date-time":"2025-07-05T04:30:33Z","timestamp":1751689833000},"score":1,"resource":{"primary":{"URL":"http:\/\/link.springer.com\/10.1007\/978-3-319-93818-9_10"}},"subtitle":[],"short-title":[],"issued":{"date-parts":[[2018]]},"ISBN":["9783319938172","9783319938189"],"references-count":21,"URL":"https:\/\/doi.org\/10.1007\/978-3-319-93818-9_10","relation":{},"ISSN":["0302-9743","1611-3349"],"issn-type":[{"value":"0302-9743","type":"print"},{"value":"1611-3349","type":"electronic"}],"subject":[],"published":{"date-parts":[[2018]]},"assertion":[{"value":"16 June 2018","order":1,"name":"first_online","label":"First Online","group":{"name":"ChapterHistory","label":"Chapter History"}}]}}