{"status":"ok","message-type":"work","message-version":"1.0.0","message":{"indexed":{"date-parts":[[2025,12,11]],"date-time":"2025-12-11T20:57:58Z","timestamp":1765486678676,"version":"3.40.3"},"publisher-location":"Cham","reference-count":23,"publisher":"Springer International Publishing","isbn-type":[{"type":"print","value":"9783030890285"},{"type":"electronic","value":"9783030890292"}],"license":[{"start":{"date-parts":[[2021,1,1]],"date-time":"2021-01-01T00:00:00Z","timestamp":1609459200000},"content-version":"tdm","delay-in-days":0,"URL":"https:\/\/www.springer.com\/tdm"},{"start":{"date-parts":[[2021,1,1]],"date-time":"2021-01-01T00:00:00Z","timestamp":1609459200000},"content-version":"vor","delay-in-days":0,"URL":"https:\/\/www.springer.com\/tdm"}],"content-domain":{"domain":["link.springer.com"],"crossmark-restriction":false},"short-container-title":[],"published-print":{"date-parts":[[2021]]},"DOI":"10.1007\/978-3-030-89029-2_39","type":"book-chapter","created":{"date-parts":[[2021,10,11]],"date-time":"2021-10-11T05:09:24Z","timestamp":1633928964000},"page":"504-516","update-policy":"https:\/\/doi.org\/10.1007\/springer_crossmark_policy","source":"Crossref","is-referenced-by-count":2,"title":["Resilient Navigation Among Dynamic Agents with Hierarchical Reinforcement Learning"],"prefix":"10.1007","author":[{"given":"Sijia","family":"Wang","sequence":"first","affiliation":[],"role":[{"role":"author","vocabulary":"crossref"}]},{"given":"Hao","family":"Jiang","sequence":"additional","affiliation":[],"role":[{"role":"author","vocabulary":"crossref"}]},{"given":"Zhaoqi","family":"Wang","sequence":"additional","affiliation":[],"role":[{"role":"author","vocabulary":"crossref"}]}],"member":"297","published-online":{"date-parts":[[2021,10,11]]},"reference":[{"key":"39_CR1","unstructured":"Bacon, P., Harb, J., Precup, D.: The option-critic architecture. CoRR abs\/1609.05140 (2016)"},{"key":"39_CR2","doi-asserted-by":"crossref","unstructured":"Van den Berg, J., Lin, M., Manocha, D.: Reciprocal velocity obstacles for real-time multi-agent navigation. In: 2008 IEEE International Conference on Robotics and Automation, pp. 1928\u20131935. IEEE (2008)","DOI":"10.1109\/ROBOT.2008.4543489"},{"key":"39_CR3","doi-asserted-by":"crossref","unstructured":"Chen, C., Hu, S., Nikdel, P., Mori, G., Savva, M.: Relational graph learning for crowd navigation. arXiv preprint arXiv:1909.13165 (2019)","DOI":"10.1109\/IROS45743.2020.9340705"},{"key":"39_CR4","doi-asserted-by":"crossref","unstructured":"Chen, C., Liu, Y., Kreiss, S., Alahi, A.: Crowd-robot interaction: crowd-aware robot navigation with attention-based deep reinforcement learning. In: 2019 International Conference on Robotics and Automation (ICRA), pp. 6015\u20136022. IEEE (2019)","DOI":"10.1109\/ICRA.2019.8794134"},{"key":"39_CR5","doi-asserted-by":"crossref","unstructured":"Chen, Y.F., Liu, M., Everett, M., How, J.P.: Decentralized non-communicating multiagent collision avoidance with deep reinforcement learning. In: 2017 IEEE International Conference on Robotics and Automation (ICRA), pp. 285\u2013292. IEEE (2017)","DOI":"10.1109\/ICRA.2017.7989037"},{"key":"39_CR6","doi-asserted-by":"crossref","unstructured":"Fahad, M., Chen, Z., Guo, Y.: Learning how pedestrians navigate: A deep inverse reinforcement learning approach. In: 2018 IEEE\/RSJ International Conference on Intelligent Robots and Systems (IROS), pp. 819\u2013826. IEEE (2018)","DOI":"10.1109\/IROS.2018.8593438"},{"key":"39_CR7","doi-asserted-by":"crossref","unstructured":"Fan, T., Long, P., Liu, W., Pan, J., Yang, R., Manocha, D.: Learning resilient behaviors for navigation under uncertainty. In: 2020 IEEE International Conference on Robotics and Automation (ICRA), pp. 5299\u20135305. IEEE (2020)","DOI":"10.1109\/ICRA40945.2020.9196785"},{"issue":"8","key":"39_CR8","doi-asserted-by":"publisher","first-page":"1543","DOI":"10.1007\/s10514-018-9719-4","volume":"42","author":"J Godoy","year":"2018","unstructured":"Godoy, J., Chen, T., Guy, S.J., Karamouzas, I., Gini, M.: ALAN: adaptive learning for multi-agent navigation. Autonomous Robots 42(8), 1543\u20131562 (2018)","journal-title":"Autonomous Robots"},{"issue":"6803","key":"39_CR9","doi-asserted-by":"publisher","first-page":"487","DOI":"10.1038\/35035023","volume":"407","author":"D Helbing","year":"2000","unstructured":"Helbing, D., Farkas, I., Vicsek, T.: Simulating dynamical features of escape panic. Nature 407(6803), 487\u2013490 (2000)","journal-title":"Nature"},{"issue":"5","key":"39_CR10","doi-asserted-by":"publisher","first-page":"4282","DOI":"10.1103\/PhysRevE.51.4282","volume":"51","author":"D Helbing","year":"1995","unstructured":"Helbing, D., Molnar, P.: Social force model for pedestrian dynamics. Phys. Rev. E 51(5), 4282 (1995)","journal-title":"Phys. Rev. E"},{"key":"39_CR11","unstructured":"Lillicrap, T.P., et al.: Continuous control with deep reinforcement learning. arXiv preprint arXiv:1509.02971 (2015)"},{"key":"39_CR12","doi-asserted-by":"crossref","unstructured":"Liu, Y., Xu, A., Chen, Z.: Map-based deep imitation learning for obstacle avoidance. In: 2018 IEEE\/RSJ International Conference on Intelligent Robots and Systems (IROS), pp. 8644\u20138649. IEEE (2018)","DOI":"10.1109\/IROS.2018.8593683"},{"key":"39_CR13","doi-asserted-by":"crossref","unstructured":"Long, P., Fan, T., Liao, X., Liu, W., Zhang, H., Pan, J.: Towards optimally decentralized multi-robot collision avoidance via deep reinforcement learning. In: 2018 IEEE International Conference on Robotics and Automation (ICRA), pp. 6252\u20136259. IEEE (2018)","DOI":"10.1109\/ICRA.2018.8461113"},{"issue":"2","key":"39_CR14","doi-asserted-by":"publisher","first-page":"656","DOI":"10.1109\/LRA.2017.2651371","volume":"2","author":"P Long","year":"2017","unstructured":"Long, P., Liu, W., Pan, J.: Deep-learned collision avoidance policy for distributed multiagent navigation. IEEE Robot. Autom. Lett. 2(2), 656\u2013663 (2017)","journal-title":"IEEE Robot. Autom. Lett."},{"key":"39_CR15","unstructured":"Mnih, V., et al.: Playing Atari with deep reinforcement learning. arXiv preprint arXiv:1312.5602 (2013)"},{"issue":"4","key":"39_CR16","doi-asserted-by":"publisher","first-page":"1","DOI":"10.1145\/3450626.3459670","volume":"37","author":"XB Peng","year":"2018","unstructured":"Peng, X.B., Abbeel, P., Levine, S., van de Panne, M.: DeepMimic: example-guided deep reinforcement learning of physics-based character skills. ACM Trans. Graph. (TOG) 37(4), 1\u201314 (2018)","journal-title":"ACM Trans. Graph. (TOG)"},{"issue":"4","key":"39_CR17","doi-asserted-by":"publisher","first-page":"4423","DOI":"10.1109\/LRA.2018.2869644","volume":"3","author":"M Pfeiffer","year":"2018","unstructured":"Pfeiffer, M., et al.: Reinforced imitation: sample efficient deep reinforcement learning for mapless navigation by leveraging prior demonstrations. IEEE Robot. Autom. Lett. 3(4), 4423\u20134430 (2018)","journal-title":"IEEE Robot. Autom. Lett."},{"key":"39_CR18","doi-asserted-by":"crossref","unstructured":"Reynolds, C.W.: Flocks, herds and schools: a distributed behavioral model. In: Proceedings of the 14th Annual Conference on Computer Graphics and Interactive Techniques, pp. 25\u201334 (1987)","DOI":"10.1145\/37402.37406"},{"key":"39_CR19","unstructured":"Schulman, J., Wolski, F., Dhariwal, P., Radford, A., Klimov, O.: Proximal policy optimization algorithms. arXiv preprint arXiv:1707.06347 (2017)"},{"key":"39_CR20","doi-asserted-by":"crossref","unstructured":"Tai, L., Zhang, J., Liu, M., Burgard, W.: Socially compliant navigation through raw depth inputs with generative adversarial imitation learning. In: 2018 IEEE International Conference on Robotics and Automation (ICRA), pp. 1111\u20131117. IEEE (2018)","DOI":"10.1109\/ICRA.2018.8460968"},{"key":"39_CR21","doi-asserted-by":"publisher","unstructured":"Van Den Berg, J., Guy, S.J., Lin, M., Manocha, D.: Reciprocal n-body collision avoidance. In: Robotics Research, pp. 3\u201319. Springer (2011). https:\/\/doi.org\/10.1007\/978-3-642-19457-3_1","DOI":"10.1007\/978-3-642-19457-3_1"},{"key":"39_CR22","unstructured":"Vezhnevets, A.S., et al.: Feudal networks for hierarchical reinforcement learning. In: International Conference on Machine Learning, pp. 3540\u20133549. PMLR (2017)"},{"key":"39_CR23","unstructured":"Zhang, C., Lesser, V.: Coordinating multi-agent reinforcement learning with limited communication. In: Proceedings of the 2013 International Conference on Autonomous Agents and Multi-Agent Systems, pp. 1101\u20131108 (2013)"}],"container-title":["Lecture Notes in Computer Science","Advances in Computer Graphics"],"original-title":[],"language":"en","link":[{"URL":"https:\/\/link.springer.com\/content\/pdf\/10.1007\/978-3-030-89029-2_39","content-type":"unspecified","content-version":"vor","intended-application":"similarity-checking"}],"deposited":{"date-parts":[[2021,10,11]],"date-time":"2021-10-11T05:53:44Z","timestamp":1633931624000},"score":1,"resource":{"primary":{"URL":"https:\/\/link.springer.com\/10.1007\/978-3-030-89029-2_39"}},"subtitle":[],"short-title":[],"issued":{"date-parts":[[2021]]},"ISBN":["9783030890285","9783030890292"],"references-count":23,"URL":"https:\/\/doi.org\/10.1007\/978-3-030-89029-2_39","relation":{},"ISSN":["0302-9743","1611-3349"],"issn-type":[{"type":"print","value":"0302-9743"},{"type":"electronic","value":"1611-3349"}],"subject":[],"published":{"date-parts":[[2021]]},"assertion":[{"value":"11 October 2021","order":1,"name":"first_online","label":"First Online","group":{"name":"ChapterHistory","label":"Chapter History"}},{"value":"CGI","order":1,"name":"conference_acronym","label":"Conference Acronym","group":{"name":"ConferenceInfo","label":"Conference Information"}},{"value":"Computer Graphics International Conference","order":2,"name":"conference_name","label":"Conference Name","group":{"name":"ConferenceInfo","label":"Conference Information"}},{"value":"2021","order":5,"name":"conference_year","label":"Conference Year","group":{"name":"ConferenceInfo","label":"Conference Information"}},{"value":"6 September 2021","order":7,"name":"conference_start_date","label":"Conference Start Date","group":{"name":"ConferenceInfo","label":"Conference Information"}},{"value":"10 September 2021","order":8,"name":"conference_end_date","label":"Conference End Date","group":{"name":"ConferenceInfo","label":"Conference Information"}},{"value":"38","order":9,"name":"conference_number","label":"Conference Number","group":{"name":"ConferenceInfo","label":"Conference Information"}},{"value":"cgi2021","order":10,"name":"conference_id","label":"Conference ID","group":{"name":"ConferenceInfo","label":"Conference Information"}},{"value":"http:\/\/www.cgs-network.org\/cgi21\/","order":11,"name":"conference_url","label":"Conference URL","group":{"name":"ConferenceInfo","label":"Conference Information"}},{"value":"Double-blind","order":1,"name":"type","label":"Type","group":{"name":"ConfEventPeerReviewInformation","label":"Peer Review Information (provided by the conference organizers)"}},{"value":"EasyChair","order":2,"name":"conference_management_system","label":"Conference Management System","group":{"name":"ConfEventPeerReviewInformation","label":"Peer Review Information (provided by the conference organizers)"}},{"value":"131","order":3,"name":"number_of_submissions_sent_for_review","label":"Number of Submissions Sent for Review","group":{"name":"ConfEventPeerReviewInformation","label":"Peer Review Information (provided by the conference organizers)"}},{"value":"44","order":4,"name":"number_of_full_papers_accepted","label":"Number of Full Papers Accepted","group":{"name":"ConfEventPeerReviewInformation","label":"Peer Review Information (provided by the conference organizers)"}},{"value":"9","order":5,"name":"number_of_short_papers_accepted","label":"Number of Short Papers Accepted","group":{"name":"ConfEventPeerReviewInformation","label":"Peer Review Information (provided by the conference organizers)"}},{"value":"34% - The value is computed by the equation \"Number of Full Papers Accepted \/ Number of Submissions Sent for Review * 100\" and then rounded to a whole number.","order":6,"name":"acceptance_rate_of_full_papers","label":"Acceptance Rate of Full Papers","group":{"name":"ConfEventPeerReviewInformation","label":"Peer Review Information (provided by the conference organizers)"}},{"value":"3","order":7,"name":"average_number_of_reviews_per_paper","label":"Average Number of Reviews per Paper","group":{"name":"ConfEventPeerReviewInformation","label":"Peer Review Information (provided by the conference organizers)"}},{"value":"3","order":8,"name":"average_number_of_papers_per_reviewer","label":"Average Number of Papers per Reviewer","group":{"name":"ConfEventPeerReviewInformation","label":"Peer Review Information (provided by the conference organizers)"}},{"value":"Yes","order":9,"name":"external_reviewers_involved","label":"External Reviewers Involved","group":{"name":"ConfEventPeerReviewInformation","label":"Peer Review Information (provided by the conference organizers)"}}]}}