{"status":"ok","message-type":"work","message-version":"1.0.0","message":{"indexed":{"date-parts":[[2025,3,27]],"date-time":"2025-03-27T05:33:29Z","timestamp":1743053609687,"version":"3.40.3"},"publisher-location":"Singapore","reference-count":29,"publisher":"Springer Nature Singapore","isbn-type":[{"type":"print","value":"9789819607884"},{"type":"electronic","value":"9789819607891"}],"license":[{"start":{"date-parts":[[2025,1,1]],"date-time":"2025-01-01T00:00:00Z","timestamp":1735689600000},"content-version":"tdm","delay-in-days":0,"URL":"https:\/\/www.springernature.com\/gp\/researchers\/text-and-data-mining"},{"start":{"date-parts":[[2025,1,1]],"date-time":"2025-01-01T00:00:00Z","timestamp":1735689600000},"content-version":"vor","delay-in-days":0,"URL":"https:\/\/www.springernature.com\/gp\/researchers\/text-and-data-mining"}],"content-domain":{"domain":["link.springer.com"],"crossmark-restriction":false},"short-container-title":[],"published-print":{"date-parts":[[2025]]},"DOI":"10.1007\/978-981-96-0789-1_28","type":"book-chapter","created":{"date-parts":[[2025,1,23]],"date-time":"2025-01-23T19:26:14Z","timestamp":1737660374000},"page":"381-396","update-policy":"https:\/\/doi.org\/10.1007\/springer_crossmark_policy","source":"Crossref","is-referenced-by-count":0,"title":["Free-Form Instruction Guided Robotic Navigation Path Planning with Large Vision-Language Model"],"prefix":"10.1007","author":[{"given":"Yuhao","family":"Du","sequence":"first","affiliation":[]},{"given":"Chengzhong","family":"Wu","sequence":"additional","affiliation":[]},{"given":"Mingtao","family":"Feng","sequence":"additional","affiliation":[]},{"given":"Jianqiao","family":"Luo","sequence":"additional","affiliation":[]},{"given":"Hang","family":"Zhong","sequence":"additional","affiliation":[]},{"given":"Zhiqiang","family":"Miao","sequence":"additional","affiliation":[]},{"given":"Yaonan","family":"Wang","sequence":"additional","affiliation":[]}],"member":"297","published-online":{"date-parts":[[2025,1,24]]},"reference":[{"key":"28_CR1","doi-asserted-by":"publisher","unstructured":"Li, Y.: Constructing the intelligent expressway traffic monitoring system using the internet of things and inspection robot. J. Supercomput. 80, 8742\u20138766 (2024). https:\/\/doi.org\/10.1007\/s11227-023-05794-z","DOI":"10.1007\/s11227-023-05794-z"},{"key":"28_CR2","doi-asserted-by":"crossref","unstructured":"Fan, C., Zhu, Z., Chen, W., Qin, K., Huang, H., Huang, Z.: Navigation of substation inspection robot based on machine vision. In: ICSETPSD 2023: Proceedings of the First International Conference on Science, Engineering and Technology Practices for Sustainable Development, ICSETPSD 2023, 17th-18th November 2023, Coimbatore, Tamilnadu, India (p. 251). European Alliance for Innovation (2024)","DOI":"10.4108\/eai.17-11-2023.2342732"},{"key":"28_CR3","doi-asserted-by":"crossref","unstructured":"Wang, W., Hao, L., Chen, J.: Design and implementation of multi-function logistics robots for intelligent warehousing. In: Intelligent Equipment and Special Robots, pp. 20\u201329. IOS Press (2024)","DOI":"10.3233\/ATDE240218"},{"key":"28_CR4","doi-asserted-by":"publisher","unstructured":"Gul, F., Rahiman, W., Nazli Alhady, S.S., Chen, K.: A comprehensive study for robot navigation techniques. Cogent Eng. 6(1) (2019). Retrieved from https:\/\/doi.org\/10.1080\/23311916.2019.1632046","DOI":"10.1080\/23311916.2019.1632046"},{"key":"28_CR5","doi-asserted-by":"crossref","unstructured":"Gharbi, A.: Bi-directional adaptive enhanced A* algorithm for mobile robot navigation. Appl. Comput. Inform. (2024)","DOI":"10.1108\/ACI-12-2023-0195"},{"key":"28_CR6","doi-asserted-by":"publisher","unstructured":"Sleaman, W.K., Hameed, A.A., Jamil, A.: Monocular vision with deep neural networks for autonomous mobile robots navigation. Optik, 272, 170162 (2023). https:\/\/doi.org\/10.1016\/j.ijleo.2022.170162","DOI":"10.1016\/j.ijleo.2022.170162"},{"key":"28_CR7","doi-asserted-by":"publisher","first-page":"4205","DOI":"10.1109\/TPAMI.2020.2972281","volume":"43","author":"XE Wang","year":"2020","unstructured":"Wang, X.E., Huang, Q., Celikyilmaz, A., Gao, J., Shen, D., Zhang, L.: Vision-language navigation policy learning and adaptation. IEEE Trans. Pattern Anal. Mach. Intell. 43, 4205\u20134216 (2020)","journal-title":"IEEE Trans. Pattern Anal. Mach. Intell."},{"key":"28_CR8","doi-asserted-by":"crossref","unstructured":"Huang, C., Mees, O., Zeng, A., Burgard, W.: Visual language maps for robot navigation (2023). Retrieved from https:\/\/arxiv.org\/abs\/2210.05714","DOI":"10.1109\/ICRA48891.2023.10160969"},{"key":"28_CR9","unstructured":"Shah, D., Osinski, B., Ichter, B., Levine, S.: LM-Nav: Robotic Navigation with Large Pre-Trained Models of Language, Vision, and Action (2022). https:\/\/arxiv.org\/abs\/2207.04429"},{"key":"28_CR10","doi-asserted-by":"crossref","unstructured":"Tellex, S., et al.: Understanding natural language commands for robotic navigation and mobile manipulation. In: AAAI Conference on Artificial Intelligence (2011)","DOI":"10.1609\/aaai.v25i1.7979"},{"key":"28_CR11","doi-asserted-by":"crossref","unstructured":"Chen, C., Han, D., Chang, C.C.: MPCCT: Multimodal vision-language learning paradigm with context-based compact Transformer. Pattern Recogn. 147, 110084 (2023)","DOI":"10.1016\/j.patcog.2023.110084"},{"key":"28_CR12","doi-asserted-by":"publisher","unstructured":"Thangavel, K., Palanisamy, N., Muthusamy, S., et al.: A novel method for image captioning using multimodal feature fusion employing mask RNN and LSTM models. Soft Computing. 27(18), 14205\u201314218 (2023). https:\/\/doi.org\/10.1007\/s00500-023-08448-7","DOI":"10.1007\/s00500-023-08448-7"},{"key":"28_CR13","doi-asserted-by":"crossref","unstructured":"Wang, H., Tan, A.H., Nejat, G.: NavFormer: A Transformer Architecture for Robot Target-Driven Navigation in Unknown and Dynamic Environments. ArXiv:abs\/2402.06838 (2024)","DOI":"10.1109\/LRA.2024.3412638"},{"key":"28_CR14","doi-asserted-by":"crossref","unstructured":"Zhang, C., Wang, C., Xu, Q.: MobileNet-deeplabv3+ based robot passable path segmentation and navigation line extraction. In: Proceedings of the 7th International Conference on Computer Science and Application Engineering (2023)","DOI":"10.1145\/3627915.3628092"},{"key":"28_CR15","doi-asserted-by":"publisher","first-page":"365","DOI":"10.1007\/s10462-022-10174-9","volume":"56","author":"S Park","year":"2022","unstructured":"Park, S., Kim, Y.: Visual language navigation: a survey and open challenges. Artif. Intell. Rev. 56, 365\u2013427 (2022)","journal-title":"Artif. Intell. Rev."},{"key":"28_CR16","doi-asserted-by":"publisher","first-page":"269","DOI":"10.1007\/BF01386390","volume":"1","author":"EW Dijkstra","year":"1959","unstructured":"Dijkstra, E.W.: A note on two problems in connexion with graphs. Numer. Math. 1, 269\u2013271 (1959)","journal-title":"Numer. Math."},{"key":"28_CR17","doi-asserted-by":"publisher","unstructured":"Hart, P.E., Nilsson, N.J., Raphael, B.: A formal basis for the heuristic determination of minimum cost paths. IEEE Transact. Syt. Sci. Cybern. 4(2), 100\u2013107 (1968). https:\/\/doi.org\/10.1109\/TSSC.1968.300136","DOI":"10.1109\/TSSC.1968.300136"},{"key":"28_CR18","unstructured":"LaValle, S.M.: Rapidly-exploring random trees: A new tool for path planning. The Annual Research Report (1998)"},{"key":"28_CR19","doi-asserted-by":"crossref","unstructured":"Almazrouei, K.S., Kamel, I.,Rabie, T.: Dynamic obstacle avoidance and path planning through reinforcement learning. Applied Sciences (2023)","DOI":"10.3390\/app13148174"},{"key":"28_CR20","doi-asserted-by":"crossref","unstructured":"Liu, H., Shen, Y., Yu, S., Gao, Z., Wu, T.: Deep Reinforcement Learning for Mobile Robot Path Planning. arXiv preprint arXiv:2404.06974 (2024)","DOI":"10.53469\/jtpes.2024.04(04).07"},{"key":"28_CR21","doi-asserted-by":"crossref","unstructured":"Xu, S., Wang, H., Gao, J., Ouyang, Y., Yu, C., Wu, Y.: LAGOON: Language-Guided Motion Control. arXiv preprint arXiv:2306.10518 (2024)","DOI":"10.1109\/ICRA57147.2024.10610467"},{"key":"28_CR22","doi-asserted-by":"crossref","unstructured":"Zand, M., Kodur, K.C., Kyrarini, M.: Automatic generation of robot actions for collaborative tasks from speech. In: 2023 9th International Conference on Automation, Robotics and Applications (ICARA), pp. 155\u2013159 (2023)","DOI":"10.1109\/ICARA56516.2023.10125800"},{"key":"28_CR23","doi-asserted-by":"crossref","unstructured":"Zhou, G., Hong, Y., Wu, Q.: NavGPT: explicit reasoning in vision-and-language navigation with large language models. In: AAAI Conference on Artificial Intelligence (2023)","DOI":"10.1609\/aaai.v38i7.28597"},{"key":"28_CR24","doi-asserted-by":"crossref","unstructured":"Anderson, P., et al.: Vision-and-Language Navigation: Interpreting visually-grounded navigation instructions in real environments. arXiv preprint arXiv:1711.07280 (2018)","DOI":"10.1109\/CVPR.2018.00387"},{"issue":"1054","key":"28_CR25","doi-asserted-by":"publisher","first-page":"1054","DOI":"10.1109\/TNN.1998.712192","volume":"9","author":"RS Sutton","year":"1998","unstructured":"Sutton, R.S., Barto, A.G.: Reinforcement learning: an introduction. IEEE Trans. Neural Networks 9(1054), 1054 (1998)","journal-title":"IEEE Trans. Neural Networks"},{"key":"28_CR26","doi-asserted-by":"crossref","unstructured":"Hafner, M., et al.: CLIP and complementary methods. Nature Reviews Methods Primers 1 (2011)","DOI":"10.1038\/s43586-021-00018-1"},{"key":"28_CR27","unstructured":"Vaswani, A., et al.: Attention is all you need. In: Neural Information Processing Systems (2017)"},{"key":"28_CR28","doi-asserted-by":"publisher","first-page":"2278","DOI":"10.1109\/5.726791","volume":"86","author":"Y LeCun","year":"1998","unstructured":"LeCun, Y., Bottou, L., Bengio, Y., Haffner, P.: Gradient-based learning applied to document recognition. Proc. IEEE 86, 2278\u20132324 (1998)","journal-title":"Proc. IEEE"},{"key":"28_CR29","doi-asserted-by":"publisher","first-page":"1735","DOI":"10.1162\/neco.1997.9.8.1735","volume":"9","author":"S Hochreiter","year":"1997","unstructured":"Hochreiter, S., Schmidhuber, J.: Long short-term memory. Neural Comput. 9, 1735\u20131780 (1997)","journal-title":"Neural Comput."}],"container-title":["Lecture Notes in Computer Science","Intelligent Robotics and Applications"],"original-title":[],"language":"en","link":[{"URL":"https:\/\/link.springer.com\/content\/pdf\/10.1007\/978-981-96-0789-1_28","content-type":"unspecified","content-version":"vor","intended-application":"similarity-checking"}],"deposited":{"date-parts":[[2025,1,23]],"date-time":"2025-01-23T19:26:24Z","timestamp":1737660384000},"score":1,"resource":{"primary":{"URL":"https:\/\/link.springer.com\/10.1007\/978-981-96-0789-1_28"}},"subtitle":[],"short-title":[],"issued":{"date-parts":[[2025]]},"ISBN":["9789819607884","9789819607891"],"references-count":29,"URL":"https:\/\/doi.org\/10.1007\/978-981-96-0789-1_28","relation":{},"ISSN":["0302-9743","1611-3349"],"issn-type":[{"type":"print","value":"0302-9743"},{"type":"electronic","value":"1611-3349"}],"subject":[],"published":{"date-parts":[[2025]]},"assertion":[{"value":"24 January 2025","order":1,"name":"first_online","label":"First Online","group":{"name":"ChapterHistory","label":"Chapter History"}},{"value":"ICIRA","order":1,"name":"conference_acronym","label":"Conference Acronym","group":{"name":"ConferenceInfo","label":"Conference Information"}},{"value":"International Conference on Intelligent Robotics and Applications","order":2,"name":"conference_name","label":"Conference Name","group":{"name":"ConferenceInfo","label":"Conference Information"}},{"value":"Xi'an","order":3,"name":"conference_city","label":"Conference City","group":{"name":"ConferenceInfo","label":"Conference Information"}},{"value":"China","order":4,"name":"conference_country","label":"Conference Country","group":{"name":"ConferenceInfo","label":"Conference Information"}},{"value":"2024","order":5,"name":"conference_year","label":"Conference Year","group":{"name":"ConferenceInfo","label":"Conference Information"}},{"value":"31 July 2024","order":7,"name":"conference_start_date","label":"Conference Start Date","group":{"name":"ConferenceInfo","label":"Conference Information"}},{"value":"2 August 2024","order":8,"name":"conference_end_date","label":"Conference End Date","group":{"name":"ConferenceInfo","label":"Conference Information"}},{"value":"17","order":9,"name":"conference_number","label":"Conference Number","group":{"name":"ConferenceInfo","label":"Conference Information"}},{"value":"icira2024","order":10,"name":"conference_id","label":"Conference ID","group":{"name":"ConferenceInfo","label":"Conference Information"}},{"value":"http:\/\/www.icira2024.org","order":11,"name":"conference_url","label":"Conference URL","group":{"name":"ConferenceInfo","label":"Conference Information"}}]}}