{"status":"ok","message-type":"work","message-version":"1.0.0","message":{"indexed":{"date-parts":[[2025,9,11]],"date-time":"2025-09-11T19:40:34Z","timestamp":1757619634230,"version":"3.44.0"},"publisher-location":"Singapore","reference-count":18,"publisher":"Springer Nature Singapore","isbn-type":[{"type":"print","value":"9789819699070"},{"type":"electronic","value":"9789819699087"}],"license":[{"start":{"date-parts":[[2025,1,1]],"date-time":"2025-01-01T00:00:00Z","timestamp":1735689600000},"content-version":"tdm","delay-in-days":0,"URL":"https:\/\/www.springernature.com\/gp\/researchers\/text-and-data-mining"},{"start":{"date-parts":[[2025,1,1]],"date-time":"2025-01-01T00:00:00Z","timestamp":1735689600000},"content-version":"vor","delay-in-days":0,"URL":"https:\/\/www.springernature.com\/gp\/researchers\/text-and-data-mining"}],"content-domain":{"domain":["link.springer.com"],"crossmark-restriction":false},"short-container-title":[],"published-print":{"date-parts":[[2025]]},"DOI":"10.1007\/978-981-96-9908-7_11","type":"book-chapter","created":{"date-parts":[[2025,7,24]],"date-time":"2025-07-24T16:26:17Z","timestamp":1753374377000},"page":"125-139","update-policy":"https:\/\/doi.org\/10.1007\/springer_crossmark_policy","source":"Crossref","is-referenced-by-count":0,"title":["ILearnRobot: An Interactive Learning-Based Multi-modal Robot with Continuous Improvement"],"prefix":"10.1007","author":[{"ORCID":"https:\/\/orcid.org\/0009-0006-9720-7156","authenticated-orcid":false,"given":"Kohou","family":"Wang","sequence":"first","affiliation":[],"role":[{"role":"author","vocabulary":"crossref"}]},{"ORCID":"https:\/\/orcid.org\/0009-0003-2492-403X","authenticated-orcid":false,"given":"ZhaoXiang","family":"Liu","sequence":"additional","affiliation":[],"role":[{"role":"author","vocabulary":"crossref"}]},{"ORCID":"https:\/\/orcid.org\/0009-0009-6035-2482","authenticated-orcid":false,"given":"Lin","family":"Bai","sequence":"additional","affiliation":[],"role":[{"role":"author","vocabulary":"crossref"}]},{"ORCID":"https:\/\/orcid.org\/0009-0007-4958-4907","authenticated-orcid":false,"given":"Kun","family":"Fan","sequence":"additional","affiliation":[],"role":[{"role":"author","vocabulary":"crossref"}]},{"ORCID":"https:\/\/orcid.org\/0000-0002-1267-0277","authenticated-orcid":false,"given":"Xiang","family":"Liu","sequence":"additional","affiliation":[],"role":[{"role":"author","vocabulary":"crossref"}]},{"ORCID":"https:\/\/orcid.org\/0009-0009-6697-3220","authenticated-orcid":false,"given":"Huan","family":"Hu","sequence":"additional","affiliation":[],"role":[{"role":"author","vocabulary":"crossref"}]},{"ORCID":"https:\/\/orcid.org\/0000-0002-1171-0281","authenticated-orcid":false,"given":"Kai","family":"Wang","sequence":"additional","affiliation":[],"role":[{"role":"author","vocabulary":"crossref"}]},{"ORCID":"https:\/\/orcid.org\/0000-0003-4308-7049","authenticated-orcid":false,"given":"Shiguo","family":"Lian","sequence":"additional","affiliation":[],"role":[{"role":"author","vocabulary":"crossref"}]}],"member":"297","published-online":{"date-parts":[[2025,7,25]]},"reference":[{"key":"11_CR1","doi-asserted-by":"crossref","unstructured":"Chi, T.C., Shen, M., Eric, M., Kim, S., Hakkani-Tur, D.: Just ask: An interactive learning framework for vision and language navigation. In: Proceedings of the AAAI conference on artificial intelligence. 34, 2459--2466 (2020)","DOI":"10.1609\/aaai.v34i03.5627"},{"key":"11_CR2","doi-asserted-by":"crossref","unstructured":"Deng, Y., Guo, D., Guo, X., Zhang, N., Liu, H., Sun, F.: Mqa: Answering the question via robotic manipulation. arXiv preprint arXiv:2003.04641 (2020)","DOI":"10.15607\/RSS.2021.XVII.044"},{"key":"11_CR3","unstructured":"Driess, D., Xia, F., Sajjadi, M.S., Lynch, C., Chowdhery, A., Ichter, B., Wahid, A., Tompson, J., Vuong, Q., Yu, T., et al.: Palm-e: An embodied multimodal language model. arXiv preprint arXiv:2303.03378 (2023)"},{"key":"11_CR4","unstructured":"Hu, E.J., Shen, Y., Wallis, P., Allen-Zhu, Z., Li, Y., Wang, S., Wang, L., Chen, W.: Lora: Low-rank adaptation of large language models. arXiv preprint arXiv:2106.09685 (2021)"},{"issue":"2","key":"11_CR5","doi-asserted-by":"publisher","first-page":"139","DOI":"10.1080\/23270012.2020.1756939","volume":"7","author":"Y Kang","year":"2020","unstructured":"Kang, Y., Cai, Z., Tan, C.W., Huang, Q., Liu, H.: Natural language processing (nlp) in management research: A literature review. Journal of Management Analytics. 7(2), 139\u2013172 (2020)","journal-title":"Journal of Management Analytics."},{"key":"11_CR6","doi-asserted-by":"crossref","unstructured":"Kenfack, F.K., Siddiky, F.A., Balint-Benczedi, F., Beetz, M.: Robotvqa\u2014a scenegraph-and deep-learning-based visual question answering system for robot manipulation. In: 2020 IEEE\/RSJ International Conference on Intelligent Robots and Systems (IROS). 9667--9674 (2020)","DOI":"10.1109\/IROS45743.2020.9341186"},{"key":"11_CR7","unstructured":"Liu, H., Li, C., Li, Y., Li, B., Zhang, Y., Shen, S., Lee, Y.J.: Llava-next: Improved reasoning, ocr, and world knowledge. (2024)"},{"key":"11_CR8","first-page":"2434","volume":"36","author":"H Liu","year":"2024","unstructured":"Liu, H., Li, C., Wu, Q., Lee, Y.J.: Visual instruction tuning. Adv. Neural. Inf. Process. Syst. 36, 2434\u20132447 (2024)","journal-title":"Adv. Neural. Inf. Process. Syst."},{"key":"11_CR9","doi-asserted-by":"crossref","unstructured":"Menezes, J.C.: Mumodar: Multi-modal framework for human-robot collaboration in cyber-physical systems. In: Companion of the 2024 ACM\/IEEE International Conference on Human-Robot Interaction. 755--759 (2024)","DOI":"10.1145\/3610978.3640688"},{"issue":"3","key":"11_CR10","doi-asserted-by":"publisher","first-page":"722","DOI":"10.3390\/s20030722","volume":"20","author":"S M\u00fcller","year":"2020","unstructured":"M\u00fcller, S., Wengefeld, T., Trinh, T.Q., Aganian, D., Eisenbach, M., Gross, H.M.: A multi-modal person perception framework for socially interactive mobile service robots. Sensors. 20(3), 722 (2020)","journal-title":"Sensors."},{"key":"11_CR11","unstructured":"Paranjape, B., Lundberg, S., Singh, S., Hajishirzi, H., Zettlemoyer, L., Ribeiro, M.T.: Art: Automatic multi-step reasoning and tool-use for large language models. arXiv preprint arXiv:2303.09014 (2023)"},{"key":"11_CR12","unstructured":"Radford, A., Kim, J.W., Hallacy, C., Ramesh, A., Goh, G., Agarwal, S., Sastry, G., Askell, A., Mishkin, P., Clark, J., et al.: Learning transferable visual models from natural language supervision. In: International conference on machine learning. 8748--8763 (2021)"},{"key":"11_CR13","doi-asserted-by":"crossref","unstructured":"Thomason, J., Padmakumar, A., Sinapov, J., Walker, N., Jiang, Y., Yedidsion, H., Hart, J., Stone, P., Mooney, R.J.: Improving grounded natural language understanding through human-robot dialog. In: 2019 International Conference on Robotics and Automation (ICRA). 6934--6941 (2019)","DOI":"10.1109\/ICRA.2019.8794287"},{"key":"11_CR14","doi-asserted-by":"crossref","unstructured":"Wu, J., Gan, W., Chen, Z., Wan, S., Philip, S.Y.: Multimodal large language models: A survey. In: 2023 IEEE International Conference on Big Data (BigData). 2247--2256 (2023)","DOI":"10.1109\/BigData59044.2023.10386743"},{"key":"11_CR15","unstructured":"Yang, Z., Li, L., Wang, J., Lin, K., Azarnasab, E., Ahmed, F., Liu, Z., Liu, C., Zeng, M., Wang, L.: Mm-react: Prompting chatgpt for multimodal reasoning and action. arXiv preprint arXiv:2303.11381 (2023)"},{"key":"11_CR16","doi-asserted-by":"crossref","unstructured":"Yao, Y., Duan, J., Xu, K., Cai, Y., Sun, Z., Zhang, Y.: A survey on large language model (llm) security and privacy: The good, the bad, and the ugly. High-Confidence Computing. 100211 (2024)","DOI":"10.1016\/j.hcc.2024.100211"},{"key":"11_CR17","doi-asserted-by":"crossref","unstructured":"Zha, L., Cui, Y., Lin, L.H., Kwon, M., Arenas, M.G., Zeng, A., Xia, F., Sadigh, D.: Distilling and retrieving generalizable knowledge for robot manipulation via language corrections. arXiv preprint arXiv:2311.10678 (2023)","DOI":"10.1109\/ICRA57147.2024.10610455"},{"key":"11_CR18","doi-asserted-by":"crossref","unstructured":"Zhu, F., Zhu, Y., Chang, X., Liang, X.: Vision-language navigation with self-supervised auxiliary reasoning tasks. In: Proceedings of the IEEE\/CVF conference on computer vision and pattern recognition. 10012--10022 (2020)","DOI":"10.1109\/CVPR42600.2020.01003"}],"container-title":["Lecture Notes in Computer Science","Advanced Intelligent Computing Technology and Applications"],"original-title":[],"language":"en","link":[{"URL":"https:\/\/link.springer.com\/content\/pdf\/10.1007\/978-981-96-9908-7_11","content-type":"unspecified","content-version":"vor","intended-application":"similarity-checking"}],"deposited":{"date-parts":[[2025,9,7]],"date-time":"2025-09-07T22:04:10Z","timestamp":1757282650000},"score":1,"resource":{"primary":{"URL":"https:\/\/link.springer.com\/10.1007\/978-981-96-9908-7_11"}},"subtitle":[],"short-title":[],"issued":{"date-parts":[[2025]]},"ISBN":["9789819699070","9789819699087"],"references-count":18,"URL":"https:\/\/doi.org\/10.1007\/978-981-96-9908-7_11","relation":{},"ISSN":["0302-9743","1611-3349"],"issn-type":[{"type":"print","value":"0302-9743"},{"type":"electronic","value":"1611-3349"}],"subject":[],"published":{"date-parts":[[2025]]},"assertion":[{"value":"25 July 2025","order":1,"name":"first_online","label":"First Online","group":{"name":"ChapterHistory","label":"Chapter History"}},{"value":"ICIC","order":1,"name":"conference_acronym","label":"Conference Acronym","group":{"name":"ConferenceInfo","label":"Conference Information"}},{"value":"International Conference on Intelligent Computing","order":2,"name":"conference_name","label":"Conference Name","group":{"name":"ConferenceInfo","label":"Conference Information"}},{"value":"Ningbo","order":3,"name":"conference_city","label":"Conference City","group":{"name":"ConferenceInfo","label":"Conference Information"}},{"value":"China","order":4,"name":"conference_country","label":"Conference Country","group":{"name":"ConferenceInfo","label":"Conference Information"}},{"value":"2025","order":5,"name":"conference_year","label":"Conference Year","group":{"name":"ConferenceInfo","label":"Conference Information"}},{"value":"26 July 2025","order":7,"name":"conference_start_date","label":"Conference Start Date","group":{"name":"ConferenceInfo","label":"Conference Information"}},{"value":"29 July 2025","order":8,"name":"conference_end_date","label":"Conference End Date","group":{"name":"ConferenceInfo","label":"Conference Information"}},{"value":"21","order":9,"name":"conference_number","label":"Conference Number","group":{"name":"ConferenceInfo","label":"Conference Information"}},{"value":"icic2025","order":10,"name":"conference_id","label":"Conference ID","group":{"name":"ConferenceInfo","label":"Conference Information"}},{"value":"http:\/\/www.ic-icc.cn\/icg\/","order":11,"name":"conference_url","label":"Conference URL","group":{"name":"ConferenceInfo","label":"Conference Information"}}]}}