{"status":"ok","message-type":"work","message-version":"1.0.0","message":{"indexed":{"date-parts":[[2026,3,21]],"date-time":"2026-03-21T19:16:53Z","timestamp":1774120613176,"version":"3.50.1"},"reference-count":16,"publisher":"IEEE","license":[{"start":{"date-parts":[[2024,8,28]],"date-time":"2024-08-28T00:00:00Z","timestamp":1724803200000},"content-version":"stm-asf","delay-in-days":0,"URL":"https:\/\/doi.org\/10.15223\/policy-029"},{"start":{"date-parts":[[2024,8,28]],"date-time":"2024-08-28T00:00:00Z","timestamp":1724803200000},"content-version":"stm-asf","delay-in-days":0,"URL":"https:\/\/doi.org\/10.15223\/policy-037"}],"content-domain":{"domain":[],"crossmark-restriction":false},"short-container-title":[],"published-print":{"date-parts":[[2024,8,28]]},"DOI":"10.1109\/iwis62722.2024.10706068","type":"proceedings-article","created":{"date-parts":[[2024,10,10]],"date-time":"2024-10-10T17:21:42Z","timestamp":1728580902000},"page":"1-4","source":"Crossref","is-referenced-by-count":2,"title":["Generating Robot Action Sequences: An Efficient Vision-Language Models with Visual Prompts"],"prefix":"10.1109","author":[{"given":"Weihao","family":"CAI","sequence":"first","affiliation":[{"name":"Ritsumeikan University,Interaction Laboratory,Osaka,Japan"}],"role":[{"role":"author","vocabulary":"crossref"}]},{"given":"Yoshiki","family":"MORI","sequence":"additional","affiliation":[{"name":"Ritsumeikan University,Interaction Laboratory,Osaka,Japan"}],"role":[{"role":"author","vocabulary":"crossref"}]},{"given":"Nobutaka","family":"SHIMADA","sequence":"additional","affiliation":[{"name":"Ritsumeikan University,Interaction Laboratory,Osaka,Japan"}],"role":[{"role":"author","vocabulary":"crossref"}]}],"member":"263","reference":[{"key":"ref1","doi-asserted-by":"publisher","DOI":"10.15607\/rss.2011.vii.008"},{"issue":"6","key":"ref2","doi-asserted-by":"crossref","first-page":"856","DOI":"10.1541\/ieejeiss.125.856","article-title":"Motion imitation of robots interacting with the 
environment through sensorimotor integration","volume":"125","author":"Onishi","year":"2005","journal-title":"IEEJ Trans. EIS"},{"key":"ref3","volume-title":"Openai api: Gpt-4o","year":"2024"},{"key":"ref4","volume-title":"Anthropic: Claude-3\u2013Opus","year":"2024"},{"key":"ref5","article-title":"Llm as a robotic brain: Unifying egocentric memory and control","author":"Mai","year":"2023","journal-title":"arXiv preprint 35"},{"key":"ref6","first-page":"17","article-title":"Blip-2: Bootstrapping language-image pre-training with frozen image encoders and large language models","author":"Li","year":"2023","journal-title":"arXiv preprint"},{"key":"ref7","doi-asserted-by":"publisher","DOI":"10.1109\/ACCESS.2023.3310935"},{"key":"ref8","first-page":"19","article-title":"Video chatcaptioner: Towards the enriched spatiotemporal descriptions","author":"Chen","year":"2023","journal-title":"arXiv preprint"},{"key":"ref9","doi-asserted-by":"publisher","DOI":"10.18653\/v1\/2023.findings-emnlp.755"},{"issue":"3","key":"ref10","article-title":"Fine-grained visual prompting","volume":"2","author":"Yang","year":"2023","journal-title":"arXiv preprint"},{"key":"ref11","article-title":"Set-of-mark prompting unleashes extraordinary visual grounding in gpt-4v","author":"Yang","year":"2023","journal-title":"arXiv preprint"},{"key":"ref12","article-title":"Moka: Open-vocabulary robotic manipulation through mark-based visual prompting","author":"Liu","year":"2024","journal-title":"arXiv preprint"},{"key":"ref13","article-title":"Look before you leap: Unveiling the power of gpt-4v in robotic vision-language planning","author":"Hu","year":"2023","journal-title":"arXiv preprint"},{"key":"ref14","volume-title":"RT CORPORATION","year":"2024"},{"key":"ref16","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR52688.2022.01042"},{"key":"ref17","volume-title":"Lora: Low-rank adaptation of large language models","author":"Hu","year":"2021"}],"event":{"name":"2024 International Workshop on Intelligent 
Systems (IWIS)","location":"Ulsan, Korea, Republic of","start":{"date-parts":[[2024,8,28]]},"end":{"date-parts":[[2024,8,30]]}},"container-title":["2024 International Workshop on Intelligent Systems (IWIS)"],"original-title":[],"link":[{"URL":"http:\/\/xplorestaging.ieee.org\/ielx8\/10706037\/10706026\/10706068.pdf?arnumber=10706068","content-type":"unspecified","content-version":"vor","intended-application":"similarity-checking"}],"deposited":{"date-parts":[[2024,10,11]],"date-time":"2024-10-11T04:33:27Z","timestamp":1728621207000},"score":1,"resource":{"primary":{"URL":"https:\/\/ieeexplore.ieee.org\/document\/10706068\/"}},"subtitle":[],"short-title":[],"issued":{"date-parts":[[2024,8,28]]},"references-count":16,"URL":"https:\/\/doi.org\/10.1109\/iwis62722.2024.10706068","relation":{},"subject":[],"published":{"date-parts":[[2024,8,28]]}}}