{"status":"ok","message-type":"work","message-version":"1.0.0","message":{"indexed":{"date-parts":[[2026,1,21]],"date-time":"2026-01-21T18:19:01Z","timestamp":1769019541524,"version":"3.49.0"},"reference-count":17,"publisher":"IEEE","license":[{"start":{"date-parts":[[2025,1,21]],"date-time":"2025-01-21T00:00:00Z","timestamp":1737417600000},"content-version":"stm-asf","delay-in-days":0,"URL":"https:\/\/doi.org\/10.15223\/policy-029"},{"start":{"date-parts":[[2025,1,21]],"date-time":"2025-01-21T00:00:00Z","timestamp":1737417600000},"content-version":"stm-asf","delay-in-days":0,"URL":"https:\/\/doi.org\/10.15223\/policy-037"}],"content-domain":{"domain":[],"crossmark-restriction":false},"short-container-title":[],"published-print":{"date-parts":[[2025,1,21]]},"DOI":"10.1109\/sii59315.2025.10870971","type":"proceedings-article","created":{"date-parts":[[2025,2,12]],"date-time":"2025-02-12T18:17:07Z","timestamp":1739384227000},"page":"193-198","source":"Crossref","is-referenced-by-count":3,"title":["Scalable, Training-Free Visual Language Robotics: a modular multi-model framework for consumer-grade GPUs"],"prefix":"10.1109","author":[{"given":"Marie","family":"Samson","sequence":"first","affiliation":[{"name":"National Institute of Advanced Industrial Science and Technology (AIST),CNRS-AIST JRL (Joint Robotics Laboratory),Japan"}],"role":[{"role":"author","vocabulary":"crossref"}]},{"given":"Bastien","family":"Muraccioli","sequence":"additional","affiliation":[{"name":"National Institute of Advanced Industrial Science and Technology (AIST),CNRS-AIST JRL (Joint Robotics Laboratory),Japan"}],"role":[{"role":"author","vocabulary":"crossref"}]},{"given":"Fumio","family":"Kanehiro","sequence":"additional","affiliation":[{"name":"National Institute of Advanced Industrial Science and Technology (AIST),CNRS-AIST JRL (Joint Robotics Laboratory),Japan"}],"role":[{"role":"author","vocabulary":"crossref"}]}],"member":"263","reference":[{"key":"ref1","article-title":"Open x-embodiment: Robotic learning datasets and rt-x models","author":"Collaboration","year":"2024"},{"key":"ref2","article-title":"Openvla: An open-source vision-language-action model","author":"Kim","year":"2024"},{"key":"ref3","article-title":"Rt-2: Vision-language-action models transfer web knowledge to robotic control","author":"Brohan","year":"2023"},{"key":"ref4","article-title":"Pali-x: On scaling up a multilingual vision and language model","author":"Chen","year":"2023"},{"key":"ref5","article-title":"Palm-e: An embodied multimodal language model","author":"Driess","year":"2023"},{"key":"ref6","article-title":"Few-shot image classification and segmentation as visual question answering using vision-language models","author":"Meng","year":"2024"},{"key":"ref7","doi-asserted-by":"publisher","DOI":"10.1109\/ICCV51070.2023.00371"},{"key":"ref8","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR.2016.91"},{"key":"ref9","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR52688.2022.00695"},{"key":"ref10","author":"Yoshida","year":"2023","journal-title":"From text to motion: Grounding gpt-4 in a humanoid robot \"alter3\""},{"key":"ref11","volume-title":"Gpt-4 technical report","author":"Achiam","year":"2024"},{"key":"ref12","article-title":"Language to rewards for robotic skill synthesis","author":"Yu","year":"2023"},{"key":"ref13","article-title":"Predictive sampling: Real-time behaviour synthesis with mujoco","author":"Howell","year":"2022"},{"key":"ref14","article-title":"Large language models for robotics: A survey","author":"Zeng","year":"2023"},{"key":"ref15","first-page":"arXiv:2404.14219","article-title":"Phi-3 Technical Report: A Highly Capable Language Model Locally on Your Phone","author":"Abdin","year":"2024"},{"key":"ref16","article-title":"Internvl: Scaling up vision foundation models and aligning for generic visual-linguistic tasks","author":"Chen","year":"2024"},{"key":"ref17","volume-title":"all-minilm-l6-v2","author":"Reimers","year":"2021"}],"event":{"name":"2025 IEEE\/SICE International Symposium on System Integration (SII)","location":"Munich, Germany","start":{"date-parts":[[2025,1,21]]},"end":{"date-parts":[[2025,1,24]]}},"container-title":["2025 IEEE\/SICE International Symposium on System Integration (SII)"],"original-title":[],"link":[{"URL":"http:\/\/xplorestaging.ieee.org\/ielx8\/10870372\/10870581\/10870971.pdf?arnumber=10870971","content-type":"unspecified","content-version":"vor","intended-application":"similarity-checking"}],"deposited":{"date-parts":[[2025,2,20]],"date-time":"2025-02-20T19:49:30Z","timestamp":1740080970000},"score":1,"resource":{"primary":{"URL":"https:\/\/ieeexplore.ieee.org\/document\/10870971\/"}},"subtitle":[],"short-title":[],"issued":{"date-parts":[[2025,1,21]]},"references-count":17,"URL":"https:\/\/doi.org\/10.1109\/sii59315.2025.10870971","relation":{},"subject":[],"published":{"date-parts":[[2025,1,21]]}}}