{"status":"ok","message-type":"work","message-version":"1.0.0","message":{"indexed":{"date-parts":[[2026,5,4]],"date-time":"2026-05-04T23:29:18Z","timestamp":1777937358704,"version":"3.51.4"},"reference-count":26,"publisher":"IEEE","license":[{"start":{"date-parts":[[2024,11,26]],"date-time":"2024-11-26T00:00:00Z","timestamp":1732579200000},"content-version":"stm-asf","delay-in-days":0,"URL":"https:\/\/doi.org\/10.15223\/policy-029"},{"start":{"date-parts":[[2024,11,26]],"date-time":"2024-11-26T00:00:00Z","timestamp":1732579200000},"content-version":"stm-asf","delay-in-days":0,"URL":"https:\/\/doi.org\/10.15223\/policy-037"}],"content-domain":{"domain":[],"crossmark-restriction":false},"short-container-title":[],"published-print":{"date-parts":[[2024,11,26]]},"DOI":"10.1109\/fllm63129.2024.10852498","type":"proceedings-article","created":{"date-parts":[[2025,1,28]],"date-time":"2025-01-28T18:35:23Z","timestamp":1738089323000},"page":"501-507","source":"Crossref","is-referenced-by-count":25,"title":["VLM-Auto: VLM-based Autonomous Driving Assistant with Human-like Behavior and Understanding for Complex Road Scenes"],"prefix":"10.1109","author":[{"given":"Ziang","family":"Guo","sequence":"first","affiliation":[{"name":"Intelligent Space Robotics Laboratory Skoltech,Moscow,Russia"}]},{"given":"Zakhar","family":"Yagudin","sequence":"additional","affiliation":[{"name":"Intelligent Space Robotics Laboratory Skoltech,Moscow,Russia"}]},{"given":"Artem","family":"Lykov","sequence":"additional","affiliation":[{"name":"Intelligent Space Robotics Laboratory Skoltech,Moscow,Russia"}]},{"given":"Mikhail","family":"Konenkov","sequence":"additional","affiliation":[{"name":"Intelligent Space Robotics Laboratory Skoltech,Moscow,Russia"}]},{"given":"Dzmitry","family":"Tsetserukou","sequence":"additional","affiliation":[{"name":"Intelligent Space Robotics Laboratory Skoltech,Moscow,Russia"}]}],"member":"263","reference":[{"key":"ref1","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR52729.2023.01712"},{"key":"ref2","article-title":"Goal-oriented autonomous driving","author":"Hu","year":"2022"},{"key":"ref3","doi-asserted-by":"publisher","DOI":"10.1109\/cvpr52733.2024.01432"},{"key":"ref4","doi-asserted-by":"publisher","DOI":"10.1109\/SMC54092.2024.10831380"},{"key":"ref5","article-title":"Dme-driver: Integrating human decision logic and 3d scene perception in autonomous driving","author":"Han","year":"2024"},{"key":"ref6","article-title":"Llms can\u2019t plan, but can help planning in llm-modulo frameworks","author":"Kambhampati","year":"2024"},{"key":"ref7","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR52729.2023.01319"},{"key":"ref8","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR52729.2023.02105"},{"key":"ref9","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR52688.2022.01674"},{"key":"ref10","article-title":"Gpt-driver: Learning to drive with gpt","author":"Mao","year":"2023"},{"key":"ref11","doi-asserted-by":"publisher","DOI":"10.1145\/3610978.3641080"},{"key":"ref12","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR52733.2024.01416"},{"key":"ref13","article-title":"Llm-assist: Enhancing closed-loop planning with language-based reasoning","author":"Sharan","year":"2023"},{"key":"ref14","article-title":"Large language models for autonomous driving: Real-world experiments","author":"Cui","year":"2023"},{"key":"ref15","article-title":"Empowering autonomous driving with large language models: A safety perspective","author":"Wang","year":"2023"},{"key":"ref16","article-title":"Drivelm: Driving with graph visual question answering","author":"Sima","year":"2023"},{"key":"ref17","doi-asserted-by":"publisher","DOI":"10.15607\/RSS.2024.XX.075"},{"key":"ref18","article-title":"Drivevlm: The convergence of autonomous driving and large vision-language models","author":"Tian","year":"2024"},{"key":"ref19","article-title":"A survey on hallucination in large language models: Principles, taxonomy, challenges, and open questions","author":"Huang","year":"2023"},{"key":"ref20","first-page":"1","article-title":"CARLA: An open urban driving simulator","volume-title":"Proceedings of the 1st Annual Conference on Robot Learning","author":"Dosovitskiy"},{"key":"ref21","doi-asserted-by":"publisher","DOI":"10.1126\/scirobotics.abm6074"},{"key":"ref22","article-title":"Qwen-vl: A frontier large vision-language model with versatile abilities","author":"Bai","year":"2023"},{"key":"ref23","article-title":"Qwen technical report","author":"Bai","year":"2023"},{"key":"ref24","article-title":"Qlora: Efficient finetuning of quantized llms","volume":"36","author":"Dettmers","year":"2024","journal-title":"Advances in Neural Information Processing Systems"},{"key":"ref25","doi-asserted-by":"publisher","DOI":"10.1609\/aaai.v37i11.26505"},{"key":"ref26","doi-asserted-by":"publisher","DOI":"10.1109\/IV55156.2024.10588447"}],"event":{"name":"2024 2nd International Conference on Foundation and Large Language Models (FLLM)","location":"Dubai, United Arab Emirates","start":{"date-parts":[[2024,11,26]]},"end":{"date-parts":[[2024,11,29]]}},"container-title":["2024 2nd International Conference on Foundation and Large Language Models (FLLM)"],"original-title":[],"link":[{"URL":"http:\/\/xplorestaging.ieee.org\/ielx8\/10852419\/10852420\/10852498.pdf?arnumber=10852498","content-type":"unspecified","content-version":"vor","intended-application":"similarity-checking"}],"deposited":{"date-parts":[[2025,1,29]],"date-time":"2025-01-29T06:47:11Z","timestamp":1738133231000},"score":1,"resource":{"primary":{"URL":"https:\/\/ieeexplore.ieee.org\/document\/10852498\/"}},"subtitle":[],"short-title":[],"issued":{"date-parts":[[2024,11,26]]},"references-count":26,"URL":"https:\/\/doi.org\/10.1109\/fllm63129.2024.10852498","relation":{},"subject":[],"published":{"date-parts":[[2024,11,26]]}}}