{"status":"ok","message-type":"work","message-version":"1.0.0","message":{"indexed":{"date-parts":[[2025,5,13]],"date-time":"2025-05-13T22:51:03Z","timestamp":1747176663888,"version":"3.40.5"},"reference-count":24,"publisher":"Informa UK Limited","issue":"18","content-domain":{"domain":["www.tandfonline.com"],"crossmark-restriction":true},"short-container-title":["Advanced Robotics"],"published-print":{"date-parts":[[2024,9,16]]},"DOI":"10.1080\/01691864.2024.2366995","type":"journal-article","created":{"date-parts":[[2024,6,28]],"date-time":"2024-06-28T07:27:55Z","timestamp":1719559675000},"page":"1255-1264","update-policy":"https:\/\/doi.org\/10.1080\/tandf_crossmark_01","source":"Crossref","is-referenced-by-count":0,"title":["Robotic environmental state recognition with pre-trained vision-language models and black-box optimization"],"prefix":"10.1080","volume":"38","author":[{"ORCID":"https:\/\/orcid.org\/0000-0002-7464-7187","authenticated-orcid":false,"given":"Kento","family":"Kawaharazuka","sequence":"first","affiliation":[{"name":"The Department of Mechano-Informatics, Graduate School of Information Science and Technology, The University of Tokyo, Bunkyo-ku, Tokyo, Japan"}]},{"ORCID":"https:\/\/orcid.org\/0000-0003-1429-4401","authenticated-orcid":false,"given":"Yoshiki","family":"Obinata","sequence":"additional","affiliation":[{"name":"The Department of Mechano-Informatics, Graduate School of Information Science and Technology, The University of Tokyo, Bunkyo-ku, Tokyo, Japan"}]},{"given":"Naoaki","family":"Kanazawa","sequence":"additional","affiliation":[{"name":"The Department of Mechano-Informatics, Graduate School of Information Science and Technology, The University of Tokyo, Bunkyo-ku, Tokyo, Japan"}]},{"given":"Kei","family":"Okada","sequence":"additional","affiliation":[{"name":"The Department of Mechano-Informatics, Graduate School of Information Science and Technology, The University of Tokyo, Bunkyo-ku, Tokyo, Japan"}]},{"given":"Masayuki","family":"Inaba","sequence":"additional","affiliation":[{"name":"The Department of Mechano-Informatics, Graduate School of Information Science and Technology, The University of Tokyo, Bunkyo-ku, Tokyo, Japan"}]}],"member":"301","published-online":{"date-parts":[[2024,6,28]]},"reference":[{"key":"e_1_3_2_2_1","doi-asserted-by":"publisher","DOI":"10.1109\/ICHR.2006.321356"},{"key":"e_1_3_2_3_1","unstructured":"Saito M Chen H Okada K et al. Semantic object search in large-scale indoor environments. In: IEEE\/RSJ International Conference on Intelligent Robots and Systems Workshop on Active Semantic Perception and Object Search in the Real World; San Francisco USA; 2011."},{"key":"e_1_3_2_4_1","doi-asserted-by":"publisher","DOI":"10.1145\/6462.6464"},{"key":"e_1_3_2_5_1","doi-asserted-by":"publisher","DOI":"10.1016\/j.autcon.2017.10.016"},{"key":"e_1_3_2_6_1","doi-asserted-by":"publisher","DOI":"10.1177\/1729881420932715"},{"key":"e_1_3_2_7_1","doi-asserted-by":"publisher","DOI":"10.1109\/ROBOT.2010.5509923"},{"key":"e_1_3_2_8_1","doi-asserted-by":"publisher","DOI":"10.3390\/s20205753"},{"key":"e_1_3_2_9_1","unstructured":"Li F Zhang H Zhang Y et\u00a0al. Vision-language intelligence: tasks representation learning and large models. arXiv preprint arXiv:2203.01922 2022."},{"key":"e_1_3_2_10_1","unstructured":"Li J Li D Savarese S et al. BLIP-2: bootstrapping language-image pre-training with frozen image encoders and large language models. In: Proceedings of the 40th International Conference on Machine Learning;\u00a0Hawaii USA; 2023. p. 19730\u201319742."},{"key":"e_1_3_2_11_1","unstructured":"Wang P Yang A Men R et al. OFA: unifying architectures tasks and modalities through a simple sequence-to-sequence learning framework. In: Proceedings of the 39th International Conference on Machine Learning; Maryland USA; 2022. p. 23318\u201323340."},{"key":"e_1_3_2_12_1","unstructured":"Radford A Kim JW Hallacy C et\u00a0al. Learning transferable visual models from natural language supervision. In: Proceedings of the 38th International Conference on Machine Learning. 2021. p. 8748\u20138763."},{"key":"e_1_3_2_13_1","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR52729.2023.01457"},{"key":"e_1_3_2_14_1","doi-asserted-by":"publisher","DOI":"10.1109\/ICRA48891.2023.10160969"},{"key":"e_1_3_2_15_1","unstructured":"Shafiullah NMM Paxton C Pinto L et\u00a0al. CLIP-fields: weakly supervised semantic fields for robotic memory. In: Proceedings of the 2020 Robotics: Science and Systems. 2023. p. 1\u201311."},{"key":"e_1_3_2_16_1","unstructured":"Liu Z Bahety A Song S. REFLECT: summarizing robot experiences for failure explanation and correction. In: Proceedings of the 2023 Conference on Robot Learning; Georgia USA; 2023. p. 1\u201317."},{"key":"e_1_3_2_17_1","unstructured":"Huang W Wang C Zhang R et al. VoxPoser: composable 3D value maps for robotic manipulation with language models. In: Proceedings of the 2023 Conference on Robot Learning; Georgia USA; 2023. p. 1\u201323."},{"key":"e_1_3_2_18_1","unstructured":"Shah D Equi MR Osi\u0144ski B et al. Navigation with large language models: semantic guesswork as a heuristic for planning. In: Proceedings of the 2023 Conference on Robot Learning; Georgia USA; 2023. p. 2683\u20132699."},{"key":"e_1_3_2_19_1","unstructured":"Shridhar M Manuelli L Fox D. CLIPort: what and where pathways for robotic manipulation. In: Proceedings of the 2021 Conference on Robot Learning;\u00a0London UK; 2021. p. 1\u201313."},{"key":"e_1_3_2_20_1","doi-asserted-by":"publisher","DOI":"10.1109\/Humanoids57100.2023.10375211"},{"key":"e_1_3_2_21_1","doi-asserted-by":"publisher","DOI":"10.1109\/ICRA48891.2023.10160390"},{"key":"e_1_3_2_22_1","first-page":"2171","article-title":"DEAP: evolutionary algorithms made easy","volume":"13","author":"Fortin F","year":"2012","unstructured":"Fortin F, Rainville FD, Gardner M, et\u00a0al. DEAP: evolutionary algorithms made easy. J Mach Learn Res. 2012;13:2171\u20132175.","journal-title":"J Mach Learn Res"},{"key":"e_1_3_2_23_1","doi-asserted-by":"publisher","DOI":"10.1109\/LRA.2024.3375257"},{"key":"e_1_3_2_24_1","unstructured":"Achiam J Adler S Agarwal S et\u00a0al. GPT-4 technical report. arXiv preprint arXiv:2303.08774. 2023."},{"key":"e_1_3_2_25_1","doi-asserted-by":"publisher","DOI":"10.1007\/978-3-031-44851-5_42"}],"container-title":["Advanced Robotics"],"original-title":[],"language":"en","link":[{"URL":"https:\/\/www.tandfonline.com\/doi\/pdf\/10.1080\/01691864.2024.2366995","content-type":"unspecified","content-version":"vor","intended-application":"similarity-checking"}],"deposited":{"date-parts":[[2024,10,17]],"date-time":"2024-10-17T17:40:15Z","timestamp":1729186815000},"score":1,"resource":{"primary":{"URL":"https:\/\/www.tandfonline.com\/doi\/full\/10.1080\/01691864.2024.2366995"}},"subtitle":[],"short-title":[],"issued":{"date-parts":[[2024,6,28]]},"references-count":24,"journal-issue":{"issue":"18","published-print":{"date-parts":[[2024,9,16]]}},"alternative-id":["10.1080\/01691864.2024.2366995"],"URL":"https:\/\/doi.org\/10.1080\/01691864.2024.2366995","relation":{},"ISSN":["0169-1864","1568-5535"],"issn-type":[{"type":"print","value":"0169-1864"},{"type":"electronic","value":"1568-5535"}],"subject":[],"published":{"date-parts":[[2024,6,28]]},"assertion":[{"value":"The publishing and review policy for this title is described in its Aims & Scope.","order":1,"name":"peerreview_statement","label":"Peer Review Statement"},{"value":"http:\/\/www.tandfonline.com\/action\/journalInformation?show=aimsScope&journalCode=tadr20","URL":"http:\/\/www.tandfonline.com\/action\/journalInformation?show=aimsScope&journalCode=tadr20","order":2,"name":"aims_and_scope_url","label":"Aim & Scope"},{"value":"2023-10-31","order":0,"name":"received","label":"Received","group":{"name":"publication_history","label":"Publication History"}},{"value":"2024-03-26","order":1,"name":"revised","label":"Revised","group":{"name":"publication_history","label":"Publication History"}},{"value":"2024-05-31","order":2,"name":"accepted","label":"Accepted","group":{"name":"publication_history","label":"Publication History"}},{"value":"2024-06-28","order":3,"name":"published","label":"Published","group":{"name":"publication_history","label":"Publication History"}}]}}