{"status":"ok","message-type":"work","message-version":"1.0.0","message":{"indexed":{"date-parts":[[2026,5,6]],"date-time":"2026-05-06T15:07:49Z","timestamp":1778080069830,"version":"3.51.4"},"reference-count":39,"publisher":"Institute of Electrical and Electronics Engineers (IEEE)","issue":"2","license":[{"start":{"date-parts":[[2025,2,1]],"date-time":"2025-02-01T00:00:00Z","timestamp":1738368000000},"content-version":"vor","delay-in-days":0,"URL":"https:\/\/ieeexplore.ieee.org\/Xplorehelp\/downloads\/license-information\/IEEE.html"},{"start":{"date-parts":[[2025,2,1]],"date-time":"2025-02-01T00:00:00Z","timestamp":1738368000000},"content-version":"stm-asf","delay-in-days":0,"URL":"https:\/\/doi.org\/10.15223\/policy-029"},{"start":{"date-parts":[[2025,2,1]],"date-time":"2025-02-01T00:00:00Z","timestamp":1738368000000},"content-version":"stm-asf","delay-in-days":0,"URL":"https:\/\/doi.org\/10.15223\/policy-037"}],"funder":[{"DOI":"10.13039\/501100001809","name":"National Natural Science Foundation of China","doi-asserted-by":"publisher","award":["62373016"],"award-info":[{"award-number":["62373016"]}],"id":[{"id":"10.13039\/501100001809","id-type":"DOI","asserted-by":"publisher"}]},{"DOI":"10.13039\/501100001809","name":"National Natural Science Foundation of China","doi-asserted-by":"publisher","award":["62273012"],"award-info":[{"award-number":["62273012"]}],"id":[{"id":"10.13039\/501100001809","id-type":"DOI","asserted-by":"publisher"}]},{"name":"Open Projects Program of State Key Laboratory of Multimodal Artificial Intelligence Systems","award":["MAIS-2023-22"],"award-info":[{"award-number":["MAIS-2023-22"]}]}],"content-domain":{"domain":[],"crossmark-restriction":false},"short-container-title":["IEEE Trans. Ind. Inf."],"published-print":{"date-parts":[[2025,2]]},"DOI":"10.1109\/tii.2024.3488774","type":"journal-article","created":{"date-parts":[[2024,11,19]],"date-time":"2024-11-19T18:51:03Z","timestamp":1732042263000},"page":"1783-1792","source":"Crossref","is-referenced-by-count":6,"title":["Language-Guided Category Push\u2013Grasp Synergy Learning in Clutter by Efficiently Perceiving Object Manipulation Space"],"prefix":"10.1109","volume":"21","author":[{"ORCID":"https:\/\/orcid.org\/0000-0002-6418-0675","authenticated-orcid":false,"given":"Min","family":"Zhao","sequence":"first","affiliation":[{"name":"School of Information Science and Technology, Beijing University of Technology, Beijing, China"}]},{"ORCID":"https:\/\/orcid.org\/0000-0002-7624-4728","authenticated-orcid":false,"given":"Guoyu","family":"Zuo","sequence":"additional","affiliation":[{"name":"School of Information Science and Technology, Beijing University of Technology, Beijing, China"}]},{"ORCID":"https:\/\/orcid.org\/0000-0003-1673-0844","authenticated-orcid":false,"given":"Shuangyue","family":"Yu","sequence":"additional","affiliation":[{"name":"School of Information Science and Technology, Beijing University of Technology, Beijing, China"}]},{"ORCID":"https:\/\/orcid.org\/0000-0003-0651-8794","authenticated-orcid":false,"given":"Yongkang","family":"Luo","sequence":"additional","affiliation":[{"name":"Institute of Automation, Chinese Academy of Sciences, Beijing, China"}]},{"given":"Chunfang","family":"Liu","sequence":"additional","affiliation":[{"name":"School of Information Science and Technology, Beijing University of Technology, Beijing, China"}]},{"ORCID":"https:\/\/orcid.org\/0000-0003-2492-9159","authenticated-orcid":false,"given":"Daoxiong","family":"Gong","sequence":"additional","affiliation":[{"name":"School of Information Science and Technology, Beijing University of Technology, Beijing, China"}]}],"member":"263","reference":[{"key":"ref1","doi-asserted-by":"publisher","DOI":"10.1109\/TII.2020.2969680"},{"key":"ref2","doi-asserted-by":"publisher","DOI":"10.1109\/TIE.2022.3212422"},{"key":"ref3","doi-asserted-by":"publisher","DOI":"10.1109\/TIM.2023.3241078"},{"key":"ref4","doi-asserted-by":"publisher","DOI":"10.1109\/ICRA48506.2021.9561675"},{"key":"ref5","doi-asserted-by":"publisher","DOI":"10.1109\/TNNLS.2023.3244186"},{"key":"ref6","doi-asserted-by":"publisher","DOI":"10.1109\/LRA.2020.2970622"},{"key":"ref7","doi-asserted-by":"publisher","DOI":"10.1109\/ICRA48506.2021.9561073"},{"key":"ref8","doi-asserted-by":"publisher","DOI":"10.1109\/LRA.2022.3204822"},{"key":"ref9","doi-asserted-by":"publisher","DOI":"10.1109\/IROS55552.2023.10342533"},{"key":"ref10","first-page":"1140","article-title":"Segnext: Rethinking convolutional attention design for semantic segmentation","volume-title":"Proc. Adv. Neural Informat. Process. Syst.","volume":"35","author":"Guo","year":"2022"},{"key":"ref11","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR52688.2022.01755"},{"key":"ref12","first-page":"23033","article-title":"Segclip: Patch aggregation with learnable centers for open-vocabulary semantic segmentation","volume-title":"Proc. Int. Conf. Mach. Learn.","author":"Luo","year":"2023"},{"key":"ref13","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR52729.2023.00288"},{"key":"ref14","first-page":"32215","article-title":"Convolutions die hard: Open-vocabulary segmentation with single frozen convolutional clip","volume-title":"Proc. Adv. Neural Informat. Process. Syst.","volume":"36","author":"Yu","year":"2024"},{"key":"ref15","first-page":"8748","article-title":"Learning transferable visual models from natural language supervision","volume-title":"Proc. Int. Conf. Mach. Learn.","author":"Radford","year":"2021"},{"key":"ref16","doi-asserted-by":"publisher","DOI":"10.1109\/TCYB.2024.3381639"},{"key":"ref17","doi-asserted-by":"publisher","DOI":"10.1109\/IROS47612.2022.9981510"},{"key":"ref18","article-title":"Multimodal knowledge alignment with reinforcement learning","author":"Yu","year":"2022"},{"key":"ref19","first-page":"2026","article-title":"Visuo-tactile transformers for manipulation","volume-title":"Proc. 6th Annu. Conf. Robot Learn.","author":"Chen","year":"2022"},{"key":"ref20","doi-asserted-by":"publisher","DOI":"10.1109\/LRA.2024.3357432"},{"key":"ref21","article-title":"Reasoning grasping via multimodal large language model","author":"Jin","year":"2024"},{"key":"ref22","doi-asserted-by":"publisher","DOI":"10.1109\/IROS55552.2023.10341379"},{"key":"ref23","doi-asserted-by":"publisher","DOI":"10.1109\/icra48891.2023.10161041"},{"key":"ref24","article-title":"Language-guided robot grasping: Clip-based referring grasp synthesis in clutter","author":"Tziafas","year":"2023"},{"key":"ref25","first-page":"178","article-title":"Language embedded radiance fields for zero-shot task-oriented grasping","volume-title":"Proc. Conf. Robot Learn.","author":"Rashid","year":"2023"},{"key":"ref26","doi-asserted-by":"publisher","DOI":"10.1109\/ICRA48506.2021.9561994"},{"key":"ref27","doi-asserted-by":"publisher","DOI":"10.1109\/IROS55552.2023.10342331"},{"key":"ref28","doi-asserted-by":"publisher","DOI":"10.1109\/IROS.2018.8593986"},{"key":"ref29","doi-asserted-by":"publisher","DOI":"10.1109\/LRA.2021.3092640"},{"key":"ref30","doi-asserted-by":"publisher","DOI":"10.1049\/cit2.12264"},{"key":"ref31","doi-asserted-by":"publisher","DOI":"10.1109\/TCDS.2024.3357084"},{"key":"ref32","doi-asserted-by":"publisher","DOI":"10.1109\/TIM.2024.3379048"},{"key":"ref33","doi-asserted-by":"publisher","DOI":"10.1109\/TETCI.2022.3141105"},{"key":"ref34","article-title":"Playing atari with deep reinforcement learning","author":"Mnih"},{"key":"ref35","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR46437.2021.01350"},{"key":"ref36","doi-asserted-by":"publisher","DOI":"10.5555\/3045118.3045167"},{"key":"ref37","article-title":"Is attention better than matrix decomposition","volume-title":"Proc. Int. Conf. Learn. Representations","author":"Geng","year":"2020"},{"key":"ref38","doi-asserted-by":"publisher","DOI":"10.3390\/s20143816"},{"key":"ref39","doi-asserted-by":"publisher","DOI":"10.1177\/0278364919868017"}],"container-title":["IEEE Transactions on Industrial Informatics"],"original-title":[],"link":[{"URL":"http:\/\/xplorestaging.ieee.org\/ielx8\/9424\/10874841\/10758335.pdf?arnumber=10758335","content-type":"unspecified","content-version":"vor","intended-application":"similarity-checking"}],"deposited":{"date-parts":[[2025,2,6]],"date-time":"2025-02-06T06:04:09Z","timestamp":1738821849000},"score":1,"resource":{"primary":{"URL":"https:\/\/ieeexplore.ieee.org\/document\/10758335\/"}},"subtitle":[],"short-title":[],"issued":{"date-parts":[[2025,2]]},"references-count":39,"journal-issue":{"issue":"2"},"URL":"https:\/\/doi.org\/10.1109\/tii.2024.3488774","relation":{},"ISSN":["1551-3203","1941-0050"],"issn-type":[{"value":"1551-3203","type":"print"},{"value":"1941-0050","type":"electronic"}],"subject":[],"published":{"date-parts":[[2025,2]]}}}