{"status":"ok","message-type":"work","message-version":"1.0.0","message":{"indexed":{"date-parts":[[2025,12,1]],"date-time":"2025-12-01T11:29:30Z","timestamp":1764588570101,"version":"3.28.0"},"reference-count":22,"publisher":"IEEE","license":[{"start":{"date-parts":[[2024,10,27]],"date-time":"2024-10-27T00:00:00Z","timestamp":1729987200000},"content-version":"stm-asf","delay-in-days":0,"URL":"https:\/\/doi.org\/10.15223\/policy-029"},{"start":{"date-parts":[[2024,10,27]],"date-time":"2024-10-27T00:00:00Z","timestamp":1729987200000},"content-version":"stm-asf","delay-in-days":0,"URL":"https:\/\/doi.org\/10.15223\/policy-037"}],"content-domain":{"domain":[],"crossmark-restriction":false},"short-container-title":[],"published-print":{"date-parts":[[2024,10,27]]},"DOI":"10.1109\/icip51287.2024.10647728","type":"proceedings-article","created":{"date-parts":[[2024,9,27]],"date-time":"2024-09-27T18:34:45Z","timestamp":1727462085000},"page":"2599-2605","source":"Crossref","is-referenced-by-count":1,"title":["Towards Generalizable Referring Image Segmentation Via Target Prompt And Visual Coherence"],"prefix":"10.1109","author":[{"given":"Yajie","family":"Liu","sequence":"first","affiliation":[{"name":"Beihang University,School of Computer Science and Engineering,Beijing,China"}]},{"given":"Pu","family":"Ge","sequence":"additional","affiliation":[{"name":"Hangzhou Innovation Institute Beihang University,Beijing,China"}]},{"given":"Haoxiang","family":"Ma","sequence":"additional","affiliation":[{"name":"Beihang University,School of Computer Science and Engineering,Beijing,China"}]},{"given":"Shichao","family":"Fan","sequence":"additional","affiliation":[{"name":"Beihang University,School of Computer Science and Engineering,Beijing,China"}]},{"given":"Qingjie","family":"Liu","sequence":"additional","affiliation":[{"name":"Beihang University,School of Computer Science and Engineering,Beijing,China"}]},{"given":"Di","family":"Huang","sequence":"additional","affiliation":[{"name":"Beihang University,School of Computer Science and Engineering,Beijing,China"}]},{"given":"Yunhong","family":"Wang","sequence":"additional","affiliation":[{"name":"Beihang University,School of Computer Science and Engineering,Beijing,China"}]}],"member":"263","reference":[{"key":"ref1","doi-asserted-by":"publisher","DOI":"10.1007\/978-3-319-46475-6_5"},{"key":"ref2","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR52688.2022.01762"},{"key":"ref3","first-page":"787","article-title":"Referring to objects in photographs of natural scenes","volume":"28","author":"KAZEMZADE","year":"2014","journal-title":"EMNLP"},{"key":"ref4","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR42600.2020.01146"},{"key":"ref5","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR52688.2022.01267"},{"key":"ref6","doi-asserted-by":"publisher","DOI":"10.1109\/cvpr52733.2024.00394"},{"key":"ref7","doi-asserted-by":"publisher","DOI":"10.1007\/978-3-031-19818-2_42"},{"key":"ref8","doi-asserted-by":"publisher","DOI":"10.1109\/ICCV48922.2021.01601"},{"key":"ref9","first-page":"14729","article-title":"Coupalign: Coupling word-pixel with sentence-mask alignments for referring image segmentation","volume":"35","author":"Zhang","year":"2022","journal-title":"Advances in Neural Information Processing Systems"},{"key":"ref10","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR52729.2023.01789"},{"key":"ref11","doi-asserted-by":"publisher","DOI":"10.18653\/v1\/2022.acl-long.357"},{"key":"ref12","first-page":"8748","article-title":"Learning transferable visual models from natural language supervision","author":"Radford","year":"2021","journal-title":"ICML."},{"key":"ref13","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR52729.2023.01864"},{"key":"ref14","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR52729.2023.02257"},{"key":"ref15","first-page":"10012","article-title":"Swin transformer: Hierarchical vision transformer using shifted windows","author":"Liu","year":"2021","journal-title":"CVPR"},{"key":"ref16","doi-asserted-by":"publisher","DOI":"10.15607\/RSS.2018.XIV.028"},{"key":"ref17","doi-asserted-by":"publisher","DOI":"10.18653\/v1\/D15-1162"},{"key":"ref18","doi-asserted-by":"publisher","DOI":"10.1007\/s11263-022-01653-1"},{"key":"ref19","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR.2016.9"},{"key":"ref20","article-title":"The iapr tc-12 benchmark: A new evaluation resource for visual information systems","volume-title":"OntoImage 2006 Workshop on Language Resources for Content-based Image Retrieval during LREC 2006 Final Programme","volume":"2","author":"Grubinger"},{"key":"ref21","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR52688.2022.01139"},{"key":"ref22","doi-asserted-by":"publisher","DOI":"10.1109\/ICCV51070.2023.01605"}],"event":{"name":"2024 IEEE International Conference on Image Processing (ICIP)","start":{"date-parts":[[2024,10,27]]},"location":"Abu Dhabi, United Arab Emirates","end":{"date-parts":[[2024,10,30]]}},"container-title":["2024 IEEE International Conference on Image Processing (ICIP)"],"original-title":[],"link":[{"URL":"http:\/\/xplorestaging.ieee.org\/ielx8\/10647221\/10647122\/10647728.pdf?arnumber=10647728","content-type":"unspecified","content-version":"vor","intended-application":"similarity-checking"}],"deposited":{"date-parts":[[2024,9,28]],"date-time":"2024-09-28T05:15:33Z","timestamp":1727500533000},"score":1,"resource":{"primary":{"URL":"https:\/\/ieeexplore.ieee.org\/document\/10647728\/"}},"subtitle":[],"short-title":[],"issued":{"date-parts":[[2024,10,27]]},"references-count":22,"URL":"https:\/\/doi.org\/10.1109\/icip51287.2024.10647728","relation":{},"subject":[],"published":{"date-parts":[[2024,10,27]]}}}