{"status":"ok","message-type":"work","message-version":"1.0.0","message":{"indexed":{"date-parts":[[2025,2,21]],"date-time":"2025-02-21T01:21:45Z","timestamp":1740100905029,"version":"3.37.3"},"reference-count":27,"publisher":"IEEE","license":[{"start":{"date-parts":[[2022,7,18]],"date-time":"2022-07-18T00:00:00Z","timestamp":1658102400000},"content-version":"stm-asf","delay-in-days":0,"URL":"https:\/\/doi.org\/10.15223\/policy-029"},{"start":{"date-parts":[[2022,7,18]],"date-time":"2022-07-18T00:00:00Z","timestamp":1658102400000},"content-version":"stm-asf","delay-in-days":0,"URL":"https:\/\/doi.org\/10.15223\/policy-037"}],"funder":[{"DOI":"10.13039\/501100001809","name":"NSFC","doi-asserted-by":"publisher","award":["62072399,U19B2042"],"award-info":[{"award-number":["62072399,U19B2042"]}],"id":[{"id":"10.13039\/501100001809","id-type":"DOI","asserted-by":"publisher"}]}],"content-domain":{"domain":[],"crossmark-restriction":false},"short-container-title":[],"published-print":{"date-parts":[[2022,7,18]]},"DOI":"10.1109\/icme52920.2022.9859991","type":"proceedings-article","created":{"date-parts":[[2022,8,26]],"date-time":"2022-08-26T19:45:18Z","timestamp":1661543118000},"page":"1-6","source":"Crossref","is-referenced-by-count":0,"title":["Diverse Instance Discovery: Vision-Transformer for Instance-Aware Multi-Label Image Recognition"],"prefix":"10.1109","author":[{"given":"Yunqing","family":"Hu","sequence":"first","affiliation":[{"name":"College of Computer Science and Technology, Zhejiang University,Hangzhou,China"}]},{"given":"Xuan","family":"Jin","sequence":"additional","affiliation":[{"name":"Alibaba Group,Hangzhou,China"}]},{"given":"Yin","family":"Zhang","sequence":"additional","affiliation":[{"name":"College of Computer Science and Technology, Zhejiang University,Hangzhou,China"}]},{"given":"Haiwen","family":"Hong","sequence":"additional","affiliation":[{"name":"College of Computer Science and Technology, Zhejiang University,Hangzhou,China"}]},{"given":"Jingfeng","family":"Zhang","sequence":"additional","affiliation":[{"name":"College of Computer Science and Technology, Zhejiang University,Hangzhou,China"}]},{"given":"Feihu","family":"Yan","sequence":"additional","affiliation":[{"name":"College of Computer Science and Technology, Zhejiang University,Hangzhou,China"}]},{"given":"Yuan","family":"He","sequence":"additional","affiliation":[{"name":"Alibaba Group,Hangzhou,China"}]},{"given":"Hui","family":"Xue","sequence":"additional","affiliation":[{"name":"Alibaba Group,Hangzhou,China"}]}],"member":"263","reference":[{"key":"ref10","doi-asserted-by":"publisher","DOI":"10.1109\/ICCV.2019.00061"},{"key":"ref11","doi-asserted-by":"publisher","DOI":"10.24963\/ijcai.2021\/163"},{"key":"ref12","first-page":"1696","article-title":"Joint input and output space learning for multi-label image classification","volume":"23","author":"xu","year":"2020","journal-title":"TMM"},{"key":"ref13","doi-asserted-by":"publisher","DOI":"10.1109\/TPAMI.2016.2577031"},{"key":"ref14","article-title":"Semi-supervised classification with graph convolutional networks","author":"kipf","year":"2016","journal-title":"ArXiv Preprint"},{"key":"ref15","article-title":"An image is worth 16x16 words: Transformers for image recognition at scale","author":"dosovitskiy","year":"0","journal-title":"ICLRE"},{"key":"ref16","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR46437.2021.01621"},{"key":"ref17","doi-asserted-by":"publisher","DOI":"10.1109\/ICCV48922.2021.00025"},{"key":"ref18","doi-asserted-by":"publisher","DOI":"10.1109\/TIP.2021.3088605"},{"key":"ref19","doi-asserted-by":"publisher","DOI":"10.18653\/v1\/2020.acl-main.385"},{"key":"ref4","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR.2016.90"},{"key":"ref27","doi-asserted-by":"publisher","DOI":"10.1109\/ICCV48922.2021.00015"},{"key":"ref3","doi-asserted-by":"publisher","DOI":"10.1007\/978-3-319-46466-4_41"},{"key":"ref6","first-page":"248","article-title":"Imagenet: A large-scale hierarchical image database","author":"deng","year":"2009","journal-title":"CVPR"},{"key":"ref5","doi-asserted-by":"publisher","DOI":"10.1109\/ICME46284.2020.9102906"},{"key":"ref8","doi-asserted-by":"publisher","DOI":"10.1109\/ICME.2019.00113"},{"key":"ref7","doi-asserted-by":"publisher","DOI":"10.1109\/TPAMI.2015.2491929"},{"key":"ref2","article-title":"The hateful memes challenge: Detecting hate speech in multimodal memes","volume":"33","author":"kiela","year":"2020","journal-title":"NeurIPS"},{"key":"ref9","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR.2019.00532"},{"key":"ref1","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR46437.2021.00700"},{"key":"ref20","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR.2016.319"},{"key":"ref22","doi-asserted-by":"publisher","DOI":"10.1007\/s11263-009-0275-4"},{"key":"ref21","first-page":"740","article-title":"Microsoft coco: Common objects in context","author":"lin","year":"2014","journal-title":"ECCV"},{"key":"ref24","doi-asserted-by":"publisher","DOI":"10.1609\/aaai.v34i07.6964"},{"key":"ref23","doi-asserted-by":"publisher","DOI":"10.1007\/s11263-014-0733-5"},{"key":"ref26","first-page":"464","article-title":"Multi-label image recognition by recurrently dis-covering attentional regions","author":"wang","year":"0","journal-title":"ICCV"},{"key":"ref25","doi-asserted-by":"publisher","DOI":"10.1007\/978-3-030-58589-1_39"}],"event":{"name":"2022 IEEE International Conference on Multimedia and Expo (ICME)","start":{"date-parts":[[2022,7,18]]},"location":"Taipei, Taiwan","end":{"date-parts":[[2022,7,22]]}},"container-title":["2022 IEEE International Conference on Multimedia and Expo (ICME)"],"original-title":[],"link":[{"URL":"http:\/\/xplorestaging.ieee.org\/ielx7\/9859562\/9858923\/09859991.pdf?arnumber=9859991","content-type":"unspecified","content-version":"vor","intended-application":"similarity-checking"}],"deposited":{"date-parts":[[2022,9,19]],"date-time":"2022-09-19T20:24:53Z","timestamp":1663619093000},"score":1,"resource":{"primary":{"URL":"https:\/\/ieeexplore.ieee.org\/document\/9859991\/"}},"subtitle":[],"short-title":[],"issued":{"date-parts":[[2022,7,18]]},"references-count":27,"URL":"https:\/\/doi.org\/10.1109\/icme52920.2022.9859991","relation":{},"subject":[],"published":{"date-parts":[[2022,7,18]]}}}