{"status":"ok","message-type":"work","message-version":"1.0.0","message":{"indexed":{"date-parts":[[2026,6,26]],"date-time":"2026-06-26T01:33:12Z","timestamp":1782437592424,"version":"3.54.5"},"reference-count":60,"publisher":"Institute of Electrical and Electronics Engineers (IEEE)","license":[{"start":{"date-parts":[[2022,1,1]],"date-time":"2022-01-01T00:00:00Z","timestamp":1640995200000},"content-version":"vor","delay-in-days":0,"URL":"https:\/\/creativecommons.org\/licenses\/by\/4.0\/legalcode"}],"funder":[{"DOI":"10.13039\/501100013148","name":"Science and Technology Foundation of State Grid Corporation of China","doi-asserted-by":"publisher","award":["52789921001M"],"award-info":[{"award-number":["52789921001M"]}],"id":[{"id":"10.13039\/501100013148","id-type":"DOI","asserted-by":"publisher"}]}],"content-domain":{"domain":[],"crossmark-restriction":false},"short-container-title":["IEEE J. Sel. Top. Appl. Earth Observations Remote Sensing"],"published-print":{"date-parts":[[2022]]},"DOI":"10.1109\/jstars.2022.3145042","type":"journal-article","created":{"date-parts":[[2022,1,25]],"date-time":"2022-01-25T20:33:38Z","timestamp":1643142818000},"page":"1884-1901","source":"Crossref","is-referenced-by-count":31,"title":["Transformer-Driven Semantic Relation Inference for Multilabel Classification of High-Resolution Remote Sensing Images"],"prefix":"10.1109","volume":"15","author":[{"ORCID":"https:\/\/orcid.org\/0000-0003-4497-4352","authenticated-orcid":false,"given":"Xiaowei","family":"Tan","sequence":"first","affiliation":[{"name":"State Key Laboratory of Information Engineering in Surveying, Mapping, and Remote Sensing, Wuhan University, Wuhan, China"}],"role":[{"vocabulary":"crossref","role":"author"}]},{"ORCID":"https:\/\/orcid.org\/0000-0002-8239-2268","authenticated-orcid":false,"given":"Zhifeng","family":"Xiao","sequence":"additional","affiliation":[{"name":"State Key Laboratory of Information Engineering in Surveying, Mapping, and Remote Sensing, Wuhan University, Wuhan, China"}],"role":[{"vocabulary":"crossref","role":"author"}]},{"given":"Jianjun","family":"Zhu","sequence":"additional","affiliation":[{"name":"National Bio Energy Company Ltd., Beijing, China"}],"role":[{"vocabulary":"crossref","role":"author"}]},{"given":"Qiao","family":"Wan","sequence":"additional","affiliation":[{"name":"State Key Laboratory of Information Engineering in Surveying, Mapping, and Remote Sensing, Wuhan University, Wuhan, China"}],"role":[{"vocabulary":"crossref","role":"author"}]},{"given":"Kai","family":"Wang","sequence":"additional","affiliation":[{"name":"School of Remote Sensing and Information Engineering, Wuhan University, Wuhan, China"}],"role":[{"vocabulary":"crossref","role":"author"}]},{"given":"Deren","family":"Li","sequence":"additional","affiliation":[{"name":"State Key Laboratory of Information Engineering in Surveying, Mapping, and Remote Sensing, Wuhan University, Wuhan, China"}],"role":[{"vocabulary":"crossref","role":"author"}]}],"member":"263","reference":[{"key":"ref1","first-page":"19","article-title":"Very deep convolutional networks for large-scale image recognition","volume-title":"Proc. 3rd Int. Conf. Learn. Representations","author":"Simonyan","year":"2015"},{"key":"ref2","doi-asserted-by":"publisher","DOI":"10.4324\/9781410605337-29"},{"key":"ref3","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR.2016.90"},{"key":"ref4","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR.2017.243"},{"key":"ref5","doi-asserted-by":"publisher","DOI":"10.1109\/TGRS.2018.2869101"},{"key":"ref6","doi-asserted-by":"publisher","DOI":"10.3390\/rs13010073"},{"key":"ref7","doi-asserted-by":"publisher","DOI":"10.1109\/LGRS.2020.2976551"},{"key":"ref8","doi-asserted-by":"publisher","DOI":"10.1109\/TIP.2020.3045634"},{"key":"ref9","doi-asserted-by":"publisher","DOI":"10.1117\/1.JRS.11.016017"},{"key":"ref10","doi-asserted-by":"publisher","DOI":"10.3788\/OPE.20172501.0198"},{"key":"ref11","doi-asserted-by":"publisher","DOI":"10.1109\/LGRS.2021.3075712"},{"key":"ref12","doi-asserted-by":"publisher","DOI":"10.1109\/TNNLS.2021.3071369"},{"key":"ref13","doi-asserted-by":"publisher","DOI":"10.1109\/LGRS.2019.2960026"},{"key":"ref14","first-page":"2027","article-title":"Learning spatial regularization with image-level supervisions for multi-label image classification","volume-title":"Proc. IEEE Conf. Comput. Vis. Pattern Recognit.","author":"Feng","year":"2017"},{"key":"ref15","doi-asserted-by":"publisher","DOI":"10.1109\/TPAMI.2015.2491929"},{"key":"ref16","doi-asserted-by":"publisher","DOI":"10.1007\/978-3-319-77380-3_30"},{"key":"ref17","doi-asserted-by":"publisher","DOI":"10.1109\/TGRS.2019.2963364"},{"key":"ref18","doi-asserted-by":"publisher","DOI":"10.1109\/TGRS.2020.2979552"},{"key":"ref19","doi-asserted-by":"publisher","DOI":"10.1109\/JSTARS.2021.3091134"},{"key":"ref20","first-page":"1691","article-title":"Generative pretraining from pixels","volume-title":"Proc. Int. Conf. Mach. Learn.","volume":"119","author":"Chen","year":"2020"},{"key":"ref21","article-title":"An image is worth 1616 words: Transformers for image recognition at scale","volume-title":"Int. Conf. Learn. Representations","author":"Dosovitskiy","year":"2021"},{"key":"ref22","doi-asserted-by":"publisher","DOI":"10.1016\/j.patcog.2004.03.009"},{"key":"ref23","doi-asserted-by":"publisher","DOI":"10.1016\/j.jbi.2014.12.011"},{"key":"ref24","doi-asserted-by":"publisher","DOI":"10.1007\/978-3-642-04174-7_17"},{"key":"ref25","doi-asserted-by":"publisher","DOI":"10.1007\/s10994-008-5064-8"},{"key":"ref26","doi-asserted-by":"publisher","DOI":"10.1007\/978-3-540-74958-5_38"},{"key":"ref27","doi-asserted-by":"publisher","DOI":"10.1016\/j.patcog.2006.12.019"},{"key":"ref28","doi-asserted-by":"publisher","DOI":"10.7551\/mitpress\/1120.003.0092"},{"key":"ref29","doi-asserted-by":"publisher","DOI":"10.1007\/3-540-44794-6_4"},{"key":"ref30","doi-asserted-by":"publisher","DOI":"10.21236\/ADA440081"},{"key":"ref31","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR.2014.414"},{"key":"ref32","doi-asserted-by":"publisher","DOI":"10.1007\/978-3-319-10602-1_26"},{"key":"ref33","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR.2016.37"},{"key":"ref34","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR.2016.251"},{"key":"ref35","doi-asserted-by":"publisher","DOI":"10.1109\/ICCV.2017.58"},{"key":"ref36","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR.2016.325"},{"key":"ref37","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR.2019.00532"},{"key":"ref38","doi-asserted-by":"publisher","DOI":"10.1109\/ICCV.2019.00061"},{"key":"ref39","doi-asserted-by":"publisher","DOI":"10.1609\/aaai.v34i07.6909"},{"key":"ref40","doi-asserted-by":"publisher","DOI":"10.1016\/j.isprsjprs.2019.01.015"},{"key":"ref41","doi-asserted-by":"publisher","DOI":"10.1109\/ACCESS.2020.2995805"},{"key":"ref42","doi-asserted-by":"publisher","DOI":"10.3390\/rs12071110"},{"key":"ref43","first-page":"1300","article-title":"Multi-label classification using conditional dependency networks","volume-title":"Proc. 22nd Int. Joint Conf. Artif. Intell.","author":"Guo"},{"key":"ref44","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR.2007.383230"},{"key":"ref45","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR.2015.7299037"},{"key":"ref46","first-page":"430","article-title":"Multi-label image classification with a probabilistic label enhancement model","volume-title":"Proc. 30th Conf. Uncertainty Artif. Intell.","author":"Li","year":"2014"},{"key":"ref47","doi-asserted-by":"publisher","DOI":"10.5220\/0008940304940505"},{"key":"ref48","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR.2019.00532"},{"key":"ref49","doi-asserted-by":"publisher","DOI":"10.3390\/rs12234003"},{"key":"ref50","doi-asserted-by":"publisher","DOI":"10.1016\/j.neucom.2019.05.024"},{"key":"ref51","first-page":"2204","article-title":"Recurrent models of visual attention","volume-title":"Proc. Adv. Neural Inf. Process. Syst.","author":"Mnih","year":"2014"},{"key":"ref52","doi-asserted-by":"publisher","DOI":"10.1146\/annurev.neuro.26.041002.131047"},{"key":"ref53","first-page":"6000","article-title":"Attention is all you need","volume-title":"Proc. Adv. Neural Inf. Process. Syst.","author":"Vaswani","year":"2017"},{"key":"ref54","doi-asserted-by":"publisher","DOI":"10.1007\/978-3-030-58452-8_13"},{"key":"ref55","article-title":"Transunet: Transformers make strong encoders for medical image segmentation","author":"Chen","year":"2021"},{"key":"ref56","doi-asserted-by":"publisher","DOI":"10.1109\/LGRS.2021.3109061"},{"key":"ref57","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR.2016.319"},{"key":"ref58","doi-asserted-by":"publisher","DOI":"10.1109\/TGRS.2017.2760909"},{"key":"ref59","doi-asserted-by":"publisher","DOI":"10.1016\/j.isprsjprs.2020.09.020"},{"key":"ref60","doi-asserted-by":"publisher","DOI":"10.1109\/LGRS.2017.2671922"}],"container-title":["IEEE Journal of Selected Topics in Applied Earth Observations and Remote Sensing"],"original-title":[],"link":[{"URL":"http:\/\/xplorestaging.ieee.org\/ielx7\/4609443\/9656571\/09691842.pdf?arnumber=9691842","content-type":"unspecified","content-version":"vor","intended-application":"similarity-checking"}],"deposited":{"date-parts":[[2024,1,13]],"date-time":"2024-01-13T22:18:57Z","timestamp":1705184337000},"score":1,"resource":{"primary":{"URL":"https:\/\/ieeexplore.ieee.org\/document\/9691842\/"}},"subtitle":[],"short-title":[],"issued":{"date-parts":[[2022]]},"references-count":60,"URL":"https:\/\/doi.org\/10.1109\/jstars.2022.3145042","relation":{},"ISSN":["1939-1404","2151-1535"],"issn-type":[{"value":"1939-1404","type":"print"},{"value":"2151-1535","type":"electronic"}],"subject":[],"published":{"date-parts":[[2022]]}}}