{"status":"ok","message-type":"work","message-version":"1.0.0","message":{"indexed":{"date-parts":[[2026,1,2]],"date-time":"2026-01-02T07:44:04Z","timestamp":1767339844569,"version":"3.28.0"},"reference-count":20,"publisher":"IEEE","license":[{"start":{"date-parts":[[2023,5,17]],"date-time":"2023-05-17T00:00:00Z","timestamp":1684281600000},"content-version":"stm-asf","delay-in-days":0,"URL":"https:\/\/doi.org\/10.15223\/policy-029"},{"start":{"date-parts":[[2023,5,17]],"date-time":"2023-05-17T00:00:00Z","timestamp":1684281600000},"content-version":"stm-asf","delay-in-days":0,"URL":"https:\/\/doi.org\/10.15223\/policy-037"}],"content-domain":{"domain":[],"crossmark-restriction":false},"short-container-title":[],"published-print":{"date-parts":[[2023,5,17]]},"DOI":"10.1109\/jurse57346.2023.10144168","type":"proceedings-article","created":{"date-parts":[[2023,6,8]],"date-time":"2023-06-08T17:28:26Z","timestamp":1686245306000},"page":"1-4","source":"Crossref","is-referenced-by-count":4,"title":["Building Usage Classification Using a Transformer-based Multimodal Deep Learning Method"],"prefix":"10.1109","author":[{"given":"Wen","family":"Zhou","sequence":"first","affiliation":[{"name":"University of Twente,TC Faculty,Dept. of Earth Observation Science,Enschede,The Netherlands"}]},{"given":"Claudio","family":"Persello","sequence":"additional","affiliation":[{"name":"University of Twente,TC Faculty,Dept. of Earth Observation Science,Enschede,The Netherlands"}]},{"given":"Alfred","family":"Stein","sequence":"additional","affiliation":[{"name":"University of Twente,TC Faculty,Dept. of Earth Observation Science,Enschede,The Netherlands"}]}],"member":"263","reference":[{"key":"ref13","doi-asserted-by":"publisher","DOI":"10.1109\/JSTARS.2021.3107543"},{"key":"ref12","doi-asserted-by":"publisher","DOI":"10.1016\/j.rse.2019.111458"},{"journal-title":"Code for classification of urban land use and planning standards of development land[S]","year":"2018","key":"ref15"},{"key":"ref14","article-title":"Attention Is All You Need","author":"ashish","year":"2017","journal-title":"31st Conference on Neural Information Processing Systems (NIPS 2017)"},{"key":"ref20","first-page":"218","article-title":"A Comparative Analysis of Classification Methods to Multi-label Tasks in Different Application Domainsf","volume":"3","author":"santos","year":"2011","journal-title":"International Journal of Computer Information Systems and Industrial Management Applications"},{"key":"ref11","doi-asserted-by":"publisher","DOI":"10.1016\/j.rse.2018.04.050"},{"key":"ref10","doi-asserted-by":"publisher","DOI":"10.1145\/3281548.3281559"},{"key":"ref2","doi-asserted-by":"publisher","DOI":"10.1016\/j.isprsjprs.2021.06.010"},{"key":"ref1","doi-asserted-by":"publisher","DOI":"10.1016\/j.rse.2019.04.014"},{"journal-title":"Supervised multimodal bitransformers for classifying images and text","year":"2020","author":"kiela","key":"ref17"},{"key":"ref16","article-title":"An Image is Worth 16x16 Words: Transformers for Image Recognition at Scale","author":"dosovitskiy","year":"2020","journal-title":"ICLRE"},{"key":"ref19","first-page":"3549","author":"zhang","year":"0","journal-title":"ResNet or DenseNet? Introducing Dense Shortcuts to ResNet"},{"key":"ref18","first-page":"4171","article-title":"BERT: Pre-training of Deep Bidirectional Transformers for Language Understanding","author":"devlin","year":"2019","journal-title":"In Proceedings of the 2019 Conference of the North American Chapter of the Association for Computational Linguistics Human Language Technologies"},{"key":"ref8","doi-asserted-by":"publisher","DOI":"10.1016\/j.rse.2018.05.006"},{"key":"ref7","doi-asserted-by":"publisher","DOI":"10.1016\/j.rse.2018.06.034"},{"key":"ref9","doi-asserted-by":"publisher","DOI":"10.1109\/TGRS.2015.2488681"},{"key":"ref4","doi-asserted-by":"publisher","DOI":"10.1109\/TPAMI.2018.2798607"},{"key":"ref3","doi-asserted-by":"publisher","DOI":"10.1016\/S1361-9209(96)00010-7"},{"key":"ref6","doi-asserted-by":"publisher","DOI":"10.1016\/j.isprsjprs.2022.04.006"},{"key":"ref5","first-page":"2425","author":"antol","year":"0","journal-title":"Vqa Visual question answering"}],"event":{"name":"2023 Joint Urban Remote Sensing Event (JURSE)","start":{"date-parts":[[2023,5,17]]},"location":"Heraklion, Greece","end":{"date-parts":[[2023,5,19]]}},"container-title":["2023 Joint Urban Remote Sensing Event (JURSE)"],"original-title":[],"link":[{"URL":"http:\/\/xplorestaging.ieee.org\/ielx7\/10144111\/10144082\/10144168.pdf?arnumber=10144168","content-type":"unspecified","content-version":"vor","intended-application":"similarity-checking"}],"deposited":{"date-parts":[[2023,6,26]],"date-time":"2023-06-26T18:01:08Z","timestamp":1687802468000},"score":1,"resource":{"primary":{"URL":"https:\/\/ieeexplore.ieee.org\/document\/10144168\/"}},"subtitle":[],"short-title":[],"issued":{"date-parts":[[2023,5,17]]},"references-count":20,"URL":"https:\/\/doi.org\/10.1109\/jurse57346.2023.10144168","relation":{},"subject":[],"published":{"date-parts":[[2023,5,17]]}}}