{"status":"ok","message-type":"work","message-version":"1.0.0","message":{"indexed":{"date-parts":[[2026,5,1]],"date-time":"2026-05-01T17:02:13Z","timestamp":1777654933596,"version":"3.51.4"},"reference-count":83,"publisher":"Tsinghua University Press","issue":"3","license":[{"start":{"date-parts":[[2023,9,1]],"date-time":"2023-09-01T00:00:00Z","timestamp":1693526400000},"content-version":"tdm","delay-in-days":0,"URL":"https:\/\/creativecommons.org\/licenses\/by\/4.0"},{"start":{"date-parts":[[2023,3,8]],"date-time":"2023-03-08T00:00:00Z","timestamp":1678233600000},"content-version":"vor","delay-in-days":0,"URL":"https:\/\/creativecommons.org\/licenses\/by\/4.0"}],"content-domain":{"domain":["link.springer.com"],"crossmark-restriction":false},"short-container-title":["Comp. Visual. Med."],"published-print":{"date-parts":[[2023,9]]},"DOI":"10.1007\/s41095-022-0325-1","type":"journal-article","created":{"date-parts":[[2023,3,8]],"date-time":"2023-03-08T13:02:50Z","timestamp":1678280570000},"page":"563-579","update-policy":"https:\/\/doi.org\/10.1007\/springer_crossmark_policy","source":"Crossref","is-referenced-by-count":26,"title":["D2ANet: Difference-aware attention network for multi-level change detection from satellite imagery"],"prefix":"10.26599","volume":"9","author":[{"given":"Jie","family":"Mei","sequence":"first","affiliation":[{"name":"TMCC, CS, Nankai University, Tianjin 300350, China"}],"role":[{"role":"author","vocabulary":"crossref"}]},{"given":"Yi-Bo","family":"Zheng","sequence":"additional","affiliation":[{"name":"State Key Laboratory of Earth Surface Processes and Resource Ecology, Faculty of Geographical Science, Beijing Normal University, Beijing 100875, China"}],"role":[{"role":"author","vocabulary":"crossref"}]},{"given":"Ming-Ming","family":"Cheng","sequence":"additional","affiliation":[{"name":"TMCC, CS, Nankai University, Tianjin 300350, China"}],"role":[{"role":"author","vocabulary":"crossref"}]}],"member":"11138","reference":[{"issue":"10","key":"325_CR1","doi-asserted-by":"publisher","first-page":"1688","DOI":"10.3390\/rs12101688","volume":"12","author":"W Z Shi","year":"2020","unstructured":"Shi, W. Z.; Zhang, M.; Zhang, R.; Chen, S. X.; Zhan, Z. Change detection based on artificial intelligence: State-of-the-art and challenges. Remote Sensing Vol. 12, No. 10, 1688, 2020.","journal-title":"Remote Sensing"},{"issue":"12","key":"325_CR2","doi-asserted-by":"publisher","first-page":"6408","DOI":"10.3390\/rs5126408","volume":"5","author":"C F Chen","year":"2013","unstructured":"Chen, C. F.; Son, N. T.; Chang, N. B.; Chen, C. R.; Chang, L. Y.; Valdez, M.; Centeno, G.; Thompson, C. A.; Aceituno, J. L. Multi-decadal mangrove forest change detection and prediction in Honduras, central America, with landsat imagery and a Markov chain model. Remote Sensing Vol. 5, No. 12, 6408\u20136426, 2013.","journal-title":"Remote Sensing"},{"issue":"3","key":"325_CR3","doi-asserted-by":"publisher","first-page":"1177","DOI":"10.1109\/TNNLS.2020.2980749","volume":"32","author":"L Y Li","year":"2021","unstructured":"Li, L. Y.; Yan, J. C.; Wang, H. Y.; Jin, Y. H. Anomaly detection of time series with smoothness-inducing sequential variational auto-encoder. IEEE Transactions on Neural Networks and Learning Systems Vol. 32, No. 3, 1177\u20131191, 2021.","journal-title":"IEEE Transactions on Neural Networks and Learning Systems"},{"issue":"16","key":"325_CR4","doi-asserted-by":"publisher","first-page":"1854","DOI":"10.3390\/rs11161854","volume":"11","author":"S Mahdavi","year":"2019","unstructured":"Mahdavi, S.; Salehi, B.; Huang, W. M.; Amani, M.; Brisco, B. A PolSAR change detection index based on neighborhood information for flood mapping. Remote Sensing Vol. 11, No. 16, 1854, 2019.","journal-title":"Remote Sensing"},{"key":"325_CR5","doi-asserted-by":"publisher","first-page":"83","DOI":"10.1016\/j.ins.2018.04.092","volume":"460\u2013461","author":"J Y Kim","year":"2018","unstructured":"Kim, J. Y.; Bu, S. J.; Cho, S. B. Zero-day malware detection using transferred generative adversarial networks based on deep autoencoders. Information Sciences Vols. 460\u2013461, 83\u2013102, 2018.","journal-title":"Information Sciences"},{"issue":"1","key":"325_CR6","doi-asserted-by":"publisher","first-page":"47","DOI":"10.1016\/j.jbi.2012.08.004","volume":"46","author":"M Hauskrecht","year":"2013","unstructured":"Hauskrecht, M.; Batal, I.; Valko, M.; Visweswaran, S.; Cooper, G. F.; Clermont, G. Outlier detection for patient monitoring and alerting. Journal of Biomedical Informatics Vol. 46, No. 1, 47\u201355, 2013.","journal-title":"Journal of Biomedical Informatics"},{"issue":"6","key":"325_CR7","doi-asserted-by":"publisher","first-page":"989","DOI":"10.1080\/01431168908903939","volume":"10","author":"A Singh","year":"1989","unstructured":"Singh, A. Digital change detection techniques using remotely-sensed data. International Journal of Remote Sensing Vol. 10, No. 6, 989\u20131003, 1989.","journal-title":"International Journal of Remote Sensing"},{"issue":"3","key":"325_CR8","doi-asserted-by":"publisher","first-page":"326","DOI":"10.1016\/j.rse.2005.09.008","volume":"99","author":"J Im","year":"2005","unstructured":"Im, J.; Jensen, J. R. A change detection model based on neighborhood correlation image analysis and decision tree classification. Remote Sensing of Environment Vol. 99, No. 3, 326\u2013340, 2005.","journal-title":"Remote Sensing of Environment"},{"issue":"8","key":"325_CR9","doi-asserted-by":"publisher","first-page":"1815","DOI":"10.1109\/TGRS.2002.802498","volume":"40","author":"T Kasetkasem","year":"2002","unstructured":"Kasetkasem, T.; Varshney, P. K. An image change detection algorithm based on Markov random field models. IEEE Transactions on Geoscience and Remote Sensing Vol. 40, No. 8, 1815\u20131823, 2002.","journal-title":"IEEE Transactions on Geoscience and Remote Sensing"},{"key":"325_CR10","doi-asserted-by":"crossref","unstructured":"Gueguen, L.; Hamid, R. Large-scale damage detection using satellite imagery. In: Proceedings of the IEEE Conference on Computer Vision and Pattern Recognition, 1321\u20131328, 2015.","DOI":"10.1109\/CVPR.2015.7298737"},{"issue":"4","key":"325_CR11","doi-asserted-by":"publisher","first-page":"1822","DOI":"10.1109\/TIP.2017.2784560","volume":"27","author":"Z G Liu","year":"2018","unstructured":"Liu, Z. G.; Li, G.; Mercier, G.; He, Y.; Pan, Q. Change detection in heterogenous remote sensing images via homogeneous pixel transformation. IEEE Transactions on Image Processing Vol. 27, No. 4, 1822\u20131834, 2018.","journal-title":"IEEE Transactions on Image Processing"},{"key":"325_CR12","doi-asserted-by":"publisher","unstructured":"Fu, J.; Liu, J.; Wang, Y. H.; Zhou, J.; Wang, C. Y.; Lu, H. Q. Stacked deconvolutional network for semantic segmentation. IEEE Transactions on Image Processing DOI: https:\/\/doi.org\/10.1109\/TIP.2019.2895460, 2019.","DOI":"10.1109\/TIP.2019.2895460"},{"key":"325_CR13","series-title":"Lecture Notes in Computer Science, Vol. 11211","doi-asserted-by":"publisher","first-page":"833","DOI":"10.1007\/978-3-030-01234-2_49","volume-title":"Computer Vision \u2014 ECCV 2018","author":"L C Chen","year":"2018","unstructured":"Chen, L. C.; Zhu, Y. K.; Papandreou, G.; Schroff, F.; Adam, H. Encoder-decoder with atrous separable convolution for semantic image segmentation. In: Computer Vision \u2014 ECCV 2018. Lecture Notes in Computer Science, Vol. 11211. Ferrari, V.; Hebert, M.; Sminchisescu, C.; Weiss, Y. Eds. Springer Cham, 833\u2013851, 2018."},{"key":"325_CR14","unstructured":"Chen, L. C.; Papandreou, G.; Schroff, F.; Adam, H. Rethinking atrous convolution for semantic image segmentation. arXiv preprint arXiv:1706.05587, 2017."},{"issue":"5","key":"325_CR15","doi-asserted-by":"publisher","first-page":"811","DOI":"10.1109\/LGRS.2020.2988032","volume":"18","author":"Y Liu","year":"2021","unstructured":"Liu, Y.; Pang, C.; Zhan, Z. Q.; Zhang, X. M.; Yang, X. Building change detection for remote sensing images using a dual-task constrained deep Siamese convolutional network model. IEEE Geoscience and Remote Sensing Letters Vol. 18, No. 5, 811\u2013815, 2021.","journal-title":"IEEE Geoscience and Remote Sensing Letters"},{"issue":"2","key":"325_CR16","doi-asserted-by":"publisher","first-page":"205","DOI":"10.3390\/rs12020205","volume":"12","author":"M Y Wang","year":"2020","unstructured":"Wang, M. Y.; Tan, K.; Jia, X. P.; Wang, X.; Chen, Y. A deep Siamese network with hybrid convolutional feature extraction module for change detection based on multi-sensor remote sensing images. Remote Sensing Vol. 12, No. 2, 205, 2020.","journal-title":"Remote Sensing"},{"key":"325_CR17","unstructured":"Xu, J. Z.; Lu, W. H.; Li, Z. B.; Khaitan, P.; Zaytseva, V. Building damage detection in satellite imagery using convolutional neural networks. arXiv preprint arXiv:1910.06444, 2019."},{"key":"325_CR18","doi-asserted-by":"crossref","unstructured":"Zhu, X. Y.; Liang, J. W.; Hauptmann, A. MSNet: A multilevel instance segmentation network for natural disaster damage assessment in aerial videos. In: Proceedings of the IEEE Winter Conference on Applications of Computer Vision, 2022\u20132031, 2021.","DOI":"10.1109\/WACV48630.2021.00207"},{"issue":"11","key":"325_CR19","doi-asserted-by":"publisher","first-page":"1689","DOI":"10.3390\/rs10111689","volume":"10","author":"M Ji","year":"2018","unstructured":"Ji, M.; Liu, L. F.; Buchroithner, M. Identifying collapsed buildings using post-earthquake satellite imagery and convolutional neural networks: A case study of the 2010 Haiti earthquake. Remote Sensing Vol. 10, No. 11, 1689, 2018","journal-title":"Remote Sensing"},{"key":"325_CR20","unstructured":"Gupta, R.; Goodman, B.; Patel, N.; Hosfelt, R.; Sajeev, S.; Heim, E.; Doshi, J.; Lucas, K.; Choset, H.; Gaston, M. Creating xBD: A dataset for assessing building damage from satellite imagery. In: Proceedings of the IEEE Conference on Computer Vision and Pattern Recognition Workshops, 10\u201317, 2019."},{"issue":"5","key":"325_CR21","doi-asserted-by":"publisher","first-page":"905","DOI":"10.3390\/rs13050905","volume":"13","author":"C Y Wu","year":"2021","unstructured":"Wu, C. Y.; Zhang, F.; Xia, J. S.; Xu, Y. C.; Li, G. Q.; Xie, J. B.; Du, Z.; Liu, R. Building damage detection using U-net with attention mechanism from pre- and post-disaster remote sensing datasets. Remote Sensing Vol. 13, No. 5, 905, 2021.","journal-title":"Remote Sensing"},{"issue":"5","key":"325_CR22","doi-asserted-by":"publisher","first-page":"2664","DOI":"10.1109\/TGRS.2014.2363548","volume":"53","author":"C Marin","year":"2015","unstructured":"Marin, C.; Bovolo, F.; Bruzzone, L. Building change detection in multitemporal very high resolution SAR images. IEEE Transactions on Geoscience and Remote Sensing Vol. 53, No. 5, 2664\u20132682, 2015.","journal-title":"IEEE Transactions on Geoscience and Remote Sensing"},{"issue":"4","key":"325_CR23","doi-asserted-by":"publisher","first-page":"884","DOI":"10.1109\/TCYB.2016.2531179","volume":"47","author":"X Q Lu","year":"2017","unstructured":"Lu, X. Q.; Yuan, Y.; Zheng, X. T. Joint dictionary learning for multispectral change detection. IEEE Transactions on Cybernetics Vol. 47, No. 4, 884\u2013897, 2017.","journal-title":"IEEE Transactions on Cybernetics"},{"issue":"13","key":"325_CR24","doi-asserted-by":"publisher","first-page":"1525","DOI":"10.3390\/rs11131525","volume":"11","author":"J J Gapper","year":"2019","unstructured":"Gapper, J. J.; El-Askary, H.; Linstead, E.; Piechota, T. Coral reef change detection in remote Pacific Islands using support vector machine classifiers. Remote Sensing Vol. 11, No. 13, 1525, 2019.","journal-title":"Remote Sensing"},{"issue":"12","key":"325_CR25","doi-asserted-by":"publisher","first-page":"3978","DOI":"10.1109\/TGRS.2007.907109","volume":"45","author":"P Zhong","year":"2007","unstructured":"Zhong, P.; Wang, R. S. A multiple conditional random fields ensemble model for urban area detection in remote sensing optical images. IEEE Transactions on Geoscience and Remote Sensing Vol. 45, No. 12, 3978\u20133988, 2007.","journal-title":"IEEE Transactions on Geoscience and Remote Sensing"},{"issue":"2","key":"325_CR26","doi-asserted-by":"publisher","first-page":"125","DOI":"10.1016\/j.isprsjprs.2006.09.004","volume":"61","author":"H Nemmour","year":"2006","unstructured":"Nemmour, H.; Chibani, Y. Multiple support vector machines for land cover change detection: An application for mapping urban extensions. ISPRS Journal of Photogrammetry and Remote Sensing Vol. 61, No. 2, 125\u2013133, 2006.","journal-title":"ISPRS Journal of Photogrammetry and Remote Sensing"},{"key":"325_CR27","doi-asserted-by":"publisher","first-page":"55","DOI":"10.1109\/TIP.2020.3031173","volume":"30","author":"Y J Lei","year":"2021","unstructured":"Lei, Y. J.; Peng, D.; Zhang, P. P.; Ke, Q. H.; Li, H. F. Hierarchical paired channel fusion network for street scene change detection. IEEE Transactions on Image Processing Vol. 30, 55\u201367, 2021.","journal-title":"IEEE Transactions on Image Processing"},{"key":"325_CR28","doi-asserted-by":"crossref","unstructured":"Caye Daudt, R.; Le Saux, B.; Boulch, A. Fully convolutional Siamese networks for change detection. In: Proceedings of the 25th IEEE International Conference on Image Processing, 4063\u20134067, 2018.","DOI":"10.1109\/ICIP.2018.8451652"},{"key":"325_CR29","doi-asserted-by":"crossref","unstructured":"Daudt, R. C.; Le Saux, B.; Boulch, A.; Gousseau, Y. Guided anisotropic diffusion and iterative learning for weakly supervised change detection. In: Proceedings of the IEEE\/CVF Conference on Computer Vision and Pattern Recognition Workshops, 1461\u20131470, 2019.","DOI":"10.1109\/CVPRW.2019.00187"},{"key":"325_CR30","doi-asserted-by":"crossref","unstructured":"Papadomanolaki, M.; Verma, S.; Vakalopoulou, M.; Gupta, S.; Karantzalos, K. Detecting urban changes with recurrent neural networks from multitemporal sentinel-2 data. In: Proceedings of the IEEE International Geoscience and Remote Sensing Symposium, 214\u2013217, 2019.","DOI":"10.1109\/IGARSS.2019.8900330"},{"issue":"11","key":"325_CR31","doi-asserted-by":"publisher","first-page":"12084","DOI":"10.1109\/TCYB.2021.3086884","volume":"52","author":"C Wu","year":"2022","unstructured":"Wu, C.; Chen, H.; Du, B.; Zhang, L. P. Unsupervised change detection in multitemporal VHR images based on deep kernel PCA convolutional mapping network. IEEE Transactions on Cybernetics Vol. 52, No. 11, 12084\u201312098, 2022.","journal-title":"IEEE Transactions on Cybernetics"},{"key":"325_CR32","doi-asserted-by":"publisher","unstructured":"Li, L. Y.; Yan, J. C.; Wen, Q. S.; Jin, Y. H.; Yang, X. K. Learning robust deep state space for unsupervised anomaly detection in contaminated time-series. IEEE Transactions on Knowledge and Data Engineering DOI: https:\/\/doi.org\/10.1109\/TKDE.2022.3171562, 2022.","DOI":"10.1109\/TKDE.2022.3171562"},{"issue":"2","key":"325_CR33","doi-asserted-by":"publisher","first-page":"89","DOI":"10.5194\/isprs-annals-IV-2-89-2018","volume":"IV","author":"D Duarte","year":"2018","unstructured":"Duarte, D.; Nex, F.; Kerle, N.; Vosselman, G. Satellite image classification of building damages using airborne and satellite image samples in a deep learning approach. ISPRS Annals of the Photogrammetry, Remote Sensing and Spatial Information Sciences Vol. IV, No. 2, 89\u201396, 2018.","journal-title":"ISPRS Annals of the Photogrammetry, Remote Sensing and Spatial Information Sciences"},{"issue":"1","key":"325_CR34","doi-asserted-by":"publisher","first-page":"702","DOI":"10.1609\/aaai.v33i01.3301702","volume":"33","author":"T G J Rudner","year":"2019","unstructured":"Rudner, T. G. J.; Ru\u00dfwurm, M.; Fil, J.; Pelich, R.; Bischke, B.; Kopa\u010dkov\u00e1, V.; Bilinski, P. Multi3Net: Segmenting flooded buildings via fusion of multiresolution, multisensor, and multitemporal satellite imagery. Proceedings of the AAAI Conference on Artificial Intelligence Vol. 33, No. 1, 702\u2013709, 2019.","journal-title":"Proceedings of the AAAI Conference on Artificial Intelligence"},{"key":"325_CR35","series-title":"Lecture Notes in Computer Science, Vol. 9351","doi-asserted-by":"publisher","first-page":"234","DOI":"10.1007\/978-3-319-24574-4_28","volume-title":"Medical Image Computing and Computer-Assisted Intervention \u2014 MICCAI 2015","author":"O Ronneberger","year":"2015","unstructured":"Ronneberger, O.; Fischer, P.; Brox, T. U-Net: Convolutional networks for biomedical image segmentation. In: Medical Image Computing and Computer-Assisted Intervention \u2014 MICCAI 2015. Lecture Notes in Computer Science, Vol. 9351. Navab, N.; Hornegger, J.; Wells, W.; Frangi, A. Eds. Springer Cham, 234\u2013241, 2015."},{"key":"325_CR36","doi-asserted-by":"crossref","unstructured":"He, K. M.; Zhang, X. Y.; Ren, S. Q.; Sun, J. Deep residual learning for image recognition. In: Proceedings of the IEEE Conference on Computer Vision and Pattern Recognition, 770\u2013778, 2016.","DOI":"10.1109\/CVPR.2016.90"},{"key":"325_CR37","unstructured":"Weber, E.; Kan\u00e9, H. Building disaster damage assessment in satellite imagery with multi-temporal fusion. In: Proceedings of the International Conference on Learning Representations Workshop, 2020."},{"key":"325_CR38","doi-asserted-by":"crossref","unstructured":"He, K. M.; Gkioxari, G.; Doll\u00e1r, P.; Girshick, R. Mask R-CNN. In: Proceedings of the IEEE International Conference on Computer Vision, 2980\u20132988, 2017.","DOI":"10.1109\/ICCV.2017.322"},{"key":"325_CR39","doi-asserted-by":"crossref","unstructured":"Lin, T. Y.; Doll\u00e1r, P.; Girshick, R.; He, K. M.; Hariharan, B.; Belongie, S. Feature pyramid networks for object detection. In: Proceedings of the IEEE Conference on Computer Vision and Pattern Recognition, 936\u2013944, 2017.","DOI":"10.1109\/CVPR.2017.106"},{"key":"325_CR40","doi-asserted-by":"crossref","unstructured":"Shen, Y.; Zhu, S. J.; Yang, T.; Chen, C.; Pan, D. L.; Chen, J. Y.; Xiao, L.; Du, Q. BDANet: Multiscale convolutional neural network with cross-directional attention for building damage assessment from satellite images. IEEE Transactions on Geoscience and Remote Sensing Vol. 60, Article No. 5402114, 2022.","DOI":"10.1109\/TGRS.2021.3080580"},{"issue":"4","key":"325_CR41","doi-asserted-by":"publisher","first-page":"269","DOI":"10.1016\/S0924-2716(02)00062-X","volume":"56","author":"H R\u00fcther","year":"2002","unstructured":"R\u00fcther, H.; Martine, H. M.; Mtalo, E. G. Application of snakes and dynamic programming optimisation technique in modeling of buildings in informal settlement areas. ISPRS Journal of Photogrammetry and Remote Sensing Vol. 56, No. 4, 269\u2013282, 2002.","journal-title":"ISPRS Journal of Photogrammetry and Remote Sensing"},{"issue":"6","key":"325_CR42","doi-asserted-by":"publisher","first-page":"1661","DOI":"10.1109\/TGRS.2006.869980","volume":"44","author":"V J D Tsai","year":"2006","unstructured":"Tsai, V. J. D. A comparative study on shadow compensation of color aerial images in invariant color models. IEEE Transactions on Geoscience and Remote Sensing Vol. 44, No. 6, 1661\u20131671, 2006.","journal-title":"IEEE Transactions on Geoscience and Remote Sensing"},{"key":"325_CR43","doi-asserted-by":"crossref","unstructured":"Sirmacek, B.; Unsalan, C. Building detection from aerial images using invariant color features and shadow information. In: Proceedings of the 23rd International Symposium on Computer and Information Sciences, 1\u20135, 2008.","DOI":"10.1109\/ISCIS.2008.4717854"},{"key":"325_CR44","doi-asserted-by":"crossref","unstructured":"Long, J.; Shelhamer, E.; Darrell, T. Fully convolutional networks for semantic segmentation. In: Proceedings of the IEEE Conference on Computer Vision and Pattern Recognition, 3431\u20133440, 2015.","DOI":"10.1109\/CVPR.2015.7298965"},{"issue":"3","key":"325_CR45","doi-asserted-by":"publisher","first-page":"1120","DOI":"10.1109\/TCYB.2018.2885062","volume":"50","author":"D Lin","year":"2020","unstructured":"Lin, D.; Zhang, R. M.; Ji, Y. F.; Li, P.; Huang, H. SCN: Switchable context network for semantic segmentation of RGB-D images. IEEE Transactions on Cybernetics Vol. 50, No. 3, 1120\u20131131, 2020.","journal-title":"IEEE Transactions on Cybernetics"},{"issue":"4","key":"325_CR46","doi-asserted-by":"publisher","first-page":"1731","DOI":"10.1109\/TCYB.2020.2969046","volume":"51","author":"J Yu","year":"2021","unstructured":"Yu, J.; Yao, J. H.; Zhang, J.; Yu, Z.; Tao, D. C. SPRNet: Single-pixel reconstruction for one-stage instance segmentation. IEEE Transactions on Cybernetics Vol. 51, No. 4, 1731\u20131742, 2021.","journal-title":"IEEE Transactions on Cybernetics"},{"issue":"12","key":"325_CR47","doi-asserted-by":"publisher","first-page":"12661","DOI":"10.1109\/TCYB.2021.3085856","volume":"52","author":"B Bovcon","year":"2022","unstructured":"Bovcon, B.; Kristan, M. WaSR\u2014A water segmentation and refinement maritime obstacle detection network. IEEE Transactions on Cybernetics Vol. 52, No. 12, 12661\u201312674, 2022.","journal-title":"IEEE Transactions on Cybernetics"},{"issue":"2","key":"325_CR48","doi-asserted-by":"publisher","first-page":"2384","DOI":"10.1109\/TPAMI.2022.3166956","volume":"45","author":"X Yang","year":"2023","unstructured":"Yang, X.; Yan, J. C.; Liao, W. L.; Yang, X. K.; Tang, J.; He, T. SCRDet: Detecting small, cluttered and rotated objects via instance-level feature denoising and rotation loss smoothing. IEEE Transactions on Pattern Analysis and Machine Intelligence Vol. 45, No. 2, 2384\u20132399, 2023.","journal-title":"IEEE Transactions on Pattern Analysis and Machine Intelligence"},{"issue":"5","key":"325_CR49","doi-asserted-by":"publisher","first-page":"1340","DOI":"10.1007\/s11263-022-01593-w","volume":"130","author":"X Yang","year":"2022","unstructured":"Yang, X.; Yan, J. C. On the arbitrary-oriented object detection: Classification based approaches revisited. International Journal of Computer Vision Vol. 130, No. 5, 1340\u20131365, 2022.","journal-title":"International Journal of Computer Vision"},{"key":"325_CR50","unstructured":"Van Etten, A.; Lindenbaum, D.; Bacastow, T. M. SpaceNet: A remote sensing dataset and challenge series. arXiv preprint arXiv:1807.01232, 2018."},{"key":"325_CR51","doi-asserted-by":"crossref","unstructured":"Demir, I.; Koperski, K.; Lindenbaum, D.; Pang, G.; Huang, J.; Basu, S.; Hughes, F.; Tuia, D.; Raska, R. DeepGlobe 2018: A challenge to parse the earth through satellite images. In: Proceedings of the IEEE\/CVF Conference on Computer Vision and Pattern Recognition Workshops, 172\u201317209, 2018.","DOI":"10.1109\/CVPRW.2018.00031"},{"key":"325_CR52","doi-asserted-by":"crossref","unstructured":"Hamaguchi, R.; Hikosaka, S. Building detection from satellite imagery using ensemble of size-specific detectors. In: Proceedings of the IEEE\/CVF Conference on Computer Vision and Pattern Recognition Workshops, 223\u20132234, 2018.","DOI":"10.1109\/CVPRW.2018.00041"},{"key":"325_CR53","doi-asserted-by":"crossref","unstructured":"Golovanov, S.; Kurbanov, R.; Artamonov, A.; Davydow, A.; Nikolenko, S. Building detection from satellite imagery using a composite loss function. In: Proceedings of the IEEE\/CVF Conference on Computer Vision and Pattern Recognition Workshops, 219\u2013222, 2018.","DOI":"10.1109\/CVPRW.2018.00040"},{"key":"325_CR54","doi-asserted-by":"crossref","unstructured":"Chaurasia, A.; Culurciello, E. LinkNet: Exploiting encoder representations for efficient semantic segmentation. In: Proceedings of the IEEE Visual Communications and Image Processing, 1\u20134, 2018.","DOI":"10.1109\/VCIP.2017.8305148"},{"issue":"11","key":"325_CR55","doi-asserted-by":"publisher","first-page":"2793","DOI":"10.1109\/TPAMI.2017.2750680","volume":"40","author":"J Y Yuan","year":"2018","unstructured":"Yuan, J. Y. Learning building extraction in aerial scenes with convolutional networks. IEEE Transactions on Pattern Analysis and Machine Intelligence Vol. 40, No. 11, 2793\u20132798, 2018.","journal-title":"IEEE Transactions on Pattern Analysis and Machine Intelligence"},{"issue":"5","key":"325_CR56","doi-asserted-by":"publisher","first-page":"446","DOI":"10.3390\/rs9050446","volume":"9","author":"H Z Wang","year":"2017","unstructured":"Wang, H. Z.; Wang, Y.; Zhang, Q.; Xiang, S. M.; Pan, C. H. Gated convolutional neural network for semantic segmentation in high-resolution images. Remote Sensing Vol. 9, No. 5, 446, 2017.","journal-title":"Remote Sensing"},{"issue":"8","key":"325_CR57","doi-asserted-by":"publisher","first-page":"917","DOI":"10.3390\/rs11080917","volume":"11","author":"X R Pan","year":"2019","unstructured":"Pan, X. R.; Yang, F.; Gao, L. R.; Chen, Z. C.; Zhang, B.; Fan, H. R.; Ren, J. Building extraction from high-resolution aerial imagery using a generative adversarial network with spatial and channel attention mechanisms. Remote Sensing Vol. 11, No. 8, 917, 2019.","journal-title":"Remote Sensing"},{"key":"325_CR58","doi-asserted-by":"crossref","unstructured":"Zhao, K.; Kang, J.; Jung, J.; Sohn, G. Building extraction from satellite images using mask R-CNN with building boundary regularization. In: Proceedings of the IEEE\/CVF Conference on Computer Vision and Pattern Recognition Workshops, 242\u2013246, 2018.","DOI":"10.1109\/CVPRW.2018.00045"},{"key":"325_CR59","unstructured":"Vaswani, A.; Shazeer, N.; Parmar, N.; Uszkoreit, J.; Jones, L.; Gomez, A. N.; Kaiser, L; Polosukhin, I. Attention is all you need. In: Proceedings of the 31st International Conference on Neural Information Processing Systems, 6000\u20136010, 2017."},{"key":"325_CR60","doi-asserted-by":"crossref","unstructured":"Wang, X. L.; Girshick, R.; Gupta, A.; He, K. M. Non-local neural networks. In: Proceedings of the IEEE\/CVF Conference on Computer Vision and Pattern Recognition, 7794\u20137803, 2018.","DOI":"10.1109\/CVPR.2018.00813"},{"key":"325_CR61","doi-asserted-by":"crossref","unstructured":"Huang, Z. L.; Wang, X. G.; Huang, L. C.; Huang, C.; Wei, Y. C.; Liu, W. Y. CCNet: Criss-cross attention for semantic segmentation. In: Proceedings of the IEEE\/CVF International Conference on Computer Vision, 603\u2013612, 2019.","DOI":"10.1109\/ICCV.2019.00069"},{"issue":"8","key":"325_CR62","first-page":"4374","volume":"44","author":"J Mei","year":"2022","unstructured":"Mei, J.; Cheng, M. M.; Xu, G.; Wan, L. R.; Zhang, H. SANet: A slice-aware network for pulmonary nodule detection. IEEE Transactions on Pattern Analysis and Machine Intelligence Vol. 44, No. 8, 4374\u20134387, 2022.","journal-title":"IEEE Transactions on Pattern Analysis and Machine Intelligence"},{"key":"325_CR63","doi-asserted-by":"crossref","unstructured":"Bello, I.; Zoph, B.; Le, Q.; Vaswani, A.; Shlens, J. Attention augmented convolutional networks. In: Proceedings of the IEEE\/CVF International Conference on Computer Vision, 3285\u20133294, 2019.","DOI":"10.1109\/ICCV.2019.00338"},{"key":"325_CR64","unstructured":"Ramachandran, P.; Parmar, N.; Vaswani, A.; Bello, I.; Levskaya, A.; Shlens, J. Stand-alone self-attention in vision models. In: Proceedings of the 33rd International Conference on Neural Information Processing Systems, Article No. 7, 68\u201380, 2019."},{"key":"325_CR65","doi-asserted-by":"crossref","unstructured":"Zhao, H. S.; Jia, J. Y.; Koltun, V. Exploring self-attention for image recognition. In: Proceedings of the IEEE\/CVF Conference on Computer Vision and Pattern Recognition, 10073\u201310082, 2020.","DOI":"10.1109\/CVPR42600.2020.01009"},{"key":"325_CR66","series-title":"Lecture Notes in Computer Science, Vol. 12349","first-page":"108","volume-title":"Computer Vision \u2014 ECCV 2020","author":"H Wang","year":"2020","unstructured":"Wang, H.; Zhu, Y.; Green, B.; Adam, H.; Yuille, A.; Chen, L. C. Axial-DeepLab: Stand-alone axial-attention for panoptic segmentation. In: Computer Vision \u2014 ECCV 2020. Lecture Notes in Computer Science, Vol. 12349. Vedaldi, A.; Bischof, H.; Brox, T.; Frahm, J. M. Eds. Springer Cham, 108\u2013126, 2020."},{"key":"325_CR67","doi-asserted-by":"crossref","unstructured":"Wang, Y.; Peng, J. J.; Wang, H. B.; Wang, M. Progressive learning with multi-scale attention network for cross-domain vehicle re-identification. Science China Information Sciences Vol. 65, No. 6, Article No. 160103, 2022.","DOI":"10.1007\/s11432-021-3383-y"},{"issue":"3","key":"325_CR68","doi-asserted-by":"publisher","first-page":"331","DOI":"10.1007\/s41095-022-0271-y","volume":"8","author":"M H Guo","year":"2022","unstructured":"Guo, M. H.; Xu, T. X.; Liu, J. J.; Liu, Z. N.; Jiang, P. T.; Mu, T. J.; Zhang, S. H.; Martin, R. R.; Cheng, M. M.; Hu, S. M. Attention mechanisms in computer vision: A survey. Computational Visual Media Vol. 8, No. 3, 331\u2013368, 2022.","journal-title":"Computational Visual Media"},{"key":"325_CR69","unstructured":"Dosovitskiy, A.; Beyer, L.; Kolesnikov, A.; Weissenborn, D.; Zhai, X.; Unterthiner, T.; Dehghani, M.; Minderer, M.; Heigold, G.; Gelly, S.; et al. An Image is worth 16\u00d716 words: Transformers for image recognition at scale. In: Proceedings of the 9th International Conference on Learning Representations, 2021."},{"issue":"1","key":"325_CR70","doi-asserted-by":"publisher","first-page":"33","DOI":"10.1007\/s41095-021-0247-3","volume":"8","author":"Y F Xu","year":"2022","unstructured":"Xu, Y. F.; Wei, H. P.; Lin, M. X.; Deng, Y. Y.; Sheng, K. K.; Zhang, M. D.; Tang, F.; Dong, W.; Huang, F.; Xu, C. Transformers in computational visual media: A survey. Computational Visual Media Vol. 8, No. 1, 33\u201362, 2022.","journal-title":"Computational Visual Media"},{"key":"325_CR71","doi-asserted-by":"publisher","first-page":"24","DOI":"10.1016\/j.compmedimag.2019.04.005","volume":"75","author":"S A Taghanaki","year":"2019","unstructured":"Taghanaki, S. A.; Zheng, Y. F.; Kevin Zhou, S.; Georgescu, B.; Sharma, P.; Xu, D. G.; Comaniciu, D.; Hamarneh, G. Combo loss: Handling input and output imbalance in multi-organ segmentation. Computerized Medical Imaging and Graphics Vol. 75, 24\u201333, 2019.","journal-title":"Computerized Medical Imaging and Graphics"},{"key":"325_CR72","doi-asserted-by":"crossref","unstructured":"Lin, T. Y.; Goyal, P.; Girshick, R.; He, K. M.; Doll\u00e1r, P. Focal loss for dense object detection. In: Proceedings of the IEEE International Conference on Computer Vision, 2999\u20133007, 2017.","DOI":"10.1109\/ICCV.2017.324"},{"key":"325_CR73","doi-asserted-by":"crossref","unstructured":"Milletari, F.; Navab, N.; Ahmadi, S. A. V-net: Fully convolutional neural networks for volumetric medical image segmentation. In: Proceedings of the 4th International Conference on 3D Vision, 565\u2013571, 2016.","DOI":"10.1109\/3DV.2016.79"},{"key":"325_CR74","doi-asserted-by":"crossref","unstructured":"Hu, J.; Shen, L.; Sun, G. Squeeze-and-excitation networks. In: Proceedings of the IEEE\/CVF Conference on Computer Vision and Pattern Recognition, 7132\u20137141, 2018.","DOI":"10.1109\/CVPR.2018.00745"},{"key":"325_CR75","doi-asserted-by":"crossref","unstructured":"Chollet, F. Xception: Deep learning with depthwise separable convolutions. In: Proceedings of the IEEE Conference on Computer Vision and Pattern Recognition, 1800\u20131807, 2017.","DOI":"10.1109\/CVPR.2017.195"},{"key":"325_CR76","doi-asserted-by":"crossref","unstructured":"Xie, S. N.; Girshick, R.; Doll\u00e1r, P.; Tu, Z. W.; He, K. M. Aggregated residual transformations for deep neural networks. In: Proceedings of the IEEE Conference on Computer Vision and Pattern Recognition, 5987\u20135995, 2017.","DOI":"10.1109\/CVPR.2017.634"},{"key":"325_CR77","series-title":"Lecture Notes in Computer Science, Vol. 11217","doi-asserted-by":"publisher","first-page":"3","DOI":"10.1007\/978-3-030-01261-8_1","volume-title":"Computer Vision \u2014 ECCV 2018","author":"Y X Wu","year":"2018","unstructured":"Wu, Y. X.; He, K. M. Group normalization. In: Computer Vision \u2014 ECCV 2018. Lecture Notes in Computer Science, Vol. 11217. Ferrari, V.; Hebert, M.; Sminchisescu, C.; Weiss, Y. Eds. Springer Cham, 3\u201319, 2018."},{"key":"325_CR78","unstructured":"Paszke, A.; Gross, S.; Massa, F.; Lerer, A.; Bradbury, J.; Chanan, G.; Killeen, T.; Lin, Z.; Gimelshein, N.; Antiga, L.; et al. PyTorch: An imperative style, high-performance deep learning library. In: Proceedings of the 33rd International Conference on Neural Information Processing Systems, Article No. 721, 8026\u20138037, 2019."},{"issue":"10","key":"325_CR79","doi-asserted-by":"publisher","first-page":"3349","DOI":"10.1109\/TPAMI.2020.2983686","volume":"43","author":"J D Wang","year":"2021","unstructured":"Wang, J. D.; Sun, K.; Cheng, T. H.; Jiang, B. R.; Deng, C. R.; Zhao, Y.; Liu, D.; Mu, Y.; Tan, M.; Wang, X.; et al. Deep high-resolution representation learning for visual recognition. IEEE Transactions on Pattern Analysis and Machine Intelligence Vol. 43, No. 10, 3349\u20133364, 2021.","journal-title":"IEEE Transactions on Pattern Analysis and Machine Intelligence"},{"key":"325_CR80","doi-asserted-by":"crossref","unstructured":"Gupta, R.; Shah, M. RescueNet: Joint building segmentation and damage assessment from satellite imagery. In: Proceedings of the 25th International Conference on Pattern Recognition, 4405\u20134411, 2021.","DOI":"10.1109\/ICPR48806.2021.9412295"},{"key":"325_CR81","doi-asserted-by":"crossref","unstructured":"Deng, J.; Dong, W.; Socher, R.; Li, L. J.; Kai, L.; Li, F. F. ImageNet: A large-scale hierarchical image database. In: Proceedings of the IEEE Conference on Computer Vision and Pattern Recognition, 248\u2013255, 2009.","DOI":"10.1109\/CVPR.2009.5206848"},{"key":"325_CR82","unstructured":"Chen, Y.; Li, J.; Xiao, H.; Jin, X.; Yan, S.; Feng, J. Dual path networks. In: Proceedings of the 31st International Conference on Neural Information Processing Systems, 4470\u20134478, 2017."},{"key":"325_CR83","unstructured":"Guo, M. H.; Lu, C. Z.; Liu, Z. N.; Cheng, M. M.; Hu, S. M. Visual attention network. arXiv preprint arXiv:2202.09741, 2022."}],"container-title":["Computational Visual Media"],"original-title":[],"link":[{"URL":"https:\/\/link.springer.com\/content\/pdf\/10.1007\/s41095-022-0325-1.pdf","content-type":"application\/pdf","content-version":"vor","intended-application":"text-mining"},{"URL":"https:\/\/link.springer.com\/article\/10.1007\/s41095-022-0325-1\/fulltext.html","content-type":"text\/html","content-version":"vor","intended-application":"text-mining"},{"URL":"https:\/\/link.springer.com\/content\/pdf\/10.1007\/s41095-022-0325-1.pdf","content-type":"application\/pdf","content-version":"vor","intended-application":"similarity-checking"},{"URL":"http:\/\/xplorestaging.ieee.org\/ielx8\/10750449\/10897694\/10897705.pdf?arnumber=10897705","content-type":"unspecified","content-version":"vor","intended-application":"similarity-checking"}],"deposited":{"date-parts":[[2025,11,5]],"date-time":"2025-11-05T18:38:54Z","timestamp":1762367934000},"score":1,"resource":{"primary":{"URL":"https:\/\/ieeexplore.ieee.org\/document\/10897705\/"}},"subtitle":[],"short-title":[],"issued":{"date-parts":[[2023,9]]},"references-count":83,"journal-issue":{"issue":"3"},"URL":"https:\/\/doi.org\/10.1007\/s41095-022-0325-1","relation":{},"ISSN":["2096-0662","2096-0433"],"issn-type":[{"value":"2096-0662","type":"electronic"},{"value":"2096-0433","type":"print"}],"subject":[],"published":{"date-parts":[[2023,9]]},"assertion":[{"value":"13 April 2022","order":1,"name":"received","label":"Received","group":{"name":"ArticleHistory","label":"Article History"}},{"value":"18 November 2022","order":2,"name":"accepted","label":"Accepted","group":{"name":"ArticleHistory","label":"Article History"}},{"value":"8 March 2023","order":3,"name":"first_online","label":"First Online","group":{"name":"ArticleHistory","label":"Article History"}},{"value":"The authors have no competing interests to declare that are relevant to the content of this article.","order":1,"name":"Ethics","group":{"name":"EthicsHeading","label":"Declaration of competing interest"}}]}}