{"status":"ok","message-type":"work","message-version":"1.0.0","message":{"indexed":{"date-parts":[[2026,3,9]],"date-time":"2026-03-09T12:52:09Z","timestamp":1773060729023,"version":"3.50.1"},"reference-count":40,"publisher":"Springer Science and Business Media LLC","issue":"6","license":[{"start":{"date-parts":[[2021,8,2]],"date-time":"2021-08-02T00:00:00Z","timestamp":1627862400000},"content-version":"tdm","delay-in-days":0,"URL":"https:\/\/www.springer.com\/tdm"},{"start":{"date-parts":[[2021,8,2]],"date-time":"2021-08-02T00:00:00Z","timestamp":1627862400000},"content-version":"vor","delay-in-days":0,"URL":"https:\/\/www.springer.com\/tdm"}],"funder":[{"name":"National Key R and D Program of China","award":["No.2018YFB1305200"],"award-info":[{"award-number":["No.2018YFB1305200"]}]},{"name":"Science Technology Department of Zhejiang Province","award":["No.LGG19F020010"],"award-info":[{"award-number":["No.LGG19F020010"]}]}],"content-domain":{"domain":["link.springer.com"],"crossmark-restriction":false},"short-container-title":["Neural Process Lett"],"published-print":{"date-parts":[[2021,12]]},"DOI":"10.1007\/s11063-021-10592-w","type":"journal-article","created":{"date-parts":[[2021,8,2]],"date-time":"2021-08-02T17:02:45Z","timestamp":1627923765000},"page":"4257-4277","update-policy":"https:\/\/doi.org\/10.1007\/springer_crossmark_policy","source":"Crossref","is-referenced-by-count":27,"title":["CT-UNet: Context-Transfer-UNet for Building Segmentation in Remote Sensing Images"],"prefix":"10.1007","volume":"53","author":[{"given":"Sheng","family":"Liu","sequence":"first","affiliation":[]},{"given":"Huanran","family":"Ye","sequence":"additional","affiliation":[]},{"given":"Kun","family":"Jin","sequence":"additional","affiliation":[]},{"given":"Haohao","family":"Cheng","sequence":"additional","affiliation":[]}],"member":"297","published-online":{"date-parts":[[2021,8,2]]},"reference":[{"key":"10592_CR1","doi-asserted-by":"crossref","unstructured":"Adiba A, Hajji H, Maatouk M (2019) Transfer learning and u-net for buildings segmentation. In: Proceedings of the new challenges in data sciences: acts of the second conference of the Moroccan classification society, ACM, p\u00a014","DOI":"10.1145\/3314074.3314088"},{"issue":"5","key":"10592_CR2","doi-asserted-by":"publisher","first-page":"3023","DOI":"10.1109\/TGRS.2013.2268736","volume":"52","author":"E Aptoula","year":"2013","unstructured":"Aptoula E (2013) Remote sensing image retrieval with global morphological texture descriptors. IEEE Trans Geosci Remote Sens 52(5):3023\u20133034","journal-title":"IEEE Trans Geosci Remote Sens"},{"issue":"12","key":"10592_CR3","doi-asserted-by":"publisher","first-page":"2481","DOI":"10.1109\/TPAMI.2016.2644615","volume":"39","author":"V Badrinarayanan","year":"2017","unstructured":"Badrinarayanan V, Kendall A, Cipolla R (2017) Segnet: A deep convolutional encoder\u2013decoder architecture for image segmentation. IEEE Trans Pattern Anal Mach Intell 39(12):2481\u20132495","journal-title":"IEEE Trans Pattern Anal Mach Intell"},{"key":"10592_CR4","unstructured":"Bahdanau D, Cho K, Bengio Y (2014) Neural machine translation by jointly learning to align and translate. https:\/\/arxiv.org\/abs\/1409.0473"},{"key":"10592_CR5","doi-asserted-by":"crossref","unstructured":"Bischke B, Helber P, Folz J, Borth D, Dengel A (2019) Multi-task learning for segmentation of building footprints with deep neural networks. In: 2019 IEEE international conference on image processing (ICIP), IEEE, pp 1480\u20131484","DOI":"10.1109\/ICIP.2019.8803050"},{"key":"10592_CR6","doi-asserted-by":"crossref","unstructured":"Fourure D, Emonet R, Fromont E, Muselet D, Tremeau A, Wolf C (2017) Residual conv-deconv grid network for semantic segmentation. https:\/\/arxiv.org\/abs\/1707.07958","DOI":"10.5244\/C.31.181"},{"key":"10592_CR7","unstructured":"Glorot X, Bordes A, Bengio Y (2011) Deep sparse rectifier neural networks. In: Proceedings of the fourteenth international conference on artificial intelligence and statistics, pp 315\u2013323"},{"key":"10592_CR8","doi-asserted-by":"crossref","unstructured":"He K, Zhang X, Ren S, Sun J (2016) Deep residual learning for image recognition. In: Proceedings of the IEEE conference on computer vision and pattern recognition, pp 770\u2013778","DOI":"10.1109\/CVPR.2016.90"},{"issue":"140305","key":"10592_CR9","doi-asserted-by":"publisher","first-page":"1","DOI":"10.1016\/j.ins.2020.05.045","volume":"63","author":"N He","year":"2020","unstructured":"He N, Fang L, Plaza A (2020) Hybrid first and second order attention unet for building segmentation in remote sensing images. Inf Sci 63(140305):1\u2013140305","journal-title":"Inf Sci"},{"key":"10592_CR10","doi-asserted-by":"crossref","unstructured":"Hu S, Ning Q, Chen B, Lei Y, Zhou X, Yan H, Zhao C, Tang T, Hu R (2020) Segmentation of aerial image with multi-scale feature and attention model. In: Artificial Intelligence in China, Springer, pp 58\u201366","DOI":"10.1007\/978-981-15-0187-6_7"},{"key":"10592_CR11","doi-asserted-by":"crossref","unstructured":"Huang G, Liu Z, Van Der\u00a0Maaten L, Weinberger KQ (2017) Densely connected convolutional networks. In: Proceedings of the IEEE conference on computer vision and pattern recognition, pp 4700\u20134708","DOI":"10.1109\/CVPR.2017.243"},{"issue":"1","key":"10592_CR12","doi-asserted-by":"publisher","first-page":"574","DOI":"10.1109\/TGRS.2018.2858817","volume":"57","author":"S Ji","year":"2018","unstructured":"Ji S, Wei S, Lu M (2018) Fully convolutional networks for multisource building extraction from an open aerial and satellite imagery data set. IEEE Tran Geosci Remote Sens 57(1):574\u2013586","journal-title":"IEEE Tran Geosci Remote Sens"},{"key":"10592_CR13","unstructured":"Khalel A, El-Saban M (2018) Automatic pixelwise object labeling for aerial imagery using stacked u-nets. https:\/\/arxiv.org\/abs\/1803.04953"},{"issue":"1","key":"10592_CR14","doi-asserted-by":"publisher","first-page":"115","DOI":"10.1109\/LGRS.2018.2868880","volume":"16","author":"JH Kim","year":"2018","unstructured":"Kim JH, Lee H, Hong SJ, Kim S, Park J, Hwang JY, Choi JP (2018) Objects segmentation from high-resolution aerial images using u-net with pyramid pooling layers. IEEE Geosci Remote Sens Lett 16(1):115\u2013119","journal-title":"IEEE Geosci Remote Sens Lett"},{"key":"10592_CR15","doi-asserted-by":"publisher","first-page":"128774","DOI":"10.1109\/ACCESS.2019.2940527","volume":"7","author":"Y Liu","year":"2019","unstructured":"Liu Y, Gross L, Li Z, Li X, Fan X, Qi W (2019) Automatic building extraction on high-resolution remote sensing imagery using deep convolutional encoder-decoder with spatial pyramid pooling. IEEE Access 7:128774\u2013128786","journal-title":"IEEE Access"},{"key":"10592_CR16","doi-asserted-by":"crossref","unstructured":"Long J, Shelhamer E, Darrell T (2015) Fully convolutional networks for semantic segmentation. In: Proceedings of the IEEE conference on computer vision and pattern recognition, pp 3431\u20133440","DOI":"10.1109\/CVPR.2015.7298965"},{"key":"10592_CR17","doi-asserted-by":"crossref","unstructured":"Luong MT, Pham H, Manning CD (2015) Effective approaches to attention-based neural machine translation. https:\/\/arxiv.org\/abs\/1508.04025","DOI":"10.18653\/v1\/D15-1166"},{"key":"10592_CR18","doi-asserted-by":"crossref","unstructured":"Maggiori E, Tarabalka Y, Charpiat G, Alliez P (2017) Can semantic labeling methods generalize to any city? the inria aerial image labeling benchmark. In: 2017 IEEE international geoscience and remote sensing symposium (IGARSS), IEEE, pp 3226\u20133229","DOI":"10.1109\/IGARSS.2017.8127684"},{"issue":"9","key":"10592_CR19","doi-asserted-by":"publisher","first-page":"1067","DOI":"10.1016\/j.patrec.2004.03.004","volume":"25","author":"P Mitra","year":"2004","unstructured":"Mitra P, Shankar BU, Pal SK (2004) Segmentation of multispectral remote sensing images using active support vector machines. Pattern Recogn Lett 25(9):1067\u20131074","journal-title":"Pattern Recogn Lett"},{"key":"10592_CR20","unstructured":"Mnih V (2013) Machine learning for aerial image labeling. Citeseer"},{"key":"10592_CR21","unstructured":"Oktay O, Schlemper J, Folgoc LL, Lee M, Heinrich M, Misawa K, Mori K, McDonagh S, Hammerla NY, Kainz B, et\u00a0al. (2018) Attention u-net: Learning where to look for the pancreas. https:\/\/arxiv.org\/abs\/1804.03999"},{"issue":"1","key":"10592_CR22","doi-asserted-by":"publisher","first-page":"217","DOI":"10.1080\/01431160412331269698","volume":"26","author":"M Pal","year":"2005","unstructured":"Pal M (2005) Random forest classifier for remote sensing classification. Int J Remote Sens 26(1):217\u2013222","journal-title":"Int J Remote Sens"},{"issue":"8","key":"10592_CR23","doi-asserted-by":"publisher","first-page":"917","DOI":"10.3390\/rs11080917","volume":"11","author":"X Pan","year":"2019","unstructured":"Pan X, Yang F, Gao L, Chen Z, Zhang B, Fan H, Ren J (2019) Building extraction from high-resolution aerial imagery using a generative adversarial network with spatial and channel attention mechanisms. Remote Sens 11(8):917","journal-title":"Remote Sens"},{"key":"10592_CR24","unstructured":"Qi HN, Yang JG, Zhong YW, Deng C (2004) Multi-class svm based remote sensing image classification and its semi-supervised improvement scheme. In: Proceedings of 2004 international conference on machine learning and cybernetics (IEEE Cat. No. 04EX826), IEEE, vol\u00a05, pp 3146\u20133151"},{"key":"10592_CR25","doi-asserted-by":"crossref","unstructured":"Ronneberger O, Fischer P, Brox T (2015) U-net: Convolutional networks for biomedical image segmentation. In: International conference on medical image computing and computer-assisted intervention, Springer, pp 234\u2013241","DOI":"10.1007\/978-3-319-24574-4_28"},{"key":"10592_CR26","unstructured":"Sebastian C, Imbriaco R, Bondarev E, de\u00a0With PH (2020) Adversarial loss for semantic segmentation of aerial imagery. https:\/\/arxiv.org\/abs\/2001.04269"},{"key":"10592_CR27","unstructured":"Simonyan K, Zisserman A (2014) Very deep convolutional networks for large-scale image recognition. https:\/\/arxiv.org\/abs\/1409.1556"},{"issue":"3","key":"10592_CR28","doi-asserted-by":"publisher","first-page":"631","DOI":"10.1007\/s12524-012-0241-4","volume":"41","author":"PP Singh","year":"2013","unstructured":"Singh PP, Garg R (2013) Automatic road extraction from high resolution satellite image using adaptive global thresholding and morphological operations. J Ind Soc Remote Sens 41(3):631\u2013640","journal-title":"J Ind Soc Remote Sens"},{"key":"10592_CR29","doi-asserted-by":"crossref","unstructured":"Song L, Xu Y, Zhang L, Du B, Zhang Q, Wang X (2020) Learning from synthetic images via active pseudo-labeling. IEEE Transactions on Image Processing","DOI":"10.1109\/TIP.2020.2989100"},{"issue":"6","key":"10592_CR30","doi-asserted-by":"publisher","first-page":"2327","DOI":"10.1109\/JSTARS.2013.2242846","volume":"6","author":"S Tuermer","year":"2013","unstructured":"Tuermer S, Kurz F, Reinartz P, Stilla U (2013) Airborne vehicle detection in dense urban areas using hog features and disparity maps. IEEE J Select Top Appl Earth Observ Remote Sens 6(6):2327\u20132337","journal-title":"IEEE J Select Top Appl Earth Observ Remote Sens"},{"issue":"1","key":"10592_CR31","doi-asserted-by":"publisher","first-page":"239","DOI":"10.1109\/LGRS.2013.2254108","volume":"11","author":"J Xia","year":"2013","unstructured":"Xia J, Du P, He X, Chanussot J (2013) Hyperspectral remote sensing image classification based on rotation forest. IEEE Geosci Remote Sens Lett 11(1):239\u2013243","journal-title":"IEEE Geosci Remote Sens Lett"},{"key":"10592_CR32","unstructured":"Xu K, Ba J, Kiros R, Cho K, Courville A, Salakhudinov R, Zemel R, Bengio Y (2015) Show, attend and tell: Neural image caption generation with visual attention. In: International conference on machine learning, pp 2048\u20132057"},{"issue":"15","key":"10592_CR33","doi-asserted-by":"publisher","first-page":"1774","DOI":"10.3390\/rs11151774","volume":"11","author":"Y Yi","year":"2019","unstructured":"Yi Y, Zhang Z, Zhang W, Zhang C, Li W, Zhao T (2019) Semantic segmentation of urban buildings from VHR remote sensing imagery using a deep convolutional neural network. Remote Sens 11(15):1774","journal-title":"Remote Sens"},{"key":"10592_CR34","doi-asserted-by":"crossref","unstructured":"Yu C, Wang J, Peng C, Gao C, Yu G, Sang N (2018) Learning a discriminative feature network for semantic segmentation. In: Proceedings of the IEEE conference on computer vision and pattern recognition, pp 1857\u20131866","DOI":"10.1109\/CVPR.2018.00199"},{"issue":"3","key":"10592_CR35","doi-asserted-by":"publisher","first-page":"879","DOI":"10.1109\/TGRS.2011.2162339","volume":"50","author":"L Zhang","year":"2011","unstructured":"Zhang L, Zhang L, Tao D, Huang X (2011) On combining multiple features for hyperspectral remote sensing image classification. IEEE Trans Geosci Remote Sens 50(3):879\u2013893","journal-title":"IEEE Trans Geosci Remote Sens"},{"key":"10592_CR36","doi-asserted-by":"crossref","unstructured":"Zhang Y, Gong W, Sun J (1897) Li W (2019) Web-net: A novel nest networks with ultra-hierarchical sampling for building extraction from aerial imageries. Remote Sens 11(16)","DOI":"10.3390\/rs11161897"},{"issue":"5","key":"10592_CR37","doi-asserted-by":"publisher","first-page":"749","DOI":"10.1109\/LGRS.2018.2802944","volume":"15","author":"Z Zhang","year":"2018","unstructured":"Zhang Z, Liu Q, Wang Y (2018) Road extraction by deep residual u-net. IEEE Geosci Remote Sens Lett 15(5):749\u2013753","journal-title":"IEEE Geosci Remote Sens Lett"},{"key":"10592_CR38","doi-asserted-by":"crossref","unstructured":"Zhao H, Shi J, Qi X, Wang X, Jia J (2017) Pyramid scene parsing network. In: Proceedings of the IEEE conference on computer vision and pattern recognition, pp 2881\u20132890","DOI":"10.1109\/CVPR.2017.660"},{"key":"10592_CR39","doi-asserted-by":"crossref","unstructured":"Zhao H, Zhang Y, Liu S, Shi J, Change\u00a0Loy C, Lin D, Jia J (2018) Psanet: Point-wise spatial attention network for scene parsing. In: Proceedings of the European conference on computer vision (ECCV), pp 267\u2013283","DOI":"10.1007\/978-3-030-01240-3_17"},{"key":"10592_CR40","doi-asserted-by":"crossref","unstructured":"Zhou Z, Siddiquee MMR, Tajbakhsh N, Liang J (2018) Unet++: A nested u-net architecture for medical image segmentation. In: Deep learning in medical image analysis and multimodal learning for clinical decision support, Springer, pp 3\u201311","DOI":"10.1007\/978-3-030-00889-5_1"}],"container-title":["Neural Processing Letters"],"original-title":[],"language":"en","link":[{"URL":"https:\/\/link.springer.com\/content\/pdf\/10.1007\/s11063-021-10592-w.pdf","content-type":"application\/pdf","content-version":"vor","intended-application":"text-mining"},{"URL":"https:\/\/link.springer.com\/article\/10.1007\/s11063-021-10592-w\/fulltext.html","content-type":"text\/html","content-version":"vor","intended-application":"text-mining"},{"URL":"https:\/\/link.springer.com\/content\/pdf\/10.1007\/s11063-021-10592-w.pdf","content-type":"application\/pdf","content-version":"vor","intended-application":"similarity-checking"}],"deposited":{"date-parts":[[2021,10,31]],"date-time":"2021-10-31T10:15:28Z","timestamp":1635675328000},"score":1,"resource":{"primary":{"URL":"https:\/\/link.springer.com\/10.1007\/s11063-021-10592-w"}},"subtitle":[],"short-title":[],"issued":{"date-parts":[[2021,8,2]]},"references-count":40,"journal-issue":{"issue":"6","published-print":{"date-parts":[[2021,12]]}},"alternative-id":["10592"],"URL":"https:\/\/doi.org\/10.1007\/s11063-021-10592-w","relation":{},"ISSN":["1370-4621","1573-773X"],"issn-type":[{"value":"1370-4621","type":"print"},{"value":"1573-773X","type":"electronic"}],"subject":[],"published":{"date-parts":[[2021,8,2]]},"assertion":[{"value":"12 July 2021","order":1,"name":"accepted","label":"Accepted","group":{"name":"ArticleHistory","label":"Article History"}},{"value":"2 August 2021","order":2,"name":"first_online","label":"First Online","group":{"name":"ArticleHistory","label":"Article History"}}]}}