{"status":"ok","message-type":"work","message-version":"1.0.0","message":{"indexed":{"date-parts":[[2026,4,26]],"date-time":"2026-04-26T04:46:52Z","timestamp":1777178812923,"version":"3.51.4"},"reference-count":25,"publisher":"Springer Science and Business Media LLC","issue":"18","license":[{"start":{"date-parts":[[2023,3,13]],"date-time":"2023-03-13T00:00:00Z","timestamp":1678665600000},"content-version":"tdm","delay-in-days":0,"URL":"https:\/\/www.springernature.com\/gp\/researchers\/text-and-data-mining"},{"start":{"date-parts":[[2023,3,13]],"date-time":"2023-03-13T00:00:00Z","timestamp":1678665600000},"content-version":"vor","delay-in-days":0,"URL":"https:\/\/www.springernature.com\/gp\/researchers\/text-and-data-mining"}],"funder":[{"DOI":"10.13039\/100014718","name":"Innovative Research Group Project of the National Natural Science Foundation of China","doi-asserted-by":"publisher","award":["61976105"],"award-info":[{"award-number":["61976105"]}],"id":[{"id":"10.13039\/100014718","id-type":"DOI","asserted-by":"publisher"}]},{"name":"Postgraduate Research & Practice Innovation Program of Jiangsu Province","award":["KYCX22_2342"],"award-info":[{"award-number":["KYCX22_2342"]}]}],"content-domain":{"domain":["link.springer.com"],"crossmark-restriction":false},"short-container-title":["Multimed Tools Appl"],"published-print":{"date-parts":[[2023,7]]},"DOI":"10.1007\/s11042-023-14958-1","type":"journal-article","created":{"date-parts":[[2023,3,13]],"date-time":"2023-03-13T09:02:46Z","timestamp":1678698166000},"page":"28427-28444","update-policy":"https:\/\/doi.org\/10.1007\/springer_crossmark_policy","source":"Crossref","is-referenced-by-count":5,"title":["A semantic segmentation algorithm for fashion images based on modified mask RCNN"],"prefix":"10.1007","volume":"82","author":[{"ORCID":"https:\/\/orcid.org\/0000-0003-3928-4170","authenticated-orcid":false,"given":"Wentao","family":"He","sequence":"first","affiliation":[],"role":[{"role":"author","vocabulary":"crossref"}]},{"given":"Jing\u2019an","family":"Wang","sequence":"additional","affiliation":[],"role":[{"role":"author","vocabulary":"crossref"}]},{"given":"Lei","family":"Wang","sequence":"additional","affiliation":[],"role":[{"role":"author","vocabulary":"crossref"}]},{"given":"Ruru","family":"Pan","sequence":"additional","affiliation":[],"role":[{"role":"author","vocabulary":"crossref"}]},{"given":"Weidong","family":"Gao","sequence":"additional","affiliation":[],"role":[{"role":"author","vocabulary":"crossref"}]}],"member":"297","published-online":{"date-parts":[[2023,3,13]]},"reference":[{"key":"14958_CR1","doi-asserted-by":"publisher","first-page":"217","DOI":"10.1016\/j.eswa.2019.01.010","volume":"122","author":"M Arsalan","year":"2019","unstructured":"Arsalan M, Kim DS, Lee MB, Owais M, Park KR (2019) FRED-Net: fully residual encoder\u2013decoder network for accurate iris segmentation. Expert Syst Appl 122:217\u2013241. https:\/\/doi.org\/10.1016\/j.eswa.2019.01.010","journal-title":"Expert Syst Appl"},{"issue":"12","key":"14958_CR2","doi-asserted-by":"publisher","first-page":"2481","DOI":"10.1109\/TPAMI.2016.2644615","volume":"39","author":"V Badrinarayanan","year":"2017","unstructured":"Badrinarayanan V, Kendall A, Cipolla R (2017) Segnet: a deep convolutional encoder-decoder architecture for image segmentation. IEEE Trans Pattern Anal Mach Intell 39(12):2481\u20132495. https:\/\/doi.org\/10.1109\/TPAMI.2016.2644615","journal-title":"IEEE Trans Pattern Anal Mach Intell"},{"issue":"2","key":"14958_CR3","doi-asserted-by":"publisher","first-page":"1081","DOI":"10.1007\/s11063-019-10129-2","volume":"51","author":"Y Chen","year":"2020","unstructured":"Chen Y, Hu H (2020) Multi-layer adaptive feature fusion for semantic segmentation. Neural Process Lett 51(2):1081\u20131092. https:\/\/doi.org\/10.1007\/s11063-019-10129-2","journal-title":"Neural Process Lett"},{"key":"14958_CR4","doi-asserted-by":"publisher","unstructured":"Chen L-C, Papandreou G, Kokkinos I, Murphy K, Yuille AL (2014) Semantic image segmentation with deep convolutional nets and fully connected crfs. arXiv Prepr. arXiv1412.7062. https:\/\/doi.org\/10.48550\/arXiv.1412.7062","DOI":"10.48550\/arXiv.1412.7062"},{"key":"14958_CR5","doi-asserted-by":"publisher","DOI":"10.1109\/TPAMI.2019.2938758","author":"S Gao","year":"2019","unstructured":"Gao S, Cheng M-M, Zhao K, Zhang X-Y, Yang M-H, Torr PHS (2019) Res2net: a new multi-scale backbone architecture. IEEE Trans Pattern Anal Mach Intell. https:\/\/doi.org\/10.1109\/TPAMI.2019.2938758","journal-title":"IEEE Trans Pattern Anal Mach Intell"},{"key":"14958_CR6","doi-asserted-by":"publisher","first-page":"41","DOI":"10.1016\/j.asoc.2018.05.018","volume":"70","author":"A Garcia-Garcia","year":"2018","unstructured":"Garcia-Garcia A, Orts-Escolano S, Oprea S, Villena-Martinez V, Martinez-Gonzalez P, Garcia-Rodriguez J (2018) A survey on deep learning techniques for image and video semantic segmentation. Appl Soft Comput 70:41\u201365. https:\/\/doi.org\/10.1016\/j.asoc.2018.05.018","journal-title":"Appl Soft Comput"},{"key":"14958_CR7","doi-asserted-by":"publisher","unstructured":"Gong K, Liang X, Zhang D, Shen X, Lin L (2017) Look into person: self-supervised structure-sensitive learning and a new benchmark for human parsing. Proc. \u2013 30th IEEE Conf. Comput. Vis. Pattern Recognition, CVPR 2017, vol 2017-Janua, pp 6757\u20136765. https:\/\/doi.org\/10.1109\/CVPR.2017.715","DOI":"10.1109\/CVPR.2017.715"},{"key":"14958_CR8","doi-asserted-by":"crossref","unstructured":"He K, Zhang X, Ren S, Sun J (2016) Deep residual learning for image recognition. In: Proceedings of the IEEE conference on computer vision and pattern recognition, pp 770\u2013778","DOI":"10.1109\/CVPR.2016.90"},{"issue":"2","key":"14958_CR9","doi-asserted-by":"publisher","first-page":"386","DOI":"10.1109\/TPAMI.2018.2844175","volume":"42","author":"K He","year":"2020","unstructured":"He K, Gkioxari G, Doll\u00e1r P, Girshick R (2020) Mask R-CNN. IEEE Trans Pattern Anal Mach Intell 42(2):386\u2013397. https:\/\/doi.org\/10.1109\/TPAMI.2018.2844175","journal-title":"IEEE Trans Pattern Anal Mach Intell"},{"issue":"8","key":"14958_CR10","doi-asserted-by":"publisher","first-page":"1565","DOI":"10.3390\/rs13081565","volume":"13","author":"J Kwak","year":"2021","unstructured":"Kwak J, Sung Y (2021) DeepLabV3-Refiner-based semantic segmentation model for dense 3D point clouds. Remote Sens 13(8):1565. https:\/\/doi.org\/10.3390\/rs13081565","journal-title":"Remote Sens"},{"issue":"7","key":"14958_CR11","doi-asserted-by":"publisher","first-page":"616","DOI":"10.1111\/mice.12433","volume":"34","author":"S Li","year":"2019","unstructured":"Li S, Zhao X, Zhou G (2019) Automatic pixel-level multiple damage detection of concrete structure using fully convolutional network. Comput Civ Infrastruct Eng 34(7):616\u2013634. https:\/\/doi.org\/10.1111\/mice.12433","journal-title":"Comput Civ Infrastruct Eng"},{"issue":"1","key":"14958_CR12","doi-asserted-by":"publisher","first-page":"253","DOI":"10.1109\/TMM.2013.2285526","volume":"16","author":"S Liu","year":"2013","unstructured":"Liu S et al (2013) Fashion parsing with weak color-category labels. IEEE Trans Multimed 16(1):253\u2013265. https:\/\/doi.org\/10.1109\/TMM.2013.2285526","journal-title":"IEEE Trans Multimed"},{"key":"14958_CR13","doi-asserted-by":"crossref","unstructured":"Liu Z, Luo P, Qiu S, Wang X, Tang X (2016) Deepfashion: powering robust clothes recognition and retrieval with rich annotations. In: Proceedings of the IEEE conference on computer vision and pattern recognition, pp 1096\u20131104","DOI":"10.1109\/CVPR.2016.124"},{"key":"14958_CR14","doi-asserted-by":"crossref","unstructured":"Long J, Shelhamer E, Darrell T (2015) Fully convolutional networks for semantic segmentation. In: Proceedings of the IEEE conference on computer vision and pattern recognition, pp 3431\u20133440","DOI":"10.1109\/CVPR.2015.7298965"},{"key":"14958_CR15","doi-asserted-by":"publisher","DOI":"10.1007\/s11063-020-10368-8","author":"S Mehmood","year":"2020","unstructured":"Mehmood S, Shahzad M, Fraz MM (2020) Deep context aware recurrent neural network for semantic segmentation of large scale unstructured 3D point cloud. Neural Process Lett. https:\/\/doi.org\/10.1007\/s11063-020-10368-8","journal-title":"Neural Process Lett"},{"key":"14958_CR16","doi-asserted-by":"publisher","unstructured":"Paszke A, Chaurasia A, Kim S, Culurciello E (2016) Enet: a deep neural network architecture for real-time semantic segmentation. arXiv Prepr. arXiv1606.02147. https:\/\/doi.org\/10.48550\/arXiv.1606.02147","DOI":"10.48550\/arXiv.1606.02147"},{"issue":"1","key":"14958_CR17","doi-asserted-by":"publisher","first-page":"131","DOI":"10.1007\/s12518-020-00331-6","volume":"13","author":"G Pavoni","year":"2021","unstructured":"Pavoni G, Corsini M, Pedersen N, Petrovic V, Cignoni P (2021) Challenges in the deep learning-based semantic segmentation of benthic communities from Ortho-images. Appl Geomat 13(1):131\u2013146. https:\/\/doi.org\/10.1007\/s12518-020-00331-6","journal-title":"Appl Geomat"},{"issue":"24","key":"14958_CR18","doi-asserted-by":"publisher","first-page":"11517","DOI":"10.1007\/s11042-014-2249-y","volume":"74","author":"P Razzaghi","year":"2015","unstructured":"Razzaghi P, Samavi S (2015) Image retargeting using nonparametric semantic segmentation. Multimed Tools Appl 74(24):11517\u201311536. https:\/\/doi.org\/10.1007\/s11042-014-2249-y","journal-title":"Multimed Tools Appl"},{"key":"14958_CR19","first-page":"91","volume":"28","author":"S Ren","year":"2015","unstructured":"Ren S, He K, Girshick R, Sun J (2015) Faster r-cnn: towards real-time object detection with region proposal networks. Adv Neural Inf Process Syst 28:91\u201399","journal-title":"Adv Neural Inf Process Syst"},{"key":"14958_CR20","doi-asserted-by":"publisher","unstructured":"Simonyan K, Zisserman A (2014) Very deep convolutional networks for large-scale image recognition. arXiv Prepr. arXiv1409.1556. https:\/\/doi.org\/10.48550\/arXiv.1409.1556","DOI":"10.48550\/arXiv.1409.1556"},{"key":"14958_CR21","doi-asserted-by":"publisher","unstructured":"Xia F, Wang P, Chen X, Yuille A (2017) Joint multi-person pose estimation and semantic part segmentation. Proc. \u2013 30th IEEE Conf. Comput. Vis. Pattern Recognition, CVPR 2017, vol 2017-Janua, pp 6080\u20136089. https:\/\/doi.org\/10.1109\/CVPR.2017.644","DOI":"10.1109\/CVPR.2017.644"},{"key":"14958_CR22","doi-asserted-by":"publisher","unstructured":"Yu F, Koltun V (2015) Multi-scale context aggregation by dilated convolutions. arXiv Prepr. arXiv1511.07122. https:\/\/doi.org\/10.48550\/arXiv.1511.07122","DOI":"10.48550\/arXiv.1511.07122"},{"issue":"3","key":"14958_CR23","first-page":"435","volume":"45","author":"Q Zhang","year":"2018","unstructured":"Zhang Q, Yang M, Kpalma K, Zheng Q, Zhang X (2018) Segmentation of hand posture against complex backgrounds based on saliency and skin colour detection. IAENG Int J Comput Sci 45(3):435\u2013444","journal-title":"IAENG Int J Comput Sci"},{"issue":"4","key":"14958_CR24","doi-asserted-by":"publisher","first-page":"435","DOI":"10.3390\/e23040435","volume":"23","author":"X Zhang","year":"2021","unstructured":"Zhang X, Yang Y, Li Z, Ning X, Qin Y, Cai W (2021) An improved encoder-decoder network based on strip pool method applied to segmentation of farmland vacancy field. Entropy 23(4):435. https:\/\/doi.org\/10.3390\/e23040435","journal-title":"Entropy"},{"key":"14958_CR25","doi-asserted-by":"publisher","unstructured":"Zhu B, Chen Y, Tang M, Wang J (2018) Progressive cognitive human parsing. 32nd AAAI Conf. Artif. Intell. AAAI 2018, pp 7607\u20137614. https:\/\/doi.org\/10.1609\/aaai.v32i1.12336","DOI":"10.1609\/aaai.v32i1.12336"}],"container-title":["Multimedia Tools and Applications"],"original-title":[],"language":"en","link":[{"URL":"https:\/\/link.springer.com\/content\/pdf\/10.1007\/s11042-023-14958-1.pdf","content-type":"application\/pdf","content-version":"vor","intended-application":"text-mining"},{"URL":"https:\/\/link.springer.com\/article\/10.1007\/s11042-023-14958-1\/fulltext.html","content-type":"text\/html","content-version":"vor","intended-application":"text-mining"},{"URL":"https:\/\/link.springer.com\/content\/pdf\/10.1007\/s11042-023-14958-1.pdf","content-type":"application\/pdf","content-version":"vor","intended-application":"similarity-checking"}],"deposited":{"date-parts":[[2023,6,27]],"date-time":"2023-06-27T09:40:20Z","timestamp":1687858820000},"score":1,"resource":{"primary":{"URL":"https:\/\/link.springer.com\/10.1007\/s11042-023-14958-1"}},"subtitle":[],"short-title":[],"issued":{"date-parts":[[2023,3,13]]},"references-count":25,"journal-issue":{"issue":"18","published-print":{"date-parts":[[2023,7]]}},"alternative-id":["14958"],"URL":"https:\/\/doi.org\/10.1007\/s11042-023-14958-1","relation":{},"ISSN":["1380-7501","1573-7721"],"issn-type":[{"value":"1380-7501","type":"print"},{"value":"1573-7721","type":"electronic"}],"subject":[],"published":{"date-parts":[[2023,3,13]]},"assertion":[{"value":"5 April 2022","order":1,"name":"received","label":"Received","group":{"name":"ArticleHistory","label":"Article History"}},{"value":"31 October 2022","order":2,"name":"revised","label":"Revised","group":{"name":"ArticleHistory","label":"Article History"}},{"value":"22 February 2023","order":3,"name":"accepted","label":"Accepted","group":{"name":"ArticleHistory","label":"Article History"}},{"value":"13 March 2023","order":4,"name":"first_online","label":"First Online","group":{"name":"ArticleHistory","label":"Article History"}},{"order":1,"name":"Ethics","group":{"name":"EthicsHeading","label":"Declarations"}},{"value":"Data sharing is not applicable to this article, as no new data were created or analyzed in this study.","order":2,"name":"Ethics","group":{"name":"EthicsHeading","label":"Data sharing"}},{"value":"Wentao He, Jing\u2019an Wang, Lei Wang, Ruru Pan* and Weidong Gao declare that they have no conflict of interest.","order":3,"name":"Ethics","group":{"name":"EthicsHeading","label":"Conflict of interest"}}]}}