{"status":"ok","message-type":"work","message-version":"1.0.0","message":{"indexed":{"date-parts":[[2026,7,12]],"date-time":"2026-07-12T02:31:39Z","timestamp":1783823499481,"version":"3.55.0"},"reference-count":36,"publisher":"Springer Science and Business Media LLC","issue":"2","license":[{"start":{"date-parts":[[2026,2,3]],"date-time":"2026-02-03T00:00:00Z","timestamp":1770076800000},"content-version":"tdm","delay-in-days":0,"URL":"https:\/\/www.springernature.com\/gp\/researchers\/text-and-data-mining"},{"start":{"date-parts":[[2026,2,3]],"date-time":"2026-02-03T00:00:00Z","timestamp":1770076800000},"content-version":"vor","delay-in-days":0,"URL":"https:\/\/www.springernature.com\/gp\/researchers\/text-and-data-mining"}],"funder":[{"name":"the Natural Science Foundation of Shandong Province China","award":["No.ZR2022MF292"],"award-info":[{"award-number":["No.ZR2022MF292"]}]}],"content-domain":{"domain":["link.springer.com"],"crossmark-restriction":false},"short-container-title":["Multimedia Systems"],"published-print":{"date-parts":[[2026,4]]},"DOI":"10.1007\/s00530-026-02215-y","type":"journal-article","created":{"date-parts":[[2026,2,3]],"date-time":"2026-02-03T10:11:50Z","timestamp":1770113510000},"update-policy":"https:\/\/doi.org\/10.1007\/springer_crossmark_policy","source":"Crossref","is-referenced-by-count":1,"title":["DT-Net: a hybrid framework of DCNN and transformer for medical image segmentation"],"prefix":"10.1007","volume":"32","author":[{"given":"Xiaoyun","family":"Lu","sequence":"first","affiliation":[],"role":[{"vocabulary":"crossref","role":"author"}]},{"given":"Chunjie","family":"Zhou","sequence":"additional","affiliation":[],"role":[{"vocabulary":"crossref","role":"author"}]},{"given":"Yi","family":"Lu","sequence":"additional","affiliation":[],"role":[{"vocabulary":"crossref","role":"author"}]},{"given":"Ziyun","family":"Zhou","sequence":"additional","affiliation":[],"role":[{"vocabulary":"crossref","role":"author"}]}],"member":"297","published-online":{"date-parts":[[2026,2,3]]},"reference":[{"key":"2215_CR1","doi-asserted-by":"publisher","first-page":"119475","DOI":"10.1016\/j.eswa.2022.119475","volume":"216","author":"Z Ullah","year":"2023","unstructured":"Ullah, Z., Usman, M., Gwak, J.: MTSS-AAE: Multi-task semi-supervised adversarial autoencoding for COVID-19 detection based on chest X-ray images[J]. Expert Syst. Appl. 216, 119475 (2023)","journal-title":"Expert Syst. Appl."},{"key":"2215_CR2","doi-asserted-by":"publisher","first-page":"33687","DOI":"10.1109\/ACCESS.2024.3372394","volume":"12","author":"G Sun","year":"2024","unstructured":"Sun, G., Shu, H., Shao, F., et al.: Fkd-med: Privacy-aware, communication-optimized medical image segmentation via federated learning and model lightweighting through knowledge distillation[J]. Ieee Access. 12, 33687\u201333704 (2024)","journal-title":"Ieee Access."},{"issue":"1","key":"2215_CR3","doi-asserted-by":"publisher","first-page":"261","DOI":"10.1038\/s41598-022-27266-9","volume":"13","author":"Z Ullah","year":"2023","unstructured":"Ullah, Z., Usman, M., Latif, S., et al.: Densely attention mechanism based network for COVID-19 detection in chest X-rays[J]. Sci. Rep. 13(1), 261 (2023)","journal-title":"Sci. Rep."},{"issue":"1","key":"2215_CR4","doi-asserted-by":"publisher","first-page":"9087","DOI":"10.1038\/s41598-023-36311-0","volume":"13","author":"Z Ullah","year":"2023","unstructured":"Ullah, Z., Usman, M., Latif, S., et al.: SSMD-UNet: Semi-supervised multi-task decoders network for diabetic retinopathy segmentation[J]. Sci. Rep. 13(1), 9087 (2023)","journal-title":"Sci. Rep."},{"key":"2215_CR5","doi-asserted-by":"publisher","first-page":"1398237","DOI":"10.3389\/fbioe.2024.1398237","volume":"12","author":"G Sun","year":"2024","unstructured":"Sun, G., Pan, Y., Kong, W., et al.: DA-TransUNet: Integrating Spatial and channel dual attention with transformer U-net for medical image segmentation[J]. Front. Bioeng. Biotechnol. 12, 1398237 (2024)","journal-title":"Front. Bioeng. Biotechnol."},{"key":"2215_CR6","doi-asserted-by":"publisher","first-page":"111854","DOI":"10.1016\/j.knosys.2024.111854","volume":"297","author":"S Ahmad","year":"2024","unstructured":"Ahmad, S., Ullah, Z., Gwak, J.: Multi-teacher cross-modal distillation with cooperative deep supervision fusion learning for unimodal segmentation[J]. Knowl. Based Syst. 297, 111854 (2024)","journal-title":"Knowl. Based Syst."},{"key":"2215_CR7","doi-asserted-by":"publisher","first-page":"1504249","DOI":"10.3389\/fbioe.2024.1504249","volume":"12","author":"Y Pan","year":"2024","unstructured":"Pan, Y., Xin, J., Yang, T., et al.: A mutual inclusion mechanism for precise boundary segmentation in medical images[J]. Front. Bioeng. Biotechnol. 12, 1504249 (2024)","journal-title":"Front. Bioeng. Biotechnol."},{"key":"2215_CR8","doi-asserted-by":"publisher","first-page":"1541","DOI":"10.1016\/j.ins.2022.07.044","volume":"608","author":"Z Ullah","year":"2022","unstructured":"Ullah, Z., Usman, M., Jeon, M., et al.: Cascade multiscale residual attention Cnns with adaptive roi for automatic brain tumor segmentation[J]. Inf. Sci. 608, 1541\u20131556 (2022)","journal-title":"Inf. Sci."},{"key":"2215_CR9","doi-asserted-by":"crossref","unstructured":"Long, J., Shelhamer, E., Darrell, T.: Fully convolutional networks for semantic segmentation[C]\/\/Proceedings of the IEEE conference on computer vision and pattern recognition. : 3431\u20133440. (2015)","DOI":"10.1109\/CVPR.2015.7298965"},{"key":"2215_CR10","doi-asserted-by":"crossref","unstructured":"Ronneberger, O., Fischer, P., Brox, T.: U-net: Convolutional networks for biomedical image segmentation[C]\/\/Medical image computing and computer-assisted intervention\u2013MICCAI 2015: 18th international conference, Munich, Germany, October 5\u20139, 2015, proceedings, part III 18. Springer International Publishing, : 234\u2013241. (2015)","DOI":"10.1007\/978-3-319-24574-4_28"},{"key":"2215_CR11","doi-asserted-by":"crossref","unstructured":"Zhou, Z., Rahman Siddiquee, M.M., Tajbakhsh, N., et al.: Unet++: A nested u-net architecture for medical image segmentation[C]\/\/Deep Learning in Medical Image Analysis and Multimodal Learning for Clinical Decision Support: 4th International Workshop, DLMIA 2018, and 8th International Workshop, ML-CDS 2018, Held in Conjunction with MICCAI 2018, Granada, Spain, September 20, Proceedings 4. Springer International Publishing, 2018: 3\u201311. (2018)","DOI":"10.1007\/978-3-030-00889-5_1"},{"key":"2215_CR12","doi-asserted-by":"crossref","unstructured":"Huang, H., Lin, L., Tong, R., et al.: Unet 3+: A full-scale connected unet for medical image segmentation[C]\/\/ICASSP 2020\u20132020 IEEE international conference on acoustics, speech and signal processing (ICASSP). IEEE, : 1055\u20131059. (2020)","DOI":"10.1109\/ICASSP40776.2020.9053405"},{"key":"2215_CR13","doi-asserted-by":"crossref","unstructured":"He, K., Zhang, X., Ren, S., et al.: Deep residual learning for image recognition[C]\/\/Proceedings of the IEEE conference on computer vision and pattern recognition. : 770\u2013778. (2016)","DOI":"10.1109\/CVPR.2016.90"},{"key":"2215_CR14","unstructured":"Chen, J., Lu, Y., Yu, Q., et al.: Transunet: Transformers make strong encoders for medical image segmentation[J]. (2021). arXiv preprint arXiv:2102.04306"},{"key":"2215_CR15","doi-asserted-by":"crossref","unstructured":"Cao, H., Wang, Y., Chen, J., et al.: Swin-unet: Unet-like pure transformer for medical image segmentation[C]\/\/European conference on computer vision. Cham: Springer Nature Switzerland, : 205\u2013218. (2022)","DOI":"10.1007\/978-3-031-25066-8_9"},{"key":"2215_CR16","doi-asserted-by":"publisher","first-page":"104791","DOI":"10.1016\/j.bspc.2023.104791","volume":"84","author":"H Xiao","year":"2023","unstructured":"Xiao, H., Li, L., Liu, Q., et al.: Transformers in medical image segmentation: A review[J]. Biomed. Signal Process. Control. 84, 104791 (2023)","journal-title":"Biomed. Signal Process. Control"},{"key":"2215_CR17","doi-asserted-by":"publisher","first-page":"105605","DOI":"10.1016\/j.bspc.2023.105605","volume":"88","author":"H Tang","year":"2024","unstructured":"Tang, H., Chen, Y., Wang, T., et al.: HTC-Net: A hybrid CNN-transformer framework for medical image segmentation[J]. Biomed. Signal Process. Control. 88, 105605 (2024)","journal-title":"Biomed. Signal Process. Control"},{"key":"2215_CR18","doi-asserted-by":"publisher","first-page":"112742","DOI":"10.1016\/j.engappai.2025.112742","volume":"162","author":"Z Ullah","year":"2025","unstructured":"Ullah, Z., Kim, J.: Anatomically accurate cardiac segmentation using dense associative Networks[J]. Eng. Appl. Artif. Intell. 162, 112742 (2025)","journal-title":"Eng. Appl. Artif. Intell."},{"key":"2215_CR19","unstructured":"Dosovitskiy, A., Beyer, L., Kolesnikov, A., et al.: An image is worth 16x16 words: Transformers for image recognition at scale[J]. arXiv preprint arXiv:2010.11929, 2020."},{"key":"2215_CR20","doi-asserted-by":"crossref","unstructured":"Liu, Z., Lin, Y., Cao, Y., et al.: Swin transformer: Hierarchical vision transformer using shifted windows[C]\/\/Proceedings of the IEEE\/CVF international conference on computer vision. : 10012\u201310022. (2021)","DOI":"10.1109\/ICCV48922.2021.00986"},{"key":"2215_CR21","doi-asserted-by":"publisher","DOI":"10.1109\/TMI.2023.3264513","author":"A He","year":"2023","unstructured":"He, A., Wang, K., Li, T., et al.: H2Former: An efficient hierarchical hybrid transformer for medical image segmentation. IEEE Transactions on Medical Imaging (2023). https:\/\/doi.org\/10.1109\/TMI.2023.3264513","journal-title":"IEEE Transactions on Medical Imaging"},{"key":"2215_CR22","doi-asserted-by":"crossref","unstructured":"Szegedy, C., Vanhoucke, V., Ioffe, S., et al.: Rethinking the inception architecture for computer vision[C]\/\/Proceedings of the IEEE conference on computer vision and pattern recognition. : 2818\u20132826. (2016)","DOI":"10.1109\/CVPR.2016.308"},{"key":"2215_CR23","doi-asserted-by":"crossref","unstructured":"Xiao, X., Lian, S., Luo, Z., et al.: Weighted res-unet for high-quality retina vessel segmentation[C]\/\/2018 9th international conference on information technology in medicine and education (ITME). IEEE, : 327\u2013331. (2018)","DOI":"10.1109\/ITME.2018.00080"},{"issue":"12","key":"2215_CR24","doi-asserted-by":"publisher","first-page":"2481","DOI":"10.1109\/TPAMI.2016.2644615","volume":"39","author":"V Badrinarayanan","year":"2017","unstructured":"Badrinarayanan, V., Kendall, A., Cipolla, R.: Segnet: A deep convolutional encoder-decoder architecture for image segmentation. IEEE transactions on pattern analysis and machine intelligence 39(12), 2481\u20132495 (2017)","journal-title":"IEEE transactions on pattern analysis and machine intelligence"},{"key":"2215_CR25","doi-asserted-by":"crossref","unstructured":"Huang, G., Liu, S., Van der Maaten, L., et al.: Condensenet: An efficient densenet using learned group convolutions[C]\/\/Proceedings of the IEEE conference on computer vision and pattern recognition. : 2752\u20132761. (2018)","DOI":"10.1109\/CVPR.2018.00291"},{"key":"2215_CR26","unstructured":"Tan, M., Le, Q., Efficientnet: Rethinking model scaling for convolutional neural networks[C]\/\/International conference on machine learning. PMLR, : 6105\u20136114. (2019)"},{"key":"2215_CR27","doi-asserted-by":"crossref","unstructured":"\u00c7i\u00e7ek, \u00d6., Abdulkadir, A., Lienkamp, S.S., et al.: 3D U-Net: learning dense volumetric segmentation from sparse annotation[C]\/\/Medical Image Computing and Computer-Assisted Intervention\u2013MICCAI 2016: 19th International Conference, Athens, Greece, October 17\u201321, 2016, Proceedings, Part II 19. Springer International Publishing, : 424\u2013432. (2016)","DOI":"10.1007\/978-3-319-46723-8_49"},{"key":"2215_CR28","doi-asserted-by":"crossref","unstructured":"Milletari, F., Navab, N., Ahmadi, S.A.: V-net: Fully convolutional neural networks for volumetric medical image segmentation[C]\/\/2016 fourth international conference on 3D vision (3DV). Ieee, : 565\u2013571. (2016)","DOI":"10.1109\/3DV.2016.79"},{"issue":"9","key":"2215_CR29","doi-asserted-by":"publisher","first-page":"1904","DOI":"10.1109\/TPAMI.2015.2389824","volume":"37","author":"K He","year":"2015","unstructured":"He, K., Zhang, X., Ren, S., et al.: Spatial pyramid pooling in deep convolutional networks for visual recognition. IEEE transactions on pattern analysis and machine intelligence 37(9), 1904\u20131916 (2015)","journal-title":"IEEE transactions on pattern analysis and machine intelligence"},{"issue":"4","key":"2215_CR30","doi-asserted-by":"publisher","first-page":"834","DOI":"10.1109\/TPAMI.2017.2699184","volume":"40","author":"LC Chen","year":"2017","unstructured":"Chen, L.C., Papandreou, G., Kokkinos, I., et al.: Deeplab: Semantic image segmentation with deep convolutional nets, atrous convolution, and fully connected crfs[J]. IEEE Trans. Pattern Anal. Mach. Intell. 40(4), 834\u2013848 (2017)","journal-title":"IEEE Trans. Pattern Anal. Mach. Intell."},{"key":"2215_CR31","doi-asserted-by":"crossref","unstructured":"Yang, M., Yu, K., Zhang, C., et al.: Denseaspp for semantic segmentation in street scenes[C]\/\/Proceedings of the IEEE conference on computer vision and pattern recognition. : 3684\u20133692. (2018)","DOI":"10.1109\/CVPR.2018.00388"},{"issue":"10","key":"2215_CR32","doi-asserted-by":"publisher","first-page":"3008","DOI":"10.1109\/TMI.2020.2983721","volume":"39","author":"S Feng","year":"2020","unstructured":"Feng, S., Zhao, H., Shi, F., et al.: CPFNet: Context pyramid fusion network for medical image segmentation[J]. IEEE Trans. Med. Imaging. 39(10), 3008\u20133018 (2020)","journal-title":"IEEE Trans. Med. Imaging"},{"key":"2215_CR33","doi-asserted-by":"crossref","unstructured":"Deng, J., Dong, W., Socher, R., et al.: Imagenet: A large-scale hierarchical image database[C]\/\/2009 IEEE conference on computer vision and pattern recognition. Ieee, : 248\u2013255. (2009)","DOI":"10.1109\/CVPR.2009.5206848"},{"key":"2215_CR34","doi-asserted-by":"crossref","unstructured":"Chen, L.C., Papandreou, G., Schroff, F., et al.: Rethinking atrous Convolution for semantic image segmentation[J]. (2017). arXiv preprint arXiv:1706.05587","DOI":"10.1007\/978-3-030-01234-2_49"},{"issue":"7","key":"2215_CR35","doi-asserted-by":"publisher","first-page":"1597","DOI":"10.1109\/TMI.2018.2791488","volume":"37","author":"H Fu","year":"2018","unstructured":"Fu, H., Cheng, J., Xu, Y., et al.: Joint optic disc and cup segmentation based on multi-label deep network and Polar transformation[J]. IEEE Trans. Med. Imaging. 37(7), 1597\u20131605 (2018)","journal-title":"IEEE Trans. Med. Imaging"},{"key":"2215_CR36","doi-asserted-by":"crossref","unstructured":"Gehlot, S., Gupta, A.: Self-supervision based dual-transformation learning for stain normalization, classification and segmentation[C]\/\/Machine Learning in Medical Imaging: 12th International Workshop, MLMI 2021, Held in Conjunction with MICCAI 2021, Strasbourg, France, September 27, 2021, Proceedings 12. Springer International Publishing, : 477\u2013486. (2021)","DOI":"10.1007\/978-3-030-87589-3_49"}],"container-title":["Multimedia Systems"],"original-title":[],"language":"en","link":[{"URL":"https:\/\/link.springer.com\/content\/pdf\/10.1007\/s00530-026-02215-y.pdf","content-type":"application\/pdf","content-version":"vor","intended-application":"text-mining"},{"URL":"https:\/\/link.springer.com\/article\/10.1007\/s00530-026-02215-y","content-type":"text\/html","content-version":"vor","intended-application":"text-mining"},{"URL":"https:\/\/link.springer.com\/content\/pdf\/10.1007\/s00530-026-02215-y.pdf","content-type":"application\/pdf","content-version":"vor","intended-application":"similarity-checking"}],"deposited":{"date-parts":[[2026,4,2]],"date-time":"2026-04-02T11:35:48Z","timestamp":1775129748000},"score":1,"resource":{"primary":{"URL":"https:\/\/link.springer.com\/10.1007\/s00530-026-02215-y"}},"subtitle":[],"short-title":[],"issued":{"date-parts":[[2026,2,3]]},"references-count":36,"journal-issue":{"issue":"2","published-print":{"date-parts":[[2026,4]]}},"alternative-id":["2215"],"URL":"https:\/\/doi.org\/10.1007\/s00530-026-02215-y","relation":{},"ISSN":["0942-4962","1432-1882"],"issn-type":[{"value":"0942-4962","type":"print"},{"value":"1432-1882","type":"electronic"}],"subject":[],"published":{"date-parts":[[2026,2,3]]},"assertion":[{"value":"31 December 2024","order":1,"name":"received","label":"Received","group":{"name":"ArticleHistory","label":"Article History"}},{"value":"4 January 2026","order":2,"name":"accepted","label":"Accepted","group":{"name":"ArticleHistory","label":"Article History"}},{"value":"3 February 2026","order":3,"name":"first_online","label":"First Online","group":{"name":"ArticleHistory","label":"Article History"}},{"order":1,"name":"Ethics","group":{"name":"EthicsHeading","label":"Declarations"}},{"value":"The authors declare no competing interests.","order":2,"name":"Ethics","group":{"name":"EthicsHeading","label":"Competing interests"}}],"article-number":"142"}}