{"status":"ok","message-type":"work","message-version":"1.0.0","message":{"indexed":{"date-parts":[[2026,5,11]],"date-time":"2026-05-11T08:09:51Z","timestamp":1778486991350,"version":"3.51.4"},"reference-count":50,"publisher":"Springer Science and Business Media LLC","issue":"2","license":[{"start":{"date-parts":[[2026,4,1]],"date-time":"2026-04-01T00:00:00Z","timestamp":1775001600000},"content-version":"tdm","delay-in-days":0,"URL":"https:\/\/www.springernature.com\/gp\/researchers\/text-and-data-mining"},{"start":{"date-parts":[[2026,4,1]],"date-time":"2026-04-01T00:00:00Z","timestamp":1775001600000},"content-version":"vor","delay-in-days":0,"URL":"https:\/\/www.springernature.com\/gp\/researchers\/text-and-data-mining"}],"funder":[{"name":"the Major Basic Research Project on Equipment","award":["No.51405-02A03"],"award-info":[{"award-number":["No.51405-02A03"]}]},{"name":"the Science Fund for Creative Research Groups of the National Natural Science Foundation of China,","award":["No. 61921004"],"award-info":[{"award-number":["No. 61921004"]}]}],"content-domain":{"domain":["link.springer.com"],"crossmark-restriction":false},"short-container-title":["J Real-Time Image Proc"],"published-print":{"date-parts":[[2026,4]]},"DOI":"10.1007\/s11554-026-01868-2","type":"journal-article","created":{"date-parts":[[2026,4,5]],"date-time":"2026-04-05T08:43:54Z","timestamp":1775378634000},"update-policy":"https:\/\/doi.org\/10.1007\/springer_crossmark_policy","source":"Crossref","is-referenced-by-count":0,"title":["PCASeg: progressive cross-layer attention with adaptive sparsity for real-time semantic segmentation"],"prefix":"10.1007","volume":"23","author":[{"given":"Dongpu","family":"Li","sequence":"first","affiliation":[]},{"given":"Xiaosu","family":"Xu","sequence":"additional","affiliation":[]}],"member":"297","published-online":{"date-parts":[[2026,4,5]]},"reference":[{"issue":"10","key":"1868_CR1","volume":"36","author":"MA Elhassan","year":"2024","unstructured":"Elhassan, M.A., Zhou, C., Khan, A., Benabid, A., Adam, A.B., Mehmood, A., Wambugu, N.: Real-time semantic segmentation for autonomous driving: A review of CNNs, Transformers, and Beyond, Journal of King Saud University-Computer and Information. Sciences 36(10), 102226 (2024)","journal-title":"Sciences"},{"key":"1868_CR2","doi-asserted-by":"crossref","unstructured":"Abdulateef, S.K., Salman, M.D.: A Comprehensive Review of Image Segmentation Techniques., Iraqi Journal for Electrical & Electronic Engineering 17(2) (2021)","DOI":"10.37917\/ijeee.17.2.18"},{"key":"1868_CR3","doi-asserted-by":"publisher","DOI":"10.1016\/j.compag.2024.108832","volume":"219","author":"A Paul","year":"2024","unstructured":"Paul, A., Machavaram, R., Kumar, D., Nagar, H., et al.: Smart solutions for capsicum Harvesting: Unleashing the power of YOLO for Detection, Segmentation, growth stage Classification, Counting, and real-time mobile identification. Comput. Electron. Agric. 219, 108832 (2024)","journal-title":"Comput. Electron. Agric."},{"issue":"6","key":"1868_CR4","doi-asserted-by":"publisher","first-page":"149","DOI":"10.1007\/s10462-024-10775-6","volume":"57","author":"L Lei","year":"2024","unstructured":"Lei, L., Yang, Q., Yang, L., Shen, T., Wang, R., Fu, C.: Deep learning implementation of image segmentation in agricultural applications: a comprehensive review. Artif. Intell. Rev. 57(6), 149 (2024)","journal-title":"Artif. Intell. Rev."},{"issue":"2","key":"1868_CR5","doi-asserted-by":"publisher","first-page":"261","DOI":"10.1007\/s11263-019-01247-4","volume":"128","author":"L Liu","year":"2020","unstructured":"Liu, L., Ouyang, W., Wang, X., Fieguth, P., Chen, J., Liu, X., Pietik\u00e4inen, M.: Deep learning for generic object detection: A survey. Int. J. Comput. Vision 128(2), 261 (2020)","journal-title":"Int. J. Comput. Vision"},{"key":"1868_CR6","doi-asserted-by":"crossref","unstructured":"Long, J., Shelhamer, E., Darrell, T.: Fully convolutional networks for semantic segmentation, In: Proceedings of the IEEE conference on computer vision and pattern recognition, pp. 3431\u20133440 (2015)","DOI":"10.1109\/CVPR.2015.7298965"},{"key":"1868_CR7","unstructured":"Dosovitskiy, A., Beyer, L., Kolesnikov, A., Weissenborn, D., Zhai, X., Unterthiner, T., Dehghani, M., Minderer, M., Heigold, G., Gelly, S. et\u00a0al.: An image is worth 16x16 words: Transformers for image recognition at scale, arXiv preprint arXiv:2010.11929 (2020)"},{"key":"1868_CR8","unstructured":"Vaswani, A., Shazeer, N., Parmar, N., Uszkoreit, J., Jones, L., Gomez, A.N., Kaiser, \u0141., Polosukhin, I.: Attention is all you need, Advances in neural information processing systems 30 (2017)"},{"key":"1868_CR9","doi-asserted-by":"crossref","unstructured":"Zheng, S., Lu, J., Zhao, H., Zhu, X., Luo, Z., Wang, Y., Fu, Y., Feng, J., Xiang, T., Torr, P.H. et\u00a0al.: Rethinking semantic segmentation from a sequence-to-sequence perspective with transformers, In: Proceedings of the IEEE\/CVF conference on computer vision and pattern recognition, pp. 6881\u20136890 (2021)","DOI":"10.1109\/CVPR46437.2021.00681"},{"key":"1868_CR10","first-page":"12077","volume":"34","author":"E Xie","year":"2021","unstructured":"Xie, E., Wang, W., Yu, Z., Anandkumar, A., Alvarez, J.M., Luo, P.: SegFormer: Simple and efficient design for semantic segmentation with transformers. Adv. Neural. Inf. Process. Syst. 34, 12077 (2021)","journal-title":"Adv. Neural. Inf. Process. Syst."},{"key":"1868_CR11","unstructured":"Rao, Y., Zhao, W., Tang, Y., Zhou, J., Lim, S., Lu, J.: Hornet: Efficient high-order spatial interactions with recursive gated convolutions. arXiv 2022, arXiv preprint arXiv:2207.14284 (2022)"},{"key":"1868_CR12","doi-asserted-by":"publisher","first-page":"95","DOI":"10.3389\/fnins.2019.00095","volume":"13","author":"A Sengupta","year":"2019","unstructured":"Sengupta, A., Ye, Y., Wang, R., Liu, C., Roy, K.: Going deeper in spiking neural networks: VGG and residual architectures. Front. Neurosci. 13, 95 (2019)","journal-title":"Front. Neurosci."},{"key":"1868_CR13","doi-asserted-by":"crossref","unstructured":"Chen, L.C., Zhu, Y., Papandreou, G., Schroff, F., Adam, H.: Encoder-decoder with atrous separable convolution for semantic image segmentation, In: Proceedings of the European conference on computer vision (ECCV) pp. 801\u2013818 (2018)","DOI":"10.1007\/978-3-030-01234-2_49"},{"key":"1868_CR14","doi-asserted-by":"crossref","unstructured":"Lin, T.Y., Doll\u00e1r, P., Girshick, R., He, K., Hariharan, B., Belongie, S.: Feature pyramid networks for object detection, In: Proceedings of the IEEE conference on computer vision and pattern recognition, pp. 2117\u20132125 (2017)","DOI":"10.1109\/CVPR.2017.106"},{"key":"1868_CR15","unstructured":"Paszke, A., Chaurasia, A., Kim, S., Culurciello, E.: Enet: A deep neural network architecture for real-time semantic segmentation, arXiv preprint arXiv:1606.02147 (2016)"},{"key":"1868_CR16","doi-asserted-by":"crossref","unstructured":"Zhao, H., Qi, X., Shen, X., Shi, J., Jia, J.: Icnet for real-time semantic segmentation on high-resolution images, In: Proceedings of the European conference on computer vision (ECCV) pp. 405\u2013420 (2018)","DOI":"10.1007\/978-3-030-01219-9_25"},{"key":"1868_CR17","doi-asserted-by":"crossref","unstructured":"Yu, C., Wang, J., Peng, C., Gao, C., Yu, G., Sang, N.: Bisenet: Bilateral segmentation network for real-time semantic segmentation, In: Proceedings of the European conference on computer vision (ECCV), pp. 325\u2013341 (2018)","DOI":"10.1007\/978-3-030-01261-8_20"},{"key":"1868_CR18","doi-asserted-by":"crossref","unstructured":"Xu, J., Xiong, Z., Bhattacharyya, S.: PIDNet: A real-time semantic segmentation network inspired from PID controller. arXiv, arXiv preprint arXiv:2206.02066 (2022)","DOI":"10.1109\/CVPR52729.2023.01871"},{"key":"1868_CR19","volume":"113","author":"Y Chen","year":"2023","unstructured":"Chen, Y., Zhu, X., Li, Y., Wei, Y., Ye, L.: Enhanced semantic feature pyramid network for small object detection. Signal Processing: Image Communication 113, 116919 (2023)","journal-title":"Signal Processing: Image Communication"},{"key":"1868_CR20","unstructured":"Elhassan, M.A., Yang, C., Huang, C., Munea, T.L., Hong, X., Adam, A., Benabid, A.: S$$^{2}$$-FPN: Scale-aware Strip Attention Guided Feature Pyramid Network for Real-time Semantic Segmentation, arXiv preprint arXiv:2206.07298 (2022)"},{"key":"1868_CR21","unstructured":"Liu, X., Peng, H., Zheng, N., Yang, Y., Hu, H., Yuan, Y.: Efficientvit: Memory efficient vision transformer with cascaded group attention, In: Proceedings of the IEEE\/CVF conference on computer vision and pattern recognition, pp. 14,420\u201314,430 (2023)"},{"key":"1868_CR22","first-page":"1140","volume":"35","author":"MH Guo","year":"2022","unstructured":"Guo, M.H., Lu, C.Z., Hou, Q., Liu, Z., Cheng, M.M., Hu, S.M.: title=Segnext: Rethinking convolutional attention design for semantic segmentation. Adv. Neural. Inf. Process. Syst. 35, 1140 (2022)","journal-title":"Adv. Neural. Inf. Process. Syst."},{"key":"1868_CR23","unstructured":"Zhang, W., Huang, Z., Luo, G., Chen, T., Wang, X., Liu, W., Yu, G., Shen, C.: Topformer: Token pyramid transformer for mobile semantic segmentation, In: Proceedings of the IEEE\/CVF conference on computer vision and pattern recognition, pp. 12,083\u201312,093 (2022)"},{"key":"1868_CR24","unstructured":"Yin, B., Zhang, X., Li, Z., Liu, L., Cheng, M.M., Hou, Q.: Dformer: Rethinking rgbd representation learning for semantic segmentation, arXiv preprint arXiv:2309.09668 (2023)"},{"key":"1868_CR25","doi-asserted-by":"crossref","unstructured":"Yin, B.W., Cao, J.L., Cheng, M.M., Hou, Q.: Dformerv2: Geometry self-attention for rgbd semantic segmentation, In: Proceedings of the Computer Vision and Pattern Recognition Conference, pp. 19,345\u201319,355 (2025)","DOI":"10.1109\/CVPR52734.2025.01802"},{"key":"1868_CR26","doi-asserted-by":"crossref","unstructured":"Jain, J., Li, J., Chiu, M.T., Hassani, A., Orlov, N., Shi, H.: Oneformer: One transformer to rule universal image segmentation, In: Proceedings of the IEEE\/CVF conference on computer vision and pattern recognition, pp. 2989\u20132998 (2023)","DOI":"10.1109\/CVPR52729.2023.00292"},{"key":"1868_CR27","doi-asserted-by":"crossref","unstructured":"Long, W., Zhou, X., Zhang, L., Gu, S.: Progressive Focused Transformer for Single Image Super-Resolution, In: Proceedings of the Computer Vision and Pattern Recognition Conference, pp. 2279\u20132288 (2025)","DOI":"10.1109\/CVPR52734.2025.00218"},{"issue":"19","key":"1868_CR28","doi-asserted-by":"publisher","first-page":"5934","DOI":"10.3390\/s25195934","volume":"25","author":"L Zhang","year":"2025","unstructured":"Zhang, L., Li, M., Zhang, P., Liu, P.: EfficientSegNet: Lightweight Semantic Segmentation with Multi-Scale Feature Fusion and Boundary Enhancement. Sensors 25(19), 5934 (2025)","journal-title":"Sensors"},{"key":"1868_CR29","doi-asserted-by":"publisher","DOI":"10.1016\/j.neucom.2025.130099","volume":"637","author":"S Jia","year":"2025","unstructured":"Jia, S., Dong, Y., Mao, C., Zheng, L., Li, Y., Liu, K.: Multi-Path Feature Enhancement Network for real-time semantic segmentation. Neurocomputing 637, 130099 (2025)","journal-title":"Neurocomputing"},{"key":"1868_CR30","doi-asserted-by":"publisher","DOI":"10.1016\/j.cag.2024.104105","volume":"126","author":"L Shen","year":"2025","unstructured":"Shen, L., Cao, Y., Zhu, W., Ren, K., Shou, Y., Wang, H., Xu, Z.: Enhanced multi-scale feature adaptive fusion sparse convolutional network for large-scale scenes semantic segmentation. Computers & Graphics 126, 104105 (2025)","journal-title":"Computers & Graphics"},{"key":"1868_CR31","doi-asserted-by":"crossref","unstructured":"Jiang, Y., Gong, L., Huang, H., Qi, M.: MSF-TransUNet: A Multi-Scale Feature Fusion Transformer-Based U-Net for Medical Image Segmentation with Uniform Attention., Traitement du Signal 42(1) (2025)","DOI":"10.18280\/ts.420145"},{"key":"1868_CR32","doi-asserted-by":"crossref","unstructured":"Chen, X., Li, H., Li, M., Pan, J.: Learning a sparse transformer network for effective image deraining, In: Proceedings of the IEEE\/CVF conference on computer vision and pattern recognition, pp. 5896\u20135905 (2023)","DOI":"10.1109\/CVPR52729.2023.00571"},{"key":"1868_CR33","first-page":"17864","volume":"34","author":"B Cheng","year":"2021","unstructured":"Cheng, B., Schwing, A., Kirillov, A.: Per-pixel classification is not all you need for semantic segmentation. Adv. Neural. Inf. Process. Syst. 34, 17864 (2021)","journal-title":"Adv. Neural. Inf. Process. Syst."},{"key":"1868_CR34","doi-asserted-by":"crossref","unstructured":"Zhou, B., Zhao, H., Puig, X., Fidler, S., Barriuso, A., Torralba, A.: Scene parsing through ade20k dataset, In: Proceedings of the IEEE conference on computer vision and pattern recognition, pp. 633\u2013641 (2017)","DOI":"10.1109\/CVPR.2017.544"},{"key":"1868_CR35","doi-asserted-by":"crossref","unstructured":"Cordts, M., Omran, M., Ramos, S., Rehfeld, T., Enzweiler, M., Benenson, R., Franke, U., Roth, S., Schiele, B.: The cityscapes dataset for semantic urban scene understanding, In: Proceedings of the IEEE conference on computer vision and pattern recognition, pp. 3213\u20133223 (2016)","DOI":"10.1109\/CVPR.2016.350"},{"issue":"1","key":"1868_CR36","doi-asserted-by":"publisher","first-page":"98","DOI":"10.1007\/s11263-014-0733-5","volume":"111","author":"M Everingham","year":"2015","unstructured":"Everingham, M., Eslami, S.A., Van Gool, L., Williams, C.K., Winn, J., Zisserman, A.: The pascal visual object classes challenge: A retrospective. Int. J. Comput. Vision 111(1), 98 (2015)","journal-title":"Int. J. Comput. Vision"},{"key":"1868_CR37","unstructured":"Contributors, M.: Mmsegmentation: Openmmlab semantic segmentation toolbox and benchmark (2020)"},{"key":"1868_CR38","doi-asserted-by":"crossref","unstructured":"Liu, Z., Lin, Y., Cao, Y., Hu, H., Wei, Y., Zhang, Z., Lin, S., Guo, B.: Swin transformer: Hierarchical vision transformer using shifted windows, In: Proceedings of the IEEE\/CVF international conference on computer vision, pp. 10,012\u201310,022 (2021)","DOI":"10.1109\/ICCV48922.2021.00986"},{"key":"1868_CR39","doi-asserted-by":"crossref","unstructured":"Wang, H., Jiang, X., Ren, H., Hu, Y., Bai, S.: Swiftnet: Real-time video object segmentation, In: Proceedings of the IEEE\/CVF Conference on Computer Vision and Pattern Recognition, pp. 1296\u20131305 (2021)","DOI":"10.1109\/CVPR46437.2021.00135"},{"key":"1868_CR40","doi-asserted-by":"crossref","unstructured":"Li, X., You, A., Zhu, Z., Zhao, H., Yang, M., Yang, K., Tan, S., Tong, Y.: Semantic flow for fast and accurate scene parsing, In: European conference on computer vision Springer, (2020), pp. 775\u2013793","DOI":"10.1007\/978-3-030-58452-8_45"},{"key":"1868_CR41","doi-asserted-by":"crossref","unstructured":"Kumaar, S., Lyu, Y., Nex, F., Yang, M.Y.: Cabinet: Efficient context aggregation network for low-latency semantic segmentation, In: 2021 IEEE International Conference on Robotics and Automation (ICRA), IEEE, pp. 13,517\u201313,524 (2021)","DOI":"10.1109\/ICRA48506.2021.9560977"},{"key":"1868_CR42","doi-asserted-by":"crossref","unstructured":"Strudel, R., Garcia, R., Laptev, I., Schmid, C.: Segmenter: Transformer for semantic segmentation, In: Proceedings of the IEEE\/CVF international conference on computer vision, pp. 7262\u20137272 (2021)","DOI":"10.1109\/ICCV48922.2021.00717"},{"issue":"3","key":"1868_CR43","doi-asserted-by":"publisher","first-page":"3448","DOI":"10.1109\/TITS.2022.3228042","volume":"24","author":"H Pan","year":"2022","unstructured":"Pan, H., Hong, Y., Sun, W., Jia, Y.: Deep dual-resolution networks for real-time and accurate semantic segmentation of traffic scenes. IEEE Trans. Intell. Transp. Syst. 24(3), 3448 (2022)","journal-title":"IEEE Trans. Intell. Transp. Syst."},{"key":"1868_CR44","first-page":"7423","volume":"35","author":"J Wang","year":"2022","unstructured":"Wang, J., Gou, C., Wu, Q., Feng, H., Han, J., Ding, E., Wang, J.: RTFormer: Efficient design for real-time semantic segmentation with transformer. Adv. Neural. Inf. Process. Syst. 35, 7423 (2022)","journal-title":"Adv. Neural. Inf. Process. Syst."},{"key":"1868_CR45","doi-asserted-by":"publisher","first-page":"516","DOI":"10.1609\/aaai.v37i1.25126","volume":"37","author":"B Dong","year":"2023","unstructured":"Dong, B., Wang, P., Wang, F.: Head-free lightweight semantic segmentation with linear transformer. Proceedings of the AAAI conference on artificial intelligence 37, 516\u2013524 (2023)","journal-title":"Proceedings of the AAAI conference on artificial intelligence"},{"issue":"7","key":"1868_CR46","doi-asserted-by":"publisher","first-page":"4318","DOI":"10.1109\/TSMC.2024.3377280","volume":"54","author":"X Peng","year":"2024","unstructured":"Peng, X., Cheng, J., Tang, X., Deng, Z., Tu, W., Xiong, N.: Hsnet: an intelligent hierarchical semantic-aware network system for real-time semantic segmentation. IEEE Transactions on Systems, Man, and Cybernetics: Systems 54(7), 4318 (2024)","journal-title":"IEEE Transactions on Systems, Man, and Cybernetics: Systems"},{"key":"1868_CR47","doi-asserted-by":"publisher","DOI":"10.1016\/j.eswa.2024.124610","volume":"255","author":"MA Elhassan","year":"2024","unstructured":"Elhassan, M.A., Zhou, C., Benabid, A., Adam, A.B.: P2AT: Pyramid pooling axial transformer for real-time semantic segmentation. Expert Syst. Appl. 255, 124610 (2024)","journal-title":"Expert Syst. Appl."},{"key":"1868_CR48","doi-asserted-by":"publisher","first-page":"6378","DOI":"10.1609\/aaai.v38i6.28457","volume":"38","author":"Z Xu","year":"2024","unstructured":"Xu, Z., Wu, D., Yu, C., Chu, X., Sang, N., Gao, C.: Sctnet: Single-branch cnn with transformer semantic information for real-time segmentation. Proceedings of the AAAI conference on artificial intelligence 38, 6378\u20136386 (2024)","journal-title":"Proceedings of the AAAI conference on artificial intelligence"},{"key":"1868_CR49","doi-asserted-by":"publisher","DOI":"10.1016\/j.neucom.2025.129489","volume":"625","author":"Y Gu","year":"2025","unstructured":"Gu, Y., Fu, C., Song, W., Wang, X., Chen, J.: RTLinearFormer: Semantic segmentation with lightweight linear attentions. Neurocomputing 625, 129489 (2025)","journal-title":"Neurocomputing"},{"key":"1868_CR50","doi-asserted-by":"crossref","unstructured":"Zhao, H., Shi, J., Qi, X., Wang, X., Jia, J.: Pyramid scene parsing network, In: Proceedings of the IEEE conference on computer vision and pattern recognition, pp. 2881\u20132890 (2017)","DOI":"10.1109\/CVPR.2017.660"}],"container-title":["Journal of Real-Time Image Processing"],"original-title":[],"language":"en","link":[{"URL":"https:\/\/link.springer.com\/content\/pdf\/10.1007\/s11554-026-01868-2.pdf","content-type":"application\/pdf","content-version":"vor","intended-application":"text-mining"},{"URL":"https:\/\/link.springer.com\/article\/10.1007\/s11554-026-01868-2","content-type":"text\/html","content-version":"vor","intended-application":"text-mining"},{"URL":"https:\/\/link.springer.com\/content\/pdf\/10.1007\/s11554-026-01868-2.pdf","content-type":"application\/pdf","content-version":"vor","intended-application":"similarity-checking"}],"deposited":{"date-parts":[[2026,5,11]],"date-time":"2026-05-11T07:31:55Z","timestamp":1778484715000},"score":1,"resource":{"primary":{"URL":"https:\/\/link.springer.com\/10.1007\/s11554-026-01868-2"}},"subtitle":[],"short-title":[],"issued":{"date-parts":[[2026,4]]},"references-count":50,"journal-issue":{"issue":"2","published-print":{"date-parts":[[2026,4]]}},"alternative-id":["1868"],"URL":"https:\/\/doi.org\/10.1007\/s11554-026-01868-2","relation":{},"ISSN":["1861-8200","1861-8219"],"issn-type":[{"value":"1861-8200","type":"print"},{"value":"1861-8219","type":"electronic"}],"subject":[],"published":{"date-parts":[[2026,4]]},"assertion":[{"value":"8 October 2025","order":1,"name":"received","label":"Received","group":{"name":"ArticleHistory","label":"Article History"}},{"value":"3 March 2026","order":2,"name":"accepted","label":"Accepted","group":{"name":"ArticleHistory","label":"Article History"}},{"value":"5 April 2026","order":3,"name":"first_online","label":"First Online","group":{"name":"ArticleHistory","label":"Article History"}},{"order":1,"name":"Ethics","group":{"name":"EthicsHeading","label":"Declarations"}},{"value":"All the authors declare that they have no competing financial interests or personal relationships that could influence the work reported in this paper. The authors declare no conflict of interest.","order":2,"name":"Ethics","group":{"name":"EthicsHeading","label":"Conflict of interest"}},{"value":"This article does not contain studies with human participants or animals. Statement of informed consent is not applicable since the manuscript does not contain any patient data.","order":3,"name":"Ethics","group":{"name":"EthicsHeading","label":"Ethical approval"}}],"article-number":"84"}}