{"status":"ok","message-type":"work","message-version":"1.0.0","message":{"indexed":{"date-parts":[[2026,5,11]],"date-time":"2026-05-11T12:39:46Z","timestamp":1778503186171,"version":"3.51.4"},"reference-count":38,"publisher":"Springer Science and Business Media LLC","issue":"2","license":[{"start":{"date-parts":[[2025,4,1]],"date-time":"2025-04-01T00:00:00Z","timestamp":1743465600000},"content-version":"tdm","delay-in-days":0,"URL":"https:\/\/www.springernature.com\/gp\/researchers\/text-and-data-mining"},{"start":{"date-parts":[[2025,4,1]],"date-time":"2025-04-01T00:00:00Z","timestamp":1743465600000},"content-version":"vor","delay-in-days":0,"URL":"https:\/\/www.springernature.com\/gp\/researchers\/text-and-data-mining"}],"funder":[{"name":"\u56fd\u5bb6\u81ea\u7136\u79d1\u5b66\u57fa\u91d1\uff08\u9762\u4e0a\uff09\uff1a\u300a\u673a\u5668\u4eba\u5316\u667a\u80fd\u5236\u5b54\u5200\u5177\u4fdd\u8d28\u52a0\u5de5\u5bff\u547d\u591a\u6a21\u6001\u611f\u77e5\u4e0e\u52a8\u6001\u8bca\u65ad\u5173\u952e\u6280\u672f\u300b","award":["52275407"],"award-info":[{"award-number":["52275407"]}]}],"content-domain":{"domain":["link.springer.com"],"crossmark-restriction":false},"short-container-title":["J Real-Time Image Proc"],"published-print":{"date-parts":[[2025,4]]},"DOI":"10.1007\/s11554-025-01668-0","type":"journal-article","created":{"date-parts":[[2025,4,6]],"date-time":"2025-04-06T00:09:34Z","timestamp":1743898174000},"update-policy":"https:\/\/doi.org\/10.1007\/springer_crossmark_policy","source":"Crossref","is-referenced-by-count":3,"title":["PSC-YOLO: a lightweight model for urban road instance segmentation"],"prefix":"10.1007","volume":"22","author":[{"given":"Xiaolin","family":"Gu","sequence":"first","affiliation":[],"role":[{"role":"author","vocabulary":"crossref"}]},{"given":"Guofeng","family":"Zhang","sequence":"additional","affiliation":[],"role":[{"role":"author","vocabulary":"crossref"}]}],"member":"297","published-online":{"date-parts":[[2025,4,5]]},"reference":[{"key":"1668_CR1","volume-title":"YOLACT++ Better Real-Time Instance Segmentation","author":"C Zhou","year":"2020","unstructured":"Zhou, C.: YOLACT++ Better Real-Time Instance Segmentation. University of California, Davis (2020)"},{"key":"1668_CR2","first-page":"17721","volume":"33","author":"X Wang","year":"2020","unstructured":"Wang, X., Zhang, R., Kong, T., et al.: Solov2: Dynamic and fast instance segmentation[J]. Advances in Neural information processing systems 33, 17721\u201317732 (2020)","journal-title":"Advances in Neural information processing systems"},{"key":"1668_CR3","doi-asserted-by":"crossref","unstructured":"Varghese, R., Sambath, M.: YOLOv8: a novel object detection algorithm with enhanced performance and robustness. In: 2024 International Conference on Advances in Data Engineering and Intelligent Computing Systems (ADICS), pp. 1\u20136. IEEE (2024)","DOI":"10.1109\/ADICS58448.2024.10533619"},{"issue":"10","key":"1668_CR4","doi-asserted-by":"publisher","DOI":"10.1088\/1361-6501\/ad5b10","volume":"35","author":"W Xia","year":"2024","unstructured":"Xia, W., Li, P., Li, Q., et al.: TTIS-YOLO: a traffic target instance segmentation paradigm for complex road scenarios. Meas. Sci. Technol. 35(10), 105402 (2024)","journal-title":"Meas. Sci. Technol."},{"key":"1668_CR5","doi-asserted-by":"publisher","DOI":"10.1016\/j.neucom.2025.129578","volume":"625","author":"KI Rashid","year":"2025","unstructured":"Rashid, K.I., Yang, C.: ViT-CAPS: vision transformer with contrastive adaptive prompt segmentation. Neurocomputing 625, 129578 (2025)","journal-title":"Neurocomputing"},{"key":"1668_CR6","doi-asserted-by":"crossref","unstructured":"Sandler, M., Howard, A., Zhu, M., et al.: MobileNetV2: inverted residuals and linear bottlenecks. Proceedings of the IEEE Conference on Computer Vision and Pattern Recognition, pp. 4510\u20134520 (2018)","DOI":"10.1109\/CVPR.2018.00474"},{"issue":"12","key":"1668_CR7","doi-asserted-by":"publisher","first-page":"2481","DOI":"10.1109\/TPAMI.2016.2644615","volume":"39","author":"V Badrinarayanan","year":"2017","unstructured":"Badrinarayanan, V., Kendall, A., Cipolla, R.: SegNet: a deep convolutional encoder-decoder architecture for image segmentation. IEEE Trans. Pattern Anal. Mach. Intell. 39(12), 2481\u20132495 (2017)","journal-title":"IEEE Trans. Pattern Anal. Mach. Intell."},{"key":"1668_CR8","doi-asserted-by":"crossref","unstructured":"Ronneberger, O., Fischer, P., Brox, T.: U-Net: convolutional networks for biomedical image segmentation. In: Medical Image Computing and Computer-Assisted Intervention-MICCAI (2015)","DOI":"10.1007\/978-3-319-24574-4_28"},{"key":"1668_CR9","doi-asserted-by":"crossref","unstructured":"Hariharan, B., Arbel\u00e1ez, P., Girshick, R., et al.: Simultaneous detection and segmentation. In: Computer Vision-ECCV 2014: 13th European Conference, Zurich, Switzerland, September 6\u201312 (2014)","DOI":"10.1007\/978-3-319-10584-0_20"},{"key":"1668_CR10","doi-asserted-by":"crossref","unstructured":"He, K., Gkioxari, G., Doll\u00e1r, P., et al.: Mask R-CNN. In: Proceedings of the IEEE International Conference on Computer Vision, pp. 2961\u20132969 (2017)","DOI":"10.1109\/ICCV.2017.322"},{"issue":"6","key":"1668_CR11","doi-asserted-by":"publisher","first-page":"1137","DOI":"10.1109\/TPAMI.2016.2577031","volume":"39","author":"S Ren","year":"2016","unstructured":"Ren, S., He, K., Girshick, R., et al.: Faster R-CNN: towards real-time object detection with region proposal networks. IEEE Trans. Pattern Anal. Mach. Intell. 39(6), 1137\u20131149 (2016)","journal-title":"IEEE Trans. Pattern Anal. Mach. Intell."},{"key":"1668_CR12","doi-asserted-by":"crossref","unstructured":"Liu, S., Qi, L., Qin, H., et al.: Path aggregation network for instance segmentation. In: Proceedings of the IEEE Conference on Computer Vision and Pattern Recognition, pp. 8759\u20138768 (2018)","DOI":"10.1109\/CVPR.2018.00913"},{"key":"1668_CR13","doi-asserted-by":"crossref","unstructured":"Cheng, T., Wang, X., Huang, L., et al.: Boundary-preserving mask R-CNN. In: Computer Vision-ECCV 2020: 16th European Conference, Glasgow, UK, August 23\u201328, 2020, Proceedings, Part XIV 16. Springer International Publishing, pp. 660\u2013676 (2020)","DOI":"10.1007\/978-3-030-58568-6_39"},{"key":"1668_CR14","doi-asserted-by":"crossref","unstructured":"Bolya, D., Zhou, C., Xiao, F., et al.: YOLACT: real-time instance segmentation. In: Proceedings of the IEEE\/CVF International Conference on Computer Vision, pp. 9157\u20139166 (2019)","DOI":"10.1109\/ICCV.2019.00925"},{"key":"1668_CR15","doi-asserted-by":"crossref","unstructured":"Wang, X., Kong, T., Shen, C., et al.: SOLO: segmenting objects by locations. In: Computer Vision-ECCV 2020: 16th European Conference, Glasgow, UK, August 23\u201328 (2020)","DOI":"10.1007\/978-3-030-58523-5_38"},{"key":"1668_CR16","doi-asserted-by":"crossref","unstructured":"Chen, H., Sun, K., Tian, Z., et al.: BlendMask: top-down meets bottom-up for instance segmentation. In: Proceedings of the IEEE\/CVF Conference on Computer Vision and Pattern Recognition, pp. 8573\u20138581 (2020)","DOI":"10.1109\/CVPR42600.2020.00860"},{"key":"1668_CR17","doi-asserted-by":"publisher","DOI":"10.1016\/j.engappai.2025.110068","volume":"143","author":"KI Rashid","year":"2025","unstructured":"Rashid, K.I., Yang, C., Huang, C.: Dynamic context-aware high-resolution network for semi-supervised semantic segmentation. Eng. Appl. Artif. Intell. 143, 110068 (2025)","journal-title":"Eng. Appl. Artif. Intell."},{"key":"1668_CR18","unstructured":"Hu, J., Cao, L., Lu, Y., et al.: ISTR: end-to-end instance segmentation with transformers. arXiv preprint arXiv:2105 (2021)"},{"key":"1668_CR19","doi-asserted-by":"crossref","unstructured":"Guo, R., Niu, D., Qu, L., et al.: SOTR: segmenting objects with transformers. In: Proceedings of the IEEE\/CVF International Conference on Computer Vision, pp. 7157\u20137166 (2021)","DOI":"10.1109\/ICCV48922.2021.00707"},{"key":"1668_CR20","first-page":"21898","volume":"34","author":"B Dong","year":"2021","unstructured":"Dong, B., Zeng, F., Wang, T., et al.: SOLQ: segmenting objects by learning queries. Adv. Neural Inf. Process. Syst. 34, 21898\u201321909 (2021)","journal-title":"Adv. Neural Inf. Process. Syst."},{"key":"1668_CR21","doi-asserted-by":"crossref","unstructured":"Cheng, B., Misra, I., Schwing, A.G., et al.: Masked-attention mask transformer for universal image segmentation. In: Proceedings of the IEEE\/CVF Conference on Computer Vision and Pattern Recognition, pp. 1290\u20131299 (2022)","DOI":"10.1109\/CVPR52688.2022.00135"},{"key":"1668_CR22","doi-asserted-by":"crossref","unstructured":"Liu, Z., Lin, Y., Cao, Y., et al.: Swin transformer: hierarchical vision transformer using shifted windows. In: Proceedings of the IEEE\/CVF International Conference on Computer Vision, pp. 10012\u201310022 (2021)","DOI":"10.1109\/ICCV48922.2021.00986"},{"key":"1668_CR23","doi-asserted-by":"crossref","unstructured":"Jain, J., Li, J., Chiu, M.T., et al.: OneFormer: one transformer to rule universal image segmentation. In: Proceedings of the IEEE\/CVF Conference on Computer Vision and Pattern Recognition, pp. 2989\u20132998 (2023)","DOI":"10.1109\/CVPR52729.2023.00292"},{"key":"1668_CR24","unstructured":"Dosovitskiy, A.: An image is worth 16x16 words: transformers for image recognition at scale. arXiv preprint arXiv:2010.11929 (2020)"},{"key":"1668_CR25","unstructured":"Radford, A., Kim, J.W., Hallacy. C., et al.: Learning transferable visual models from natural language supervision. In: International Conference on Machine Learning, pp. 8748-8763. PMLR (2021)"},{"key":"1668_CR26","unstructured":"Lin, Z., Wang, Y., Tang, Z.: Training-free open-ended object detection and segmentation via attention as prompts. arXiv preprint arXiv:2410.05963 (2024)"},{"key":"1668_CR27","unstructured":"Cordts, M., Omran, M., Ramos, S., et al.: The cityscapes dataset. In: CVPR Workshop on the Future of Datasets in Vision, 2: 1 (2015)"},{"key":"1668_CR28","doi-asserted-by":"crossref","unstructured":"Yu, F., Chen, H., Wang, X., et al.: Bdd100k: a diverse driving dataset for heterogeneous multitask learning. In: Proceedings of the IEEE\/CVF Conference on Computer Vision and Pattern Recognition, pp. 2636\u20132645 (2020)","DOI":"10.1109\/CVPR42600.2020.00271"},{"key":"1668_CR29","doi-asserted-by":"crossref","unstructured":"Kirillov, A., Mintun, E., Ravi, N., et al.: Segment anything. In: Proceedings of the IEEE\/CVF International Conference on Computer Vision, pp. 4015\u20134026 ( 2023)","DOI":"10.1109\/ICCV51070.2023.00371"},{"key":"1668_CR30","unstructured":"Zhao, X., Ding, W., An, Y., et al.: Fast segment anything. arXiv preprint arXiv:2306.12156 (2023)"},{"key":"1668_CR31","first-page":"25346","volume":"34","author":"M Mao","year":"2021","unstructured":"Mao, M., Zhang, R., Zheng, H., et al.: Dual-stream network for visual recognition. Adv. Neural Inf. Process. Syst. 34, 25346\u201325358 (2021)","journal-title":"Adv. Neural Inf. Process. Syst."},{"key":"1668_CR32","first-page":"21002","volume":"33","author":"X Li","year":"2020","unstructured":"Li, X., Wang, W., Wu, L., et al.: Generalized focal loss: learning qualified and distributed bounding boxes for dense object detection. Adv. Neural Inf. Process. Syst. 33, 21002\u201321012 (2020)","journal-title":"Adv. Neural Inf. Process. Syst."},{"key":"1668_CR33","doi-asserted-by":"crossref","unstructured":"Ruby, U., Yendapalli, V.: Binary cross entropy with deep learning technique for image classification. Int. J. Adv. Trends Comput. Sci. Eng. 9(10) (2020)","DOI":"10.30534\/ijatcse\/2020\/175942020"},{"key":"1668_CR34","doi-asserted-by":"crossref","unstructured":"Wang, W., Xie, E., Li, X., et al.: Pyramid vision transformer: a versatile backbone for dense prediction without convolutions. In: Proceedings of the IEEE\/CVF International Conference on Computer Vision, pp. 568\u2013578 (2021)","DOI":"10.1109\/ICCV48922.2021.00061"},{"issue":"3","key":"1668_CR35","doi-asserted-by":"publisher","first-page":"415","DOI":"10.1007\/s41095-022-0274-8","volume":"8","author":"W Wang","year":"2022","unstructured":"Wang, W., Xie, E., Li, X., et al.: PVT v2: improved baselines with pyramid vision transformer. Comput. Vis. Media 8(3), 415\u2013424 (2022)","journal-title":"Comput. Vis. Media"},{"key":"1668_CR36","unstructured":"Yu, Z., Huang, H., Chen, W., et al.: YOLO-FaceV2: a scale and occlusion aware face detector. arXiv preprint arXiv:2208.02019 (2022)"},{"key":"1668_CR37","doi-asserted-by":"publisher","first-page":"1169","DOI":"10.1109\/TIP.2020.3042065","volume":"30","author":"T Wu","year":"2020","unstructured":"Wu, T., Tang, S., Zhang, R., et al.: CGNET: a light-weight context guided network for semantic segmentation. IEEE Trans. Image Process. 30, 1169\u20131179 (2020)","journal-title":"IEEE Trans. Image Process."},{"key":"1668_CR38","unstructured":"Vaswani, A.: Attention is all you need. Adv. Neural Inf. Process. Syst. (2017)"}],"container-title":["Journal of Real-Time Image Processing"],"original-title":[],"language":"en","link":[{"URL":"https:\/\/link.springer.com\/content\/pdf\/10.1007\/s11554-025-01668-0.pdf","content-type":"application\/pdf","content-version":"vor","intended-application":"text-mining"},{"URL":"https:\/\/link.springer.com\/article\/10.1007\/s11554-025-01668-0\/fulltext.html","content-type":"text\/html","content-version":"vor","intended-application":"text-mining"},{"URL":"https:\/\/link.springer.com\/content\/pdf\/10.1007\/s11554-025-01668-0.pdf","content-type":"application\/pdf","content-version":"vor","intended-application":"similarity-checking"}],"deposited":{"date-parts":[[2025,5,3]],"date-time":"2025-05-03T06:24:08Z","timestamp":1746253448000},"score":1,"resource":{"primary":{"URL":"https:\/\/link.springer.com\/10.1007\/s11554-025-01668-0"}},"subtitle":[],"short-title":[],"issued":{"date-parts":[[2025,4]]},"references-count":38,"journal-issue":{"issue":"2","published-print":{"date-parts":[[2025,4]]}},"alternative-id":["1668"],"URL":"https:\/\/doi.org\/10.1007\/s11554-025-01668-0","relation":{},"ISSN":["1861-8200","1861-8219"],"issn-type":[{"value":"1861-8200","type":"print"},{"value":"1861-8219","type":"electronic"}],"subject":[],"published":{"date-parts":[[2025,4]]},"assertion":[{"value":"8 February 2025","order":1,"name":"received","label":"Received","group":{"name":"ArticleHistory","label":"Article History"}},{"value":"17 March 2025","order":2,"name":"accepted","label":"Accepted","group":{"name":"ArticleHistory","label":"Article History"}},{"value":"5 April 2025","order":3,"name":"first_online","label":"First Online","group":{"name":"ArticleHistory","label":"Article History"}},{"order":1,"name":"Ethics","group":{"name":"EthicsHeading","label":"Declarations"}},{"value":"The authors have no relevant financial or non-financial interests to disclose.","order":2,"name":"Ethics","group":{"name":"EthicsHeading","label":"Conflict of interest"}}],"article-number":"93"}}