{"status":"ok","message-type":"work","message-version":"1.0.0","message":{"indexed":{"date-parts":[[2026,4,8]],"date-time":"2026-04-08T16:35:15Z","timestamp":1775666115871,"version":"3.50.1"},"reference-count":43,"publisher":"Springer Science and Business Media LLC","issue":"4","license":[{"start":{"date-parts":[[2024,5,28]],"date-time":"2024-05-28T00:00:00Z","timestamp":1716854400000},"content-version":"tdm","delay-in-days":0,"URL":"https:\/\/www.springernature.com\/gp\/researchers\/text-and-data-mining"},{"start":{"date-parts":[[2024,5,28]],"date-time":"2024-05-28T00:00:00Z","timestamp":1716854400000},"content-version":"vor","delay-in-days":0,"URL":"https:\/\/www.springernature.com\/gp\/researchers\/text-and-data-mining"}],"funder":[{"DOI":"10.13039\/501100012166","name":"National Key R&D Program of China","doi-asserted-by":"crossref","award":["2019YFE0105400"],"award-info":[{"award-number":["2019YFE0105400"]}],"id":[{"id":"10.13039\/501100012166","id-type":"DOI","asserted-by":"crossref"}]},{"DOI":"10.13039\/501100012166","name":"National Key R&D Program of China","doi-asserted-by":"crossref","award":["2019YFE0105400"],"award-info":[{"award-number":["2019YFE0105400"]}],"id":[{"id":"10.13039\/501100012166","id-type":"DOI","asserted-by":"crossref"}]},{"DOI":"10.13039\/501100012166","name":"National Key R&D Program of China","doi-asserted-by":"crossref","award":["2019YFE0105400"],"award-info":[{"award-number":["2019YFE0105400"]}],"id":[{"id":"10.13039\/501100012166","id-type":"DOI","asserted-by":"crossref"}]},{"name":"Intelligent Situation Awareness System for Smart Ship","award":["MC-201920-X01"],"award-info":[{"award-number":["MC-201920-X01"]}]},{"name":"Intelligent Situation Awareness System for Smart Ship","award":["MC-201920-X01"],"award-info":[{"award-number":["MC-201920-X01"]}]},{"name":"Intelligent Situation Awareness System for Smart Ship","award":["MC-201920-X01"],"award-info":[{"award-number":["MC-201920-X01"]}]}],"content-domain":{"domain":["link.springer.com"],"crossmark-restriction":false},"short-container-title":["J Real-Time Image Proc"],"published-print":{"date-parts":[[2024,8]]},"DOI":"10.1007\/s11554-024-01479-9","type":"journal-article","created":{"date-parts":[[2024,5,28]],"date-time":"2024-05-28T05:01:45Z","timestamp":1716872505000},"update-policy":"https:\/\/doi.org\/10.1007\/springer_crossmark_policy","source":"Crossref","is-referenced-by-count":14,"title":["AM YOLO: adaptive multi-scale YOLO for ship instance segmentation"],"prefix":"10.1007","volume":"21","author":[{"given":"Ming","family":"Yuan","sequence":"first","affiliation":[]},{"given":"Hao","family":"Meng","sequence":"additional","affiliation":[]},{"given":"Junbao","family":"Wu","sequence":"additional","affiliation":[]}],"member":"297","published-online":{"date-parts":[[2024,5,28]]},"reference":[{"key":"1479_CR1","doi-asserted-by":"publisher","first-page":"1803","DOI":"10.1007\/s11554-021-01144-5","volume":"18","author":"I Ahmed","year":"2021","unstructured":"Ahmed, I., Jeon, G.: A real-time person tracking system based on siammask network for intelligent video surveillance. J. Real Time Image Process. 18, 1803\u20131814 (2021)","journal-title":"J. Real Time Image Process."},{"key":"1479_CR2","doi-asserted-by":"publisher","first-page":"71576","DOI":"10.1109\/ACCESS.2019.2918650","volume":"7","author":"S Basalamah","year":"2019","unstructured":"Basalamah, S., Khan, S.D., Ullah, H.: Scale driven convolutional neural network model for people counting and localization in crowd scenes. IEEE Access 7, 71576\u201371584 (2019)","journal-title":"IEEE Access"},{"issue":"3","key":"1479_CR3","first-page":"3798","volume":"45","author":"J Cao","year":"2022","unstructured":"Cao, J., Pang, Y., Anwer, R.M., Cholakkal, H., Khan, F.S., Shao, L.: Sipmaskv2: enhanced fast image and video instance segmentation. IEEE Trans. Pattern Anal. Mach. Intell. 45(3), 3798\u20133812 (2022)","journal-title":"IEEE Trans. Pattern Anal. Mach. Intell."},{"key":"1479_CR4","doi-asserted-by":"crossref","unstructured":"Chen, H., Sun, K., Tian, Z., Shen, C., Huang, Y., Yan, Y.: Blendmask: Top-down meets bottom-up for instance segmentation. In: Proceedings of the IEEE\/CVF conference on computer vision and pattern recognition, pp. 8573\u20138581 (2020)","DOI":"10.1109\/CVPR42600.2020.00860"},{"key":"1479_CR5","unstructured":"Chen, X., Fang, H., Lin, T.Y., Vedantam, R., Gupta, S., Doll\u00e1r, P., Zitnick, C.L.: Microsoft coco captions: Data collection and evaluation server. arXiv preprint arXiv:1504.00325 (2015)"},{"key":"1479_CR6","doi-asserted-by":"crossref","unstructured":"Cheng, B., Misra, I., Schwing, A.G., Kirillov, A., Girdhar, R.: Masked-attention mask transformer for universal image segmentation. In: Proceedings of the IEEE\/CVF conference on computer vision and pattern recognition, pp. 1290\u20131299 (2022)","DOI":"10.1109\/CVPR52688.2022.00135"},{"key":"1479_CR7","doi-asserted-by":"crossref","unstructured":"Cheng, T., Wang, X., Chen, S., Zhang, W., Zhang, Q., Huang, C., Zhang, Z., Liu, W.: Sparse instance activation for real-time instance segmentation. In: Proceedings of the IEEE\/CVF Conference on Computer Vision and Pattern Recognition, pp. 4433\u20134442 (2022)","DOI":"10.1109\/CVPR52688.2022.00439"},{"issue":"6","key":"1479_CR8","doi-asserted-by":"publisher","first-page":"115","DOI":"10.1007\/s11554-023-01372-x","volume":"20","author":"W Gtifa","year":"2023","unstructured":"Gtifa, W., Sakly, A.: Integrating xilinx fpga and intelligent techniques for improved precision in 3d brain tumor segmentation in medical imaging. J. Real Time Image Process. 20(6), 115 (2023)","journal-title":"J. Real Time Image Process."},{"key":"1479_CR9","doi-asserted-by":"crossref","unstructured":"Han, K., Wang, Y., Tian, Q., Guo, J., Xu, C., Xu, C.: Ghostnet: More features from cheap operations. In: Proceedings of the IEEE\/CVF conference on computer vision and pattern recognition, pp. 1580\u20131589 (2020)","DOI":"10.1109\/CVPR42600.2020.00165"},{"key":"1479_CR10","doi-asserted-by":"crossref","unstructured":"He, J., Li, P., Geng, Y., Xie, X.: Fastinst: A simple query-based model for real-time instance segmentation. In: Proceedings of the IEEE\/CVF Conference on Computer Vision and Pattern Recognition, pp. 23663\u201323672 (2023)","DOI":"10.1109\/CVPR52729.2023.02266"},{"key":"1479_CR11","doi-asserted-by":"crossref","unstructured":"He, K., Gkioxari, G., Doll\u00e1r, P., Girshick, R.: Mask r-cnn. In: Proceedings of the IEEE international conference on computer vision, pp. 2961\u20132969 (2017)","DOI":"10.1109\/ICCV.2017.322"},{"key":"1479_CR12","doi-asserted-by":"publisher","first-page":"1","DOI":"10.1109\/LGRS.2020.3011973","volume":"19","author":"W Huang","year":"2021","unstructured":"Huang, W., Li, G., Jin, B., Chen, Q., Yin, J., Huang, L.: Scenario context-aware-based bidirectional feature pyramid network for remote sensing target detection. IEEE Geosci. Remote Sens. Lett. 19, 1\u20135 (2021)","journal-title":"IEEE Geosci. Remote Sens. Lett."},{"key":"1479_CR13","doi-asserted-by":"crossref","unstructured":"Huang, Z., Huang, L., Gong, Y., Huang, C., Wang, X.: Mask scoring r-cnn. In: Proceedings of the IEEE\/CVF conference on computer vision and pattern recognition, pp. 6409\u20136418 (2019)","DOI":"10.1109\/CVPR.2019.00657"},{"key":"1479_CR14","unstructured":"Jocher, G., Chaurasia, A., Stoken, A., Borovec, J., Kwon, Y., Michael, K., Fang, J., Yifu, Z., Wong, C., Montes, D., et\u00a0al.: ultralytics\/yolov5: v7. 0-yolov5 sota realtime instance segmentation. Zenodo (2022)"},{"issue":"8","key":"1479_CR15","doi-asserted-by":"publisher","first-page":"9489","DOI":"10.1007\/s13369-021-06288-x","volume":"47","author":"SD Khan","year":"2022","unstructured":"Khan, S.D., Alarabi, L., Basalamah, S.: A unified deep learning framework of multi-scale detectors for geo-spatial object detection in high-resolution satellite images. Arab. J. Sci. Eng. 47(8), 9489\u20139504 (2022)","journal-title":"Arab. J. Sci. Eng."},{"issue":"3","key":"1479_CR16","doi-asserted-by":"publisher","first-page":"52","DOI":"10.1007\/s11554-023-01310-x","volume":"20","author":"CL Kim","year":"2023","unstructured":"Kim, C.L., Kim, B.G.: Few-shot learning for facial expression recognition: a comprehensive survey. J. Real Time Image Process. 20(3), 52 (2023)","journal-title":"J. Real Time Image Process."},{"key":"1479_CR17","doi-asserted-by":"publisher","first-page":"7389","DOI":"10.1109\/TIP.2020.3002345","volume":"29","author":"T Kong","year":"2020","unstructured":"Kong, T., Sun, F., Liu, H., Jiang, Y., Li, L., Shi, J.: Foveabox: beyound anchor-based object detection. IEEE Trans. Image Process. 29, 7389\u20137398 (2020)","journal-title":"IEEE Trans. Image Process."},{"key":"1479_CR18","doi-asserted-by":"crossref","unstructured":"Lan, S., Ren, Z., Wu, Y., Davis, L.S., Hua, G.: Saccadenet: a fast and accurate object detector. In: Proceedings of the IEEE\/CVF conference on computer vision and pattern recognition, pp. 10397\u201310406 (2020)","DOI":"10.1109\/CVPR42600.2020.01041"},{"key":"1479_CR19","doi-asserted-by":"crossref","unstructured":"Liu, Y., Li, H., Hu, C., Luo, S., Luo, Y., Chen, C.W.: Learning to aggregate multi-scale context for instance segmentation in remote sensing images. IEEE Trans. Neural Netw. Learn. Syst. (2024)","DOI":"10.1109\/TNNLS.2023.3336563"},{"key":"1479_CR20","doi-asserted-by":"crossref","unstructured":"Lu, X., Li, B., Yue, Y., Li, Q., Yan, J.: Grid r-cnn. In: Proceedings of the IEEE\/CVF Conference on Computer Vision and Pattern Recognition, pp. 7363\u20137372 (2019)","DOI":"10.1109\/CVPR.2019.00754"},{"key":"1479_CR21","doi-asserted-by":"crossref","unstructured":"Pang, J., Chen, K., Shi, J., Feng, H., Ouyang, W., Lin, D.: Libra r-cnn: Towards balanced learning for object detection. In: Proceedings of the IEEE\/CVF conference on computer vision and pattern recognition, pp. 821\u2013830 (2019)","DOI":"10.1109\/CVPR.2019.00091"},{"key":"1479_CR22","unstructured":"Ren, S., He, K., Girshick, R., Sun, J.: Faster r-cnn: Towards real-time object detection with region proposal networks. Adv. Neural Inform. Process. Syst. 28 (2015)"},{"issue":"1","key":"1479_CR23","doi-asserted-by":"publisher","first-page":"315","DOI":"10.1109\/TCSVT.2020.2978194","volume":"31","author":"Y Shan","year":"2020","unstructured":"Shan, Y., Zhou, X., Liu, S., Zhang, Y., Huang, K.: Siamfpn: a deep learning method for accurate and real-time maritime ship tracking. IEEE Trans. Circ. Syst. Video Technol. 31(1), 315\u2013325 (2020)","journal-title":"IEEE Trans. Circ. Syst. Video Technol."},{"key":"1479_CR24","doi-asserted-by":"crossref","unstructured":"Sun, P., Zhang, R., Jiang, Y., Kong, T., Xu, C., Zhan, W., Tomizuka, M., Li, L., Yuan, Z., Wang, C., et\u00a0al.: Sparse r-cnn: End-to-end object detection with learnable proposals. In: Proceedings of the IEEE\/CVF conference on computer vision and pattern recognition, pp. 14454\u201314463 (2021)","DOI":"10.1109\/CVPR46437.2021.01422"},{"issue":"1","key":"1479_CR25","doi-asserted-by":"publisher","first-page":"1","DOI":"10.1186\/s13677-020-00203-9","volume":"9","author":"W Sun","year":"2020","unstructured":"Sun, W., Zhang, X., He, X.: Lightweight image classifier using dilated and depthwise separable convolutions. J. Cloud Comput. 9(1), 1\u201312 (2020)","journal-title":"J. Cloud Comput."},{"key":"1479_CR26","doi-asserted-by":"crossref","unstructured":"Tian, Z., Shen, C., Chen, H.: Conditional convolutions for instance segmentation. In: Computer Vision\u2013ECCV 2020: 16th European Conference, Glasgow, UK, August 23\u201328, 2020, Proceedings, Part I 16, pp. 282\u2013298. Springer (2020)","DOI":"10.1007\/978-3-030-58452-8_17"},{"key":"1479_CR27","doi-asserted-by":"crossref","unstructured":"Tian, Z., Shen, C., Chen, H., He, T.: Fcos: Fully convolutional one-stage object detection. In: Proceedings of the IEEE\/CVF international conference on computer vision, pp. 9627\u20139636 (2019)","DOI":"10.1109\/ICCV.2019.00972"},{"key":"1479_CR28","doi-asserted-by":"crossref","unstructured":"Tian, Z., Shen, C., Wang, X., Chen, H.: Boxinst: High-performance instance segmentation with box annotations. In: Proceedings of the IEEE\/CVF Conference on Computer Vision and Pattern Recognition, pp. 5443\u20135452 (2021)","DOI":"10.1109\/CVPR46437.2021.00540"},{"issue":"2","key":"1479_CR29","doi-asserted-by":"publisher","first-page":"39","DOI":"10.1007\/s11554-023-01296-6","volume":"20","author":"C Wang","year":"2023","unstructured":"Wang, C., Zhong, J., Dai, Q., Qi, Y., Shi, F., Fang, B., Li, X.: Multi-view knowledge distillation for efficient semantic segmentation. J. Real Time Image Process. 20(2), 39 (2023)","journal-title":"J. Real Time Image Process."},{"key":"1479_CR30","doi-asserted-by":"publisher","DOI":"10.1016\/j.infrared.2021.103965","volume":"119","author":"D Wang","year":"2021","unstructured":"Wang, D., Lan, J.: Ppdet: a novel infrared pedestrian detection network in a per-pixel prediction fashion. Infrar. Phys. Technol. 119, 103965 (2021)","journal-title":"Infrar. Phys. Technol."},{"key":"1479_CR31","doi-asserted-by":"crossref","unstructured":"Wang, K., Liew, J.H., Zou, Y., Zhou, D., Feng, J.: Panet: Few-shot image semantic segmentation with prototype alignment. In: proceedings of the IEEE\/CVF international conference on computer vision, pp. 9197\u20139206 (2019)","DOI":"10.1109\/ICCV.2019.00929"},{"key":"1479_CR32","doi-asserted-by":"crossref","unstructured":"Wang, X., Feng, J., Hu, B., Ding, Q., Ran, L., Chen, X., Liu, W.: Weakly-supervised instance segmentation via class-agnostic learning with salient images. In: Proceedings of the IEEE\/CVF Conference on Computer Vision and Pattern Recognition, pp. 10225\u201310235 (2021)","DOI":"10.1109\/CVPR46437.2021.01009"},{"key":"1479_CR33","doi-asserted-by":"crossref","unstructured":"Wang, X., Yu, Z., De\u00a0Mello, S., Kautz, J., Anandkumar, A., Shen, C., Alvarez, J.M.: Freesolo: Learning to segment objects without annotations. In: Proceedings of the IEEE\/CVF Conference on Computer Vision and Pattern Recognition, pp. 14176\u201314186 (2022)","DOI":"10.1109\/CVPR52688.2022.01378"},{"key":"1479_CR34","first-page":"17721","volume":"33","author":"X Wang","year":"2020","unstructured":"Wang, X., Zhang, R., Kong, T., Li, L., Shen, C.: Solov2: dynamic and fast instance segmentation. Adv. Neural Inform. Process. Syst. 33, 17721\u201317732 (2020)","journal-title":"Adv. Neural Inform. Process. Syst."},{"key":"1479_CR35","doi-asserted-by":"crossref","unstructured":"Woo, S., Park, J., Lee, J.Y., Kweon, I.S.: Cbam: Convolutional block attention module. In: Proceedings of the European conference on computer vision (ECCV), pp. 3\u201319 (2018)","DOI":"10.1007\/978-3-030-01234-2_1"},{"key":"1479_CR36","doi-asserted-by":"crossref","unstructured":"Xie, E., Sun, P., Song, X., Wang, W., Liu, X., Liang, D., Shen, C., Luo, P.: Polarmask: Single shot instance segmentation with polar representation. In: Proceedings of the IEEE\/CVF conference on computer vision and pattern recognition, pp. 12193\u201312202 (2020)","DOI":"10.1109\/CVPR42600.2020.01221"},{"key":"1479_CR37","doi-asserted-by":"publisher","first-page":"348","DOI":"10.1016\/j.neucom.2021.09.061","volume":"467","author":"H Yang","year":"2022","unstructured":"Yang, H., Zheng, L., Barzegar, S.G., Zhang, Y., Xu, B.: Borderpointsmask: one-stage instance segmentation with boundary points representation. Neurocomputing 467, 348\u2013359 (2022)","journal-title":"Neurocomputing"},{"key":"1479_CR38","doi-asserted-by":"crossref","unstructured":"Zang, Y., Huang, C., Loy, C.C.: Fasa: feature augmentation and sampling adaptation for long-tailed instance segmentation. In: Proceedings of the IEEE\/CVF International Conference on Computer Vision, pp. 3457\u20133466 (2021)","DOI":"10.1109\/ICCV48922.2021.00344"},{"key":"1479_CR39","doi-asserted-by":"crossref","unstructured":"Zhang, G., Lu, X., Tan, J., Li, J., Zhang, Z., Li, Q., Hu, X.: Refinemask: towards high-quality instance segmentation with fine-grained features. In: Proceedings of the IEEE\/CVF conference on computer vision and pattern recognition, pp. 6861\u20136869 (2021)","DOI":"10.1109\/CVPR46437.2021.00679"},{"key":"1479_CR40","doi-asserted-by":"crossref","unstructured":"Zhang, R., Cheng, T., Yang, S., Jiang, H., Zhang, S., Lyu, J., Li, X., Ying, X., Gao, D., Liu, W., et\u00a0al.: Mobileinst: Video instance segmentation on the mobile. In: Proceedings of the AAAI Conference on Artificial Intelligence, vol.\u00a038, pp. 7260\u20137268 (2024)","DOI":"10.1609\/aaai.v38i7.28555"},{"key":"1479_CR41","doi-asserted-by":"crossref","unstructured":"Zhang, R., Tian, Z., Shen, C., You, M., Yan, Y.: Mask encoding for single shot instance segmentation. In: Proceedings of the IEEE\/CVF conference on computer vision and pattern recognition, pp. 10226\u201310235 (2020)","DOI":"10.1109\/CVPR42600.2020.01024"},{"key":"1479_CR42","doi-asserted-by":"crossref","unstructured":"Zhang, T., Wei, S., Ji, S.: E2ec: an end-to-end contour-based method for high-quality high-speed instance segmentation. In: Proceedings of the IEEE\/CVF Conference on Computer Vision and Pattern Recognition, pp. 4443\u20134452 (2022)","DOI":"10.1109\/CVPR52688.2022.00440"},{"key":"1479_CR43","volume-title":"Yolact++ Better Real-Time Instance Segmentation","author":"C Zhou","year":"2020","unstructured":"Zhou, C.: Yolact++ Better Real-Time Instance Segmentation. University of California, Davis (2020)"}],"container-title":["Journal of Real-Time Image Processing"],"original-title":[],"language":"en","link":[{"URL":"https:\/\/link.springer.com\/content\/pdf\/10.1007\/s11554-024-01479-9.pdf","content-type":"application\/pdf","content-version":"vor","intended-application":"text-mining"},{"URL":"https:\/\/link.springer.com\/article\/10.1007\/s11554-024-01479-9\/fulltext.html","content-type":"text\/html","content-version":"vor","intended-application":"text-mining"},{"URL":"https:\/\/link.springer.com\/content\/pdf\/10.1007\/s11554-024-01479-9.pdf","content-type":"application\/pdf","content-version":"vor","intended-application":"similarity-checking"}],"deposited":{"date-parts":[[2024,8,27]],"date-time":"2024-08-27T16:21:09Z","timestamp":1724775669000},"score":1,"resource":{"primary":{"URL":"https:\/\/link.springer.com\/10.1007\/s11554-024-01479-9"}},"subtitle":[],"short-title":[],"issued":{"date-parts":[[2024,5,28]]},"references-count":43,"journal-issue":{"issue":"4","published-print":{"date-parts":[[2024,8]]}},"alternative-id":["1479"],"URL":"https:\/\/doi.org\/10.1007\/s11554-024-01479-9","relation":{},"ISSN":["1861-8200","1861-8219"],"issn-type":[{"value":"1861-8200","type":"print"},{"value":"1861-8219","type":"electronic"}],"subject":[],"published":{"date-parts":[[2024,5,28]]},"assertion":[{"value":"5 March 2024","order":1,"name":"received","label":"Received","group":{"name":"ArticleHistory","label":"Article History"}},{"value":"9 May 2024","order":2,"name":"accepted","label":"Accepted","group":{"name":"ArticleHistory","label":"Article History"}},{"value":"28 May 2024","order":3,"name":"first_online","label":"First Online","group":{"name":"ArticleHistory","label":"Article History"}},{"order":1,"name":"Ethics","group":{"name":"EthicsHeading","label":"Declarations"}},{"value":"The authors declare that they have no Conflict of interest.","order":2,"name":"Ethics","group":{"name":"EthicsHeading","label":"Conflict of interest"}}],"article-number":"100"}}