{"status":"ok","message-type":"work","message-version":"1.0.0","message":{"indexed":{"date-parts":[[2026,5,4]],"date-time":"2026-05-04T11:37:22Z","timestamp":1777894642846,"version":"3.51.4"},"reference-count":50,"publisher":"Springer Science and Business Media LLC","issue":"5","license":[{"start":{"date-parts":[[2024,8,20]],"date-time":"2024-08-20T00:00:00Z","timestamp":1724112000000},"content-version":"tdm","delay-in-days":0,"URL":"https:\/\/www.springernature.com\/gp\/researchers\/text-and-data-mining"},{"start":{"date-parts":[[2024,8,20]],"date-time":"2024-08-20T00:00:00Z","timestamp":1724112000000},"content-version":"vor","delay-in-days":0,"URL":"https:\/\/www.springernature.com\/gp\/researchers\/text-and-data-mining"}],"funder":[{"DOI":"10.13039\/501100003392","name":"Natural Science Foundation of Fujian Province","doi-asserted-by":"publisher","award":["2021J01128"],"award-info":[{"award-number":["2021J01128"]}],"id":[{"id":"10.13039\/501100003392","id-type":"DOI","asserted-by":"publisher"}]},{"DOI":"10.13039\/501100003392","name":"Natural Science Foundation of Fujian Province","doi-asserted-by":"publisher","award":["2021J01128"],"award-info":[{"award-number":["2021J01128"]}],"id":[{"id":"10.13039\/501100003392","id-type":"DOI","asserted-by":"publisher"}]},{"DOI":"10.13039\/501100003392","name":"Natural Science Foundation of Fujian Province","doi-asserted-by":"publisher","award":["2021J01128"],"award-info":[{"award-number":["2021J01128"]}],"id":[{"id":"10.13039\/501100003392","id-type":"DOI","asserted-by":"publisher"}]},{"DOI":"10.13039\/501100003392","name":"Natural Science Foundation of Fujian Province","doi-asserted-by":"publisher","award":["2021J01128"],"award-info":[{"award-number":["2021J01128"]}],"id":[{"id":"10.13039\/501100003392","id-type":"DOI","asserted-by":"publisher"}]},{"name":"Research Institute of Xi Jinping Ecological Civilization, Fujian Agriculture and Forestry University","award":["STWMSX23-10"],"award-info":[{"award-number":["STWMSX23-10"]}]},{"name":"Research Institute of Xi Jinping Ecological Civilization, Fujian Agriculture and Forestry University","award":["STWMSX23-10"],"award-info":[{"award-number":["STWMSX23-10"]}]},{"name":"Research Institute of Xi Jinping Ecological Civilization, Fujian Agriculture and Forestry University","award":["STWMSX23-10"],"award-info":[{"award-number":["STWMSX23-10"]}]},{"name":"Research Institute of Xi Jinping Ecological Civilization, Fujian Agriculture and Forestry University","award":["STWMSX23-10"],"award-info":[{"award-number":["STWMSX23-10"]}]}],"content-domain":{"domain":["link.springer.com"],"crossmark-restriction":false},"short-container-title":["Multimedia Systems"],"published-print":{"date-parts":[[2024,10]]},"DOI":"10.1007\/s00530-024-01438-1","type":"journal-article","created":{"date-parts":[[2024,8,20]],"date-time":"2024-08-20T07:03:37Z","timestamp":1724137417000},"update-policy":"https:\/\/doi.org\/10.1007\/springer_crossmark_policy","source":"Crossref","is-referenced-by-count":3,"title":["Gateinst: instance segmentation with multi-scale gated-enhanced queries in transformer decoder"],"prefix":"10.1007","volume":"30","author":[{"given":"Chih-Wei","family":"Lin","sequence":"first","affiliation":[],"role":[{"role":"author","vocabulary":"crossref"}]},{"given":"Ye","family":"Lin","sequence":"additional","affiliation":[],"role":[{"role":"author","vocabulary":"crossref"}]},{"given":"Shangtai","family":"Zhou","sequence":"additional","affiliation":[],"role":[{"role":"author","vocabulary":"crossref"}]},{"given":"Lirong","family":"Zhu","sequence":"additional","affiliation":[],"role":[{"role":"author","vocabulary":"crossref"}]}],"member":"297","published-online":{"date-parts":[[2024,8,20]]},"reference":[{"key":"1438_CR1","doi-asserted-by":"crossref","unstructured":"Bolya, D., Zhou, C., Xiao, F., et\u00a0al.: Yolact: Real-time instance segmentation. In: Proceedings of the IEEE\/CVF International Conference on Computer Vision, pp 9157\u20139166 (2019)","DOI":"10.1109\/ICCV.2019.00925"},{"issue":"5","key":"1438_CR2","doi-asserted-by":"publisher","first-page":"1483","DOI":"10.1109\/TPAMI.2019.2956516","volume":"43","author":"Z Cai","year":"2019","unstructured":"Cai, Z., Vasconcelos, N.: Cascade r-cnn: High quality object detection and instance segmentation. IEEE Trans. Pattern Anal. Mach. Intell. 43(5), 1483\u20131498 (2019)","journal-title":"IEEE Trans. Pattern Anal. Mach. Intell."},{"key":"1438_CR3","doi-asserted-by":"crossref","unstructured":"Carion, N., Massa, F., Synnaeve, G., et\u00a0al.: End-to-end object detection with transformers. In: Proceedings of the European Conference on Computer Vision, Springer, pp 213\u2013229 (2020)","DOI":"10.1007\/978-3-030-58452-8_13"},{"key":"1438_CR4","doi-asserted-by":"crossref","unstructured":"Chen, K., Pang, J., Wang, J., et\u00a0al.: Hybrid task cascade for instance segmentation. In: Proceedings of the IEEE Conference on Computer Vision and Pattern Recognition (2019a)","DOI":"10.1109\/CVPR.2019.00511"},{"key":"1438_CR5","unstructured":"Chen, K., Wang, J., Pang, J., et\u00a0al.: MMDetection: Open mmlab detection toolbox and benchmark. arXiv preprint arXiv:1906.07155 (2019b)"},{"key":"1438_CR6","doi-asserted-by":"crossref","unstructured":"Chen, L.C., Papandreou, G., Schroff, F., et\u00a0al.: Rethinking atrous convolution for semantic image segmentation (2017)","DOI":"10.1007\/978-3-030-01234-2_49"},{"key":"1438_CR7","unstructured":"Cheng, B., Schwing, A.G., Kirillov, A.: Per-pixel classification is not all you need for semantic segmentation (2021)"},{"key":"1438_CR8","doi-asserted-by":"crossref","unstructured":"Cheng, B., Misra, I., Schwing, A.G., et\u00a0al.: Masked-attention mask transformer for universal image segmentation. In: Proceedings of the IEEE\/CVF Conference on Computer Vision and Pattern Recognition, pp 1290\u20131299 (2022a)","DOI":"10.1109\/CVPR52688.2022.00135"},{"key":"1438_CR9","doi-asserted-by":"crossref","unstructured":"Cheng, T., Wang, X., Chen, S., et\u00a0al.: Sparse instance activation for real-time instance segmentation. In: Proceedings of the IEEE\/CVF Conference on Computer Vision and Pattern Recognition, pp 4433\u20134442 (2022b)","DOI":"10.1109\/CVPR52688.2022.00439"},{"key":"1438_CR10","unstructured":"Cui, Y., Yang, L., Yu, H.: Dq-det: Learning dynamic query combinations for transformer-based object detection and segmentation. arXiv preprint arXiv:2307.12239 (2023a)"},{"key":"1438_CR11","unstructured":"Cui, Y., Yang, L., Yu, H.: (2023b) Learning dynamic query combinations for transformer-based object detection and segmentation"},{"key":"1438_CR12","doi-asserted-by":"crossref","unstructured":"Dai, X., Chen, Y., Yang, J., et\u00a0al.: Dynamic detr: End-to-end object detection with dynamic attention. In: Proceedings of the IEEE\/CVF International Conference on Computer Vision, pp 2988\u20132997 (2021)","DOI":"10.1109\/ICCV48922.2021.00298"},{"key":"1438_CR13","doi-asserted-by":"crossref","unstructured":"Gao, N., Shan, Y., Wang, Y., et\u00a0al.: Ssap: Single-shot instance segmentation with affinity pyramid. In: Proceedings of the IEEE\/CVF International Conference on Computer Vision, pp 642\u2013651 (2019)","DOI":"10.1109\/ICCV.2019.00073"},{"key":"1438_CR14","doi-asserted-by":"crossref","unstructured":"Gao, P., Zheng, M., Wang, X., et\u00a0al.: Fast convergence of detr with spatially modulated co-attention. In: Proceedings of the IEEE\/CVF International Conference on Computer Vision, pp 3621\u20133630 (2021)","DOI":"10.1109\/ICCV48922.2021.00360"},{"key":"1438_CR15","doi-asserted-by":"publisher","DOI":"10.1016\/j.imavis.2022.104401","volume":"120","author":"W Gu","year":"2022","unstructured":"Gu, W., Bai, S., Kong, L.: A review on 2d instance segmentation based on deep neural networks. Image Vis. Comput. 120, 104401 (2022)","journal-title":"Image Vis. Comput."},{"key":"1438_CR16","unstructured":"Gu, Z., Chen, H., Xu, Z., et\u00a0al.: Diffusioninst: Diffusion model for instance segmentation. arXiv preprint arXiv:2212.02773 (2022b)"},{"key":"1438_CR17","doi-asserted-by":"crossref","unstructured":"He, J., Li, P., Geng, Y., et\u00a0al.: Fastinst: A simple query-based model for real-time instance segmentation. In: Proceedings of the IEEE\/CVF Conference on Computer Vision and Pattern Recognition, pp 23663\u201323672 (2023)","DOI":"10.1109\/CVPR52729.2023.02266"},{"key":"1438_CR18","doi-asserted-by":"crossref","unstructured":"He, K., Gkioxari, G., Doll\u00e1r, P., et\u00a0al.: Mask r-cnn. In: Proceedings of the IEEE International Conference on Computer Vision, pp 2961\u20132969 (2017)","DOI":"10.1109\/ICCV.2017.322"},{"key":"1438_CR19","unstructured":"Hu, J., Cao, L., Lu, Y., et\u00a0al.: Istr: End-to-end instance segmentation with transformers. arXiv preprint arXiv:2105.00637 (2021)"},{"key":"1438_CR20","doi-asserted-by":"crossref","unstructured":"Huang, Z., Huang, L., Gong, Y., et\u00a0al.: Mask scoring r-cnn. In: Proceedings of the IEEE\/CVF Conference on Computer Vision and Pattern Recognition, pp 6409\u20136418 (2019)","DOI":"10.1109\/CVPR.2019.00657"},{"issue":"10","key":"1438_CR21","doi-asserted-by":"publisher","first-page":"8275","DOI":"10.1007\/s00521-021-05978-9","volume":"34","author":"P Hurtik","year":"2022","unstructured":"Hurtik, P., Molek, V., Hula, J., et al.: Poly-yolo: higher speed, more precise detection and instance segmentation for yolov3. Neural Comput. Appl. 34(10), 8275\u20138290 (2022)","journal-title":"Neural Comput. Appl."},{"key":"1438_CR22","doi-asserted-by":"crossref","unstructured":"Ke, L., Danelljan, M., Li, X., et\u00a0al.: Mask transfiner for high-quality instance segmentation. In: Proceedings of the IEEE\/CVF Conference on Computer Vision and Pattern Recognition, pp 4412\u20134421 (2022)","DOI":"10.1109\/CVPR52688.2022.00437"},{"key":"1438_CR23","doi-asserted-by":"crossref","unstructured":"Lin, T.Y., Maire, M., Belongie, S., et\u00a0al.: Microsoft coco: Common objects in context. In: Computer Vision\u2013ECCV 2014: 13th European Conference, Zurich, Switzerland, September 6-12, 2014, Proceedings, Part V 13, Springer, pp 740\u2013755 (2014)","DOI":"10.1007\/978-3-319-10602-1_48"},{"key":"1438_CR24","doi-asserted-by":"crossref","unstructured":"Lin, T.Y., Doll\u00e1r, P., Girshick, R., et\u00a0al.: Feature pyramid networks for object detection. arXiv e-prints (2016)","DOI":"10.1109\/CVPR.2017.106"},{"key":"1438_CR25","unstructured":"Liu, S., Li, F., Zhang, H., et\u00a0al.: Dab-detr: Dynamic anchor boxes are better queries for detr. arXiv preprint arXiv:2201.12329 (2022)"},{"key":"1438_CR26","doi-asserted-by":"crossref","unstructured":"Long, Jonathan, Shelhamer, et\u00a0al.: Fully convolutional networks for semantic segmentation. IEEE Transactions on Pattern Analysis and Machine Intelligence (2017)","DOI":"10.1109\/TPAMI.2016.2572683"},{"key":"1438_CR27","unstructured":"Loshchilov, I., Hutter, F.: Decoupled weight decay regularization. arXiv preprint arXiv:1711.05101 (2017)"},{"key":"1438_CR28","unstructured":"Lyu, C., Zhang, W., Huang, H., et\u00a0al.: Rtmdet: An empirical study of designing real-time object detectors. arXiv preprint arXiv:2212.07784 (2022)"},{"key":"1438_CR29","doi-asserted-by":"crossref","unstructured":"Meng, D., Chen, X., Fan, Z., et\u00a0al.: Conditional detr for fast training convergence. In: Proceedings of the IEEE\/CVF International Conference on Computer Vision, pp 3651\u20133660 (2021)","DOI":"10.1109\/ICCV48922.2021.00363"},{"key":"1438_CR30","unstructured":"Redmon, J., Farhadi, A.: Yolov3: An incremental improvement. arXiv preprint arXiv:1804.02767 (2018)"},{"key":"1438_CR31","doi-asserted-by":"crossref","unstructured":"Redmon, J., Divvala, S., Girshick, R., et\u00a0al.: You only look once: Unified, real-time object detection. In: Proceedings of the IEEE Conference on Computer Vision and Pattern Recognition, pp 779\u2013788 (2016)","DOI":"10.1109\/CVPR.2016.91"},{"key":"1438_CR32","unstructured":"Ren, S., He, K., Girshick, R., et\u00a0al.: Faster r-cnn: Towards real-time object detection with region proposal networks. Advances in Neural Information Processing Systems 28 (2015)"},{"key":"1438_CR33","unstructured":"Roh, B., Shin, J., Shin, W., et\u00a0al.; Sparse detr: Efficient end-to-end object detection with learnable sparsity. arXiv preprint arXiv:2111.14330 (2021)"},{"key":"1438_CR34","doi-asserted-by":"crossref","unstructured":"Samet, N., Hicsonmez, S., Akbas, E.: Houghnet: Integrating near and long-range evidence for bottom-up object detection. In: Computer Vision\u2013ECCV 2020: 16th European Conference, Glasgow, UK, August 23\u201328, 2020, Proceedings, Part XXV 16, Springer, pp 406\u2013423 (2020)","DOI":"10.1007\/978-3-030-58595-2_25"},{"key":"1438_CR35","doi-asserted-by":"crossref","unstructured":"Szegedy, C., Ioffe, S., Vanhoucke, V., et\u00a0al.: Inception-v4, inception-resnet and the impact of residual connections on learning (2016)","DOI":"10.1609\/aaai.v31i1.11231"},{"key":"1438_CR36","doi-asserted-by":"crossref","unstructured":"Tian, Z., Shen, C., Chen, H., et\u00a0al.: Fcos: Fully convolutional one-stage object detection. In: Proceedings of the IEEE\/CVF International Conference on Computer Vision, pp 9627\u20139636 (2019)","DOI":"10.1109\/ICCV.2019.00972"},{"key":"1438_CR37","doi-asserted-by":"crossref","unstructured":"Tian, Z., Shen, C., Chen, H.: Conditional convolutions for instance segmentation. In: Proceedings of the European Conference on Computer Vision (2020)","DOI":"10.1007\/978-3-030-58452-8_17"},{"key":"1438_CR38","doi-asserted-by":"crossref","unstructured":"Wang, T., Yuan, L., Chen, Y., et\u00a0al.: Pnp-detr: Towards efficient visual analysis with transformers. In: Proceedings of the IEEE\/CVF International Conference on Computer Vision, pp 4661\u20134670 (2021)","DOI":"10.1109\/ICCV48922.2021.00462"},{"key":"1438_CR39","first-page":"17721","volume":"33","author":"X Wang","year":"2020","unstructured":"Wang, X., Zhang, R., Kong, T., et al.: Solov2: Dynamic and fast instance segmentation. Adv. Neural. Inf. Process. Syst. 33, 17721\u201317732 (2020)","journal-title":"Adv. Neural. Inf. Process. Syst."},{"key":"1438_CR40","doi-asserted-by":"crossref","unstructured":"Wang, Y., Zhang, X., Yang, T., et\u00a0al.: Anchor detr: Query design for transformer-based detector. In: Proceedings of the AAAI conference on artificial intelligence, pp 2567\u20132575 (2022)","DOI":"10.1609\/aaai.v36i3.20158"},{"key":"1438_CR41","doi-asserted-by":"crossref","unstructured":"Woo, S., Debnath, S., Hu, R., et\u00a0al.: Convnext v2: Co-designing and scaling convnets with masked autoencoders. In: Proceedings of the IEEE\/CVF Conference on Computer Vision and Pattern Recognition, pp 16133\u201316142 (2023)","DOI":"10.1109\/CVPR52729.2023.01548"},{"key":"1438_CR42","doi-asserted-by":"crossref","unstructured":"Yang, R., Song, L., Ge, Y., et\u00a0al.: Boxsnake: Polygonal instance segmentation with box supervision. arXiv:2303.11630 (2023)","DOI":"10.1109\/ICCV51070.2023.00077"},{"key":"1438_CR43","unstructured":"Yao, Z., Ai, J., Li, B., et\u00a0al.: Efficient detr: improving end-to-end object detector with dense prior. arXiv preprint arXiv:2104.01318 (2021)"},{"key":"1438_CR44","doi-asserted-by":"crossref","unstructured":"Yu, Q., Wang, H., Kim, D., et\u00a0al.: Cmt-deeplab: Clustering mask transformers for panoptic segmentation. In: Proceedings of the IEEE\/CVF Conference on Computer Vision and Pattern Recognition, pp 2560\u20132570 (2022)","DOI":"10.1109\/CVPR52688.2022.00259"},{"key":"1438_CR45","doi-asserted-by":"crossref","unstructured":"Zhang, G., Lu, X., Tan, J., et\u00a0al.: Refinemask: Towards high-quality instance segmentation with fine-grained features. In: Proceedings of the IEEE\/CVF Conference on Computer Vision and Pattern Recognition, pp 6861\u20136869 (2021)","DOI":"10.1109\/CVPR46437.2021.00679"},{"key":"1438_CR46","unstructured":"Zhang, G., Li, Z., Li, J., et\u00a0al.: Cfnet: Cascade fusion network for dense prediction. arXiv preprint arXiv:2302.06052 (2023)"},{"key":"1438_CR47","doi-asserted-by":"crossref","unstructured":"Zheng, D., Dong, W., Hu, H., et\u00a0al.: Less is more: Focus attention for efficient detr. In: Proceedings of the IEEE\/CVF International Conference on Computer Vision, pp 6674\u20136683 (2023)","DOI":"10.1109\/ICCV51070.2023.00614"},{"key":"1438_CR48","unstructured":"Zheng, M., Gao, P., Zhang, R., et\u00a0al.: End-to-end object detection with adaptive clustering transformer. arXiv preprint arXiv:2011.09315 (2020)"},{"key":"1438_CR49","doi-asserted-by":"crossref","unstructured":"Zheng, S., Lu, J., Zhao, H., et\u00a0al.: Rethinking semantic segmentation from a sequence-to-sequence perspective with transformers. In: Proceedings of the IEEE\/CVF conference on computer vision and pattern recognition, pp 6881\u20136890 (2021)","DOI":"10.1109\/CVPR46437.2021.00681"},{"key":"1438_CR50","unstructured":"Zhu, X., Su, W., Lu, L., et\u00a0al.: Deformable detr: Deformable transformers for end-to-end object detection. arXiv preprint arXiv:2010.04159 (2020)"}],"container-title":["Multimedia Systems"],"original-title":[],"language":"en","link":[{"URL":"https:\/\/link.springer.com\/content\/pdf\/10.1007\/s00530-024-01438-1.pdf","content-type":"application\/pdf","content-version":"vor","intended-application":"text-mining"},{"URL":"https:\/\/link.springer.com\/article\/10.1007\/s00530-024-01438-1\/fulltext.html","content-type":"text\/html","content-version":"vor","intended-application":"text-mining"},{"URL":"https:\/\/link.springer.com\/content\/pdf\/10.1007\/s00530-024-01438-1.pdf","content-type":"application\/pdf","content-version":"vor","intended-application":"similarity-checking"}],"deposited":{"date-parts":[[2024,10,28]],"date-time":"2024-10-28T18:09:52Z","timestamp":1730138992000},"score":1,"resource":{"primary":{"URL":"https:\/\/link.springer.com\/10.1007\/s00530-024-01438-1"}},"subtitle":[],"short-title":[],"issued":{"date-parts":[[2024,8,20]]},"references-count":50,"journal-issue":{"issue":"5","published-print":{"date-parts":[[2024,10]]}},"alternative-id":["1438"],"URL":"https:\/\/doi.org\/10.1007\/s00530-024-01438-1","relation":{},"ISSN":["0942-4962","1432-1882"],"issn-type":[{"value":"0942-4962","type":"print"},{"value":"1432-1882","type":"electronic"}],"subject":[],"published":{"date-parts":[[2024,8,20]]},"assertion":[{"value":"12 December 2023","order":1,"name":"received","label":"Received","group":{"name":"ArticleHistory","label":"Article History"}},{"value":"29 July 2024","order":2,"name":"accepted","label":"Accepted","group":{"name":"ArticleHistory","label":"Article History"}},{"value":"20 August 2024","order":3,"name":"first_online","label":"First Online","group":{"name":"ArticleHistory","label":"Article History"}},{"order":1,"name":"Ethics","group":{"name":"EthicsHeading","label":"Declarations"}},{"value":"The authors declare that they have no known competing financial interests or personal relationships that could have appeared to influence the work reported in this paper.","order":2,"name":"Ethics","group":{"name":"EthicsHeading","label":"Conflict of interest"}}],"article-number":"252"}}