{"status":"ok","message-type":"work","message-version":"1.0.0","message":{"indexed":{"date-parts":[[2026,1,19]],"date-time":"2026-01-19T04:36:22Z","timestamp":1768797382897,"version":"3.49.0"},"reference-count":54,"publisher":"Springer Science and Business Media LLC","issue":"6","license":[{"start":{"date-parts":[[2024,9,25]],"date-time":"2024-09-25T00:00:00Z","timestamp":1727222400000},"content-version":"tdm","delay-in-days":0,"URL":"https:\/\/www.springernature.com\/gp\/researchers\/text-and-data-mining"},{"start":{"date-parts":[[2024,9,25]],"date-time":"2024-09-25T00:00:00Z","timestamp":1727222400000},"content-version":"vor","delay-in-days":0,"URL":"https:\/\/www.springernature.com\/gp\/researchers\/text-and-data-mining"}],"content-domain":{"domain":["link.springer.com"],"crossmark-restriction":false},"short-container-title":["Vis Comput"],"published-print":{"date-parts":[[2025,4]]},"DOI":"10.1007\/s00371-024-03653-3","type":"journal-article","created":{"date-parts":[[2024,9,25]],"date-time":"2024-09-25T21:33:08Z","timestamp":1727299988000},"page":"4171-4181","update-policy":"https:\/\/doi.org\/10.1007\/springer_crossmark_policy","source":"Crossref","is-referenced-by-count":1,"title":["A dynamic attention mechanism for object detection in road or strip environments"],"prefix":"10.1007","volume":"41","author":[{"given":"Guowei","family":"Zhang","sequence":"first","affiliation":[],"role":[{"role":"author","vocabulary":"crossref"}]},{"given":"Weidong","family":"Zhang","sequence":"additional","affiliation":[],"role":[{"role":"author","vocabulary":"crossref"}]},{"given":"Wuzhi","family":"Li","sequence":"additional","affiliation":[],"role":[{"role":"author","vocabulary":"crossref"}]},{"given":"Li","family":"Wang","sequence":"additional","affiliation":[],"role":[{"role":"author","vocabulary":"crossref"}]},{"given":"Huankang","family":"Cui","sequence":"additional","affiliation":[],"role":[{"role":"author","vocabulary":"crossref"}]}],"member":"297","published-online":{"date-parts":[[2024,9,25]]},"reference":[{"key":"3653_CR1","doi-asserted-by":"crossref","unstructured":"Qi, Y., He, Y., Qi, X., Zhang, Y., Yang, G.: Dynamic snake convolution based on topological geometric constraints for tubular structure segmentation. In: Proceedings of the IEEE\/CVF international conference on computer vision, pp. 6070\u20136079 (2023)","DOI":"10.1109\/ICCV51070.2023.00558"},{"key":"3653_CR2","doi-asserted-by":"publisher","first-page":"7192","DOI":"10.1109\/TIP.2020.2999854","volume":"29","author":"A Nazir","year":"2020","unstructured":"Nazir, A., Cheema, M.N., Sheng, B., Li, H., Li, P., Yang, P., Jung, Y., Qin, J., Kim, J., Feng, D.D.: Off-enet: an optimally fused fully end-to-end network for automatic dense volumetric 3d intracranial blood vessels segmentation. IEEE Trans. Image Process. 29, 7192\u20137202 (2020)","journal-title":"IEEE Trans. Image Process."},{"key":"3653_CR3","doi-asserted-by":"crossref","unstructured":"Carion, N., Massa, F., Synnaeve, G., Usunier, N., Kirillov, A., Zagoruyko, S.: End-to-end object detection with transformers. In: European Conference on Computer Vision, Springer pp. 213\u2013229 (2020)","DOI":"10.1007\/978-3-030-58452-8_13"},{"key":"3653_CR4","unstructured":"Zhu, X., Su, W., Lu, L., Li, B., Wang, X., Dai, J.: Deformable detr: Deformable transformers for end-to-end object detection. arXiv preprint arXiv:2010.04159 (2020)"},{"key":"3653_CR5","doi-asserted-by":"crossref","unstructured":"Lin, T.-Y., Maire, M., Belongie, S., Hays, J., Perona, P., Ramanan, D., Doll\u00e1r, P., Zitnick, C.L.: Microsoft coco: Common objects in context. In: Computer Vision\u2013ECCV 2014: 13th European Conference, Zurich, Switzerland, September 6-12, 2014, Proceedings, Part V 13, pp. 740\u2013755 (2014). Springer","DOI":"10.1007\/978-3-319-10602-1_48"},{"key":"3653_CR6","unstructured":"Vaswani, A., Shazeer, N., Parmar, N., Uszkoreit, J., Jones, L., Gomez, A.N., Kaiser, \u0141., Polosukhin, I.: Attention is all you need. Adv. Neural Inf. Process. Syst. 30 (2017)"},{"key":"3653_CR7","doi-asserted-by":"crossref","unstructured":"Tay, Y., Dehghani, M., Bahri, D., Metzler, D.: Efficient transformers: a survey. ACM Comput. Surv. 55(6), 1\u201328 (2022)","DOI":"10.1145\/3530811"},{"key":"3653_CR8","doi-asserted-by":"publisher","first-page":"50","DOI":"10.1109\/TMM.2021.3120873","volume":"25","author":"X Lin","year":"2021","unstructured":"Lin, X., Sun, S., Huang, W., Sheng, B., Li, P., Feng, D.D.: Eapt: efficient attention pyramid transformer for image processing. IEEE Trans. Multimed. 25, 50\u201361 (2021)","journal-title":"IEEE Trans. Multimed."},{"key":"3653_CR9","unstructured":"Liu, P.J., Saleh, M., Pot, E., Goodrich, B., Sepassi, R., Kaiser, L., Shazeer, N.: Generating wikipedia by summarizing long sequences. arXiv preprint arXiv:1801.10198 (2018)"},{"key":"3653_CR10","unstructured":"Parmar, N., Vaswani, A., Uszkoreit, J., Kaiser, \u0141., Shazeer, N.: Alexander ku and dustin tran. image transformer. arXiv preprint arXiv: 1802.05751 (2018)"},{"key":"3653_CR11","unstructured":"Child, R., Gray, S., Radford, A., Sutskever, I.: Generating long sequences with sparse transformers. arXiv preprint arXiv:1904.10509 (2019)"},{"key":"3653_CR12","doi-asserted-by":"crossref","unstructured":"Huang, Z., Wang, X., Huang, L., Huang, C., Wei, Y., Liu, W.: Ccnet: Criss-cross attention for semantic segmentation. In: Proceedings of the IEEE\/CVF international conference on computer vision, pp. 603\u2013612 (2019)","DOI":"10.1109\/ICCV.2019.00069"},{"key":"3653_CR13","unstructured":"Ho, J., Kalchbrenner, N., Weissenborn, D., Salimans, T.: Axial attention in multidimensional transformers. arXiv preprint arXiv:1912.12180 (2019)"},{"key":"3653_CR14","doi-asserted-by":"crossref","unstructured":"Wang, H., Zhu, Y., Green, B., Adam, H., Yuille, A., Chen, L.-C.: Axial-deeplab: stand-alone axial-attention for panoptic segmentation. In: European conference on computer vision, Springer pp. 108\u2013126 (2020)","DOI":"10.1007\/978-3-030-58548-8_7"},{"key":"3653_CR15","doi-asserted-by":"crossref","unstructured":"Hu, H., Zhang, Z., Xie, Z., Lin, S.: Local relation networks for image recognition. In: Proceedings of the IEEE\/CVF international conference on computer vision, pp. 3464\u20133473 (2019)","DOI":"10.1109\/ICCV.2019.00356"},{"key":"3653_CR16","unstructured":"Ramachandran, P., Parmar, N., Vaswani, A., Bello, I., Levskaya, A., Shlens, J.: Stand-alone self-attention in vision models. Adv. Neural Inf. Process. Syst. 32 (2019)"},{"key":"3653_CR17","doi-asserted-by":"crossref","unstructured":"Qiu, J., Ma, H., Levy, O., Yih, S.W.-t., Wang, S., Tang, J.: Blockwise self-attention for long document understanding. arXiv preprint arXiv:1911.02972 (2019)","DOI":"10.18653\/v1\/2020.findings-emnlp.232"},{"key":"3653_CR18","unstructured":"Beltagy, I., Peters, M.E., Cohan, A.: Longformer: The long-document transformer. arXiv preprint arXiv:2004.05150 (2020)"},{"key":"3653_CR19","doi-asserted-by":"crossref","unstructured":"Ainslie, J., Ontanon, S., Alberti, C., Cvicek, V., Fisher, Z., Pham, P., Ravula, A., Sanghai, S., Wang, Q., Yang, L.: Etc: Encoding long and structured inputs in transformers. arXiv preprint arXiv:2004.08483 (2020)","DOI":"10.18653\/v1\/2020.emnlp-main.19"},{"key":"3653_CR20","first-page":"17283","volume":"33","author":"M Zaheer","year":"2020","unstructured":"Zaheer, M., Guruganesh, G., Dubey, K.A., Ainslie, J., Alberti, C., Ontanon, S., Pham, P., Ravula, A., Wang, Q., Yang, L., et al.: Big bird: transformers for longer sequences. Adv. Neural Inf. Process. Syst. 33, 17283\u201317297 (2020)","journal-title":"Adv. Neural Inf. Process. Syst."},{"key":"3653_CR21","doi-asserted-by":"crossref","unstructured":"Cao, H., Qu, Z., Chen, G., Li, X., Thiele, L., Knoll, A.: Ghostvit: expediting vision transformers via cheap operations. IEEE Trans. Artif. Intell. (2023)","DOI":"10.1109\/TAI.2023.3326795"},{"key":"3653_CR22","unstructured":"Kitaev, N., Kaiser, \u0141., Levskaya, A.: Reformer: the efficient transformer. arXiv preprint arXiv:2001.04451 (2020)"},{"key":"3653_CR23","doi-asserted-by":"publisher","first-page":"53","DOI":"10.1162\/tacl_a_00353","volume":"9","author":"A Roy","year":"2021","unstructured":"Roy, A., Saffar, M., Vaswani, A., Grangier, D.: Efficient content-based sparse attention with routing transformers. Trans. Assoc. Comput. Linguist. 9, 53\u201368 (2021)","journal-title":"Trans. Assoc. Comput. Linguist."},{"key":"3653_CR24","unstructured":"Tay, Y., Bahri, D., Yang, L., Metzler, D., Juan, D.-C.: Sparse sinkhorn attention. In: International conference on machine learning, pp. 9438\u20139447 (2020). PMLR"},{"key":"3653_CR25","doi-asserted-by":"crossref","unstructured":"Zhu, X., Cheng, D., Zhang, Z., Lin, S., Dai, J.: An empirical study of spatial attention mechanisms in deep networks. In: Proceedings of the IEEE\/CVF international conference on computer vision, pp. 6688\u20136697 (2019)","DOI":"10.1109\/ICCV.2019.00679"},{"key":"3653_CR26","doi-asserted-by":"crossref","unstructured":"Dai, J., Qi, H., Xiong, Y., Li, Y., Zhang, G., Hu, H., Wei, Y.: Deformable convolutional networks. In: Proceedings of the IEEE international conference on computer vision, pp. 764\u2013773 (2017)","DOI":"10.1109\/ICCV.2017.89"},{"key":"3653_CR27","doi-asserted-by":"crossref","unstructured":"Zhu, X., Hu, H., Lin, S., Dai, J.: Deformable convnets v2: more deformable, better results. In: Proceedings of the IEEE\/CVF conference on computer vision and pattern recognition, pp. 9308\u20139316 (2019)","DOI":"10.1109\/CVPR.2019.00953"},{"key":"3653_CR28","unstructured":"Wu, F., Fan, A., Baevski, A., Dauphin, Y.N., Auli, M.: Pay less attention with lightweight and dynamic convolutions. arXiv preprint arXiv:1901.10430 (2019)"},{"key":"3653_CR29","doi-asserted-by":"crossref","unstructured":"Lin, T.-Y., Doll\u00e1r, P., Girshick, R., He, K., Hariharan, B., Belongie, S.: Feature pyramid networks for object detection. In: Proceedings of the IEEE conference on computer vision and pattern recognition, pp. 2117\u20132125 (2017)","DOI":"10.1109\/CVPR.2017.106"},{"key":"3653_CR30","doi-asserted-by":"crossref","unstructured":"Liu, S., Qi, L., Qin, H., Shi, J., Jia, J.: Path aggregation network for instance segmentation. In: Proceedings of the IEEE conference on computer vision and pattern recognition, pp. 8759\u20138768 (2018)","DOI":"10.1109\/CVPR.2018.00913"},{"key":"3653_CR31","doi-asserted-by":"crossref","unstructured":"Kong, T., Sun, F., Tan, C., Liu, H., Huang, W.: Deep feature pyramid reconfiguration for object detection. In: Proceedings of the European conference on computer vision (ECCV), pp. 169\u2013185 (2018)","DOI":"10.1007\/978-3-030-01228-1_11"},{"key":"3653_CR32","doi-asserted-by":"crossref","unstructured":"Zhao, Q., Sheng, T., Wang, Y., Tang, Z., Chen, Y., Cai, L., Ling, H.: M2det: A single-shot object detector based on multi-level feature pyramid network. In: Proceedings of the AAAI conference on artificial intelligence, vol. 33, pp.9259\u20139266 (2019)","DOI":"10.1609\/aaai.v33i01.33019259"},{"key":"3653_CR33","doi-asserted-by":"crossref","unstructured":"Ghiasi, G., Lin, T.-Y., Le, Q.V.: Nas-fpn: Learning scalable feature pyramid architecture for object detection. In: Proceedings of the IEEE\/CVF conference on computer vision and pattern recognition, pp. 7036\u20137045 (2019)","DOI":"10.1109\/CVPR.2019.00720"},{"key":"3653_CR34","doi-asserted-by":"crossref","unstructured":"Xu, H., Yao, L., Zhang, W., Liang, X., Li, Z.: Auto-fpn: Automatic network architecture adaptation for object detection beyond classification. In: Proceedings of the IEEE\/CVF international conference on computer vision, pp. 6649\u20136658 (2019)","DOI":"10.1109\/ICCV.2019.00675"},{"key":"3653_CR35","doi-asserted-by":"crossref","unstructured":"Tan, M., Pang, R., Le, Q.V.: Efficientdet: scalable and efficient object detection. In: Proceedings of the IEEE\/CVF conference on computer vision and pattern recognition, pp. 10781\u201310790 (2020)","DOI":"10.1109\/CVPR42600.2020.01079"},{"key":"3653_CR36","doi-asserted-by":"crossref","unstructured":"Yu, F., Koltun, V., Funkhouser, T.: Dilated residual networks. In: Proceedings of the IEEE conference on computer vision and pattern recognition, pp. 472\u2013480 (2017)","DOI":"10.1109\/CVPR.2017.75"},{"issue":"1","key":"3653_CR37","doi-asserted-by":"publisher","first-page":"163","DOI":"10.1109\/TII.2021.3085669","volume":"18","author":"J Li","year":"2021","unstructured":"Li, J., Chen, J., Sheng, B., Li, P., Yang, P., Feng, D.D., Qi, J.: Automatic detection and classification system of domestic waste via multimodel cascaded convolutional neural network. IEEE Trans. Ind. Inf. 18(1), 163\u2013173 (2021)","journal-title":"IEEE Trans. Ind. Inf."},{"key":"3653_CR38","doi-asserted-by":"publisher","DOI":"10.1016\/j.media.2022.102389","volume":"78","author":"S Dong","year":"2022","unstructured":"Dong, S., Pan, Z., Fu, Y., Yang, Q., Gao, Y., Yu, T., Shi, Y., Zhuo, C.: Deu-net 2.0: enhanced deformable u-net for 3d cardiac cine mri segmentation. Med. Image Anal. 78, 102389 (2022)","journal-title":"Med. Image Anal."},{"key":"3653_CR39","doi-asserted-by":"publisher","first-page":"149","DOI":"10.1016\/j.knosys.2019.04.025","volume":"178","author":"Q Jin","year":"2019","unstructured":"Jin, Q., Meng, Z., Pham, T.D., Chen, Q., Wei, L., Su, R.: Dunet: a deformable network for retinal vessel segmentation. Knowledge-Based Syst. 178, 149\u2013162 (2019)","journal-title":"Knowledge-Based Syst."},{"issue":"11","key":"3653_CR40","doi-asserted-by":"publisher","first-page":"15593","DOI":"10.1007\/s11042-022-12418-w","volume":"81","author":"X Yang","year":"2022","unstructured":"Yang, X., Li, Z., Guo, Y., Zhou, D.: Dcu-net: a deformable convolutional neural network based on cascade u-net for retinal vessel segmentation. Multimed. Tools Appl. 81(11), 15593\u201315607 (2022)","journal-title":"Multimed. Tools Appl."},{"key":"3653_CR41","doi-asserted-by":"publisher","first-page":"3838","DOI":"10.1109\/TIP.2022.3176537","volume":"31","author":"C Zhao","year":"2022","unstructured":"Zhao, C., Zhu, W., Feng, S.: Superpixel guided deformable convolution network for hyperspectral image classification. IEEE Trans. Image Process. 31, 3838\u20133851 (2022)","journal-title":"IEEE Trans. Image Process."},{"key":"3653_CR42","doi-asserted-by":"crossref","unstructured":"Wang, D., Zhang, Z., Zhao, Z., Liu, Y., Chen, Y., Wang, L.: Pointscatter: point set representation for tubular structure extraction. In: European conference on computer vision, pp. 366\u2013383 (2022). Springer","DOI":"10.1007\/978-3-031-19803-8_22"},{"key":"3653_CR43","doi-asserted-by":"publisher","DOI":"10.1016\/j.compmedimag.2019.101688","volume":"80","author":"B Kong","year":"2020","unstructured":"Kong, B., Wang, X., Bai, J., Lu, Y., Gao, F., Cao, K., Xia, J., Song, Q., Yin, Y.: Learning tree-structured representation for 3d coronary artery segmentation. Comput. Med. Imaging Graphics 80, 101688 (2020)","journal-title":"Comput. Med. Imaging Graphics"},{"key":"3653_CR44","doi-asserted-by":"crossref","unstructured":"Jiang, N., Sheng, B., Li, P., Lee, T.-Y.: Photohelper: portrait photographing guidance via deep feature retrieval and fusion. IEEE Trans. Multimed. (2022)","DOI":"10.1109\/TMM.2022.3144890"},{"issue":"1","key":"3653_CR45","doi-asserted-by":"publisher","first-page":"183","DOI":"10.1109\/TMI.2022.3207093","volume":"42","author":"G Zhao","year":"2022","unstructured":"Zhao, G., Liang, K., Pan, C., Zhang, F., Wu, X., Hu, X., Yu, Y.: Graph convolution based cross-network multiscale feature fusion for deep vessel segmentation. IEEE Trans. Med. Imaging 42(1), 183\u2013195 (2022)","journal-title":"IEEE Trans. Med. Imaging"},{"key":"3653_CR46","doi-asserted-by":"crossref","unstructured":"Li, Y., Zhang, Y., Liu, J.-Y., Wang, K., Zhang, K., Zhang, G.-S., Liao, X.-F., Yang, G.: Global transformer and dual local attention network via deep-shallow hierarchical feature fusion for retinal vessel segmentation. IEEE Trans. Cybern. (2022)","DOI":"10.1109\/TCYB.2022.3194099"},{"key":"3653_CR47","doi-asserted-by":"crossref","unstructured":"Zhang, X., Zhang, J., Ma, L., Xue, P., Hu, Y., Wu, D., Zhan, Y., Feng, J., Shen, D.: Progressive deep segmentation of coronary artery via hierarchical topology learning. In: International conference on medical image computing and computer-assisted intervention, pp. 391\u2013400 (2022). Springer","DOI":"10.1007\/978-3-031-16443-9_38"},{"key":"3653_CR48","doi-asserted-by":"crossref","unstructured":"Qi, X., Yang, G., He, Y., Liu, W., Islam, A., Li, S.: Contrastive re-localization and history distillation in federated cmr segmentation. In: International conference on medical image computing and computer-assisted intervention, pp. 256\u2013265 (2022). Springer","DOI":"10.1007\/978-3-031-16443-9_25"},{"issue":"5","key":"3653_CR49","doi-asserted-by":"publisher","first-page":"2264","DOI":"10.1109\/JBHI.2021.3122581","volume":"26","author":"X Qi","year":"2021","unstructured":"Qi, X., He, Y., Yang, G., Chen, Y., Yang, J., Liu, W., Zhu, Y., Xu, Y., Shu, H., Li, S.: Mvsgan: Spatial-aware multi-view cmr fusion for accurate 3d left ventricular myocardium segmentation. IEEE J. Biomed. Health Inf. 26(5), 2264\u20132275 (2021)","journal-title":"IEEE J. Biomed. Health Inf."},{"key":"3653_CR50","doi-asserted-by":"publisher","first-page":"261","DOI":"10.1007\/s11263-019-01247-4","volume":"128","author":"L Liu","year":"2020","unstructured":"Liu, L., Ouyang, W., Wang, X., Fieguth, P., Chen, J., Liu, X., Pietik\u00e4inen, M.: Deep learning for generic object detection: a survey. Int. J. Comput. Vision 128, 261\u2013318 (2020)","journal-title":"Int. J. Comput. Vision"},{"key":"3653_CR51","unstructured":"Wang, A., Chen, H., Liu, L., Chen, K., Lin, Z., Han, J., Ding, G.: Yolov10: real-time end-to-end object detection. arXiv preprint arXiv:2405.14458 (2024)"},{"key":"3653_CR52","doi-asserted-by":"crossref","unstructured":"Varghese, R., Sambath, M.: Yolov8: a novel object detection algorithm with enhanced performance and robustness. In: 2024 International conference on advances in data engineering and intelligent computing systems (ADICS), pp. 1\u20136 (2024). IEEE","DOI":"10.1109\/ADICS58448.2024.10533619"},{"key":"3653_CR53","unstructured":"Ge, Z., Liu, S., Wang, F., Li, Z., Sun, J.: Yolox: Exceeding yolo series in 2021. arXiv preprint arXiv:2107.08430 (2021)"},{"key":"3653_CR54","unstructured":"Wang, C., He, W., Nie, Y., Guo, J., Liu, C., Wang, Y., Han, K.: Gold-yolo: Efficient object detector via gather-and-distribute mechanism. Adv. Neural Inf. Process. Syst. 36 (2024)"}],"container-title":["The Visual Computer"],"original-title":[],"language":"en","link":[{"URL":"https:\/\/link.springer.com\/content\/pdf\/10.1007\/s00371-024-03653-3.pdf","content-type":"application\/pdf","content-version":"vor","intended-application":"text-mining"},{"URL":"https:\/\/link.springer.com\/article\/10.1007\/s00371-024-03653-3\/fulltext.html","content-type":"text\/html","content-version":"vor","intended-application":"text-mining"},{"URL":"https:\/\/link.springer.com\/content\/pdf\/10.1007\/s00371-024-03653-3.pdf","content-type":"application\/pdf","content-version":"vor","intended-application":"similarity-checking"}],"deposited":{"date-parts":[[2025,4,16]],"date-time":"2025-04-16T10:20:49Z","timestamp":1744798849000},"score":1,"resource":{"primary":{"URL":"https:\/\/link.springer.com\/10.1007\/s00371-024-03653-3"}},"subtitle":[],"short-title":[],"issued":{"date-parts":[[2024,9,25]]},"references-count":54,"journal-issue":{"issue":"6","published-print":{"date-parts":[[2025,4]]}},"alternative-id":["3653"],"URL":"https:\/\/doi.org\/10.1007\/s00371-024-03653-3","relation":{},"ISSN":["0178-2789","1432-2315"],"issn-type":[{"value":"0178-2789","type":"print"},{"value":"1432-2315","type":"electronic"}],"subject":[],"published":{"date-parts":[[2024,9,25]]},"assertion":[{"value":"9 September 2024","order":1,"name":"accepted","label":"Accepted","group":{"name":"ArticleHistory","label":"Article History"}},{"value":"25 September 2024","order":2,"name":"first_online","label":"First Online","group":{"name":"ArticleHistory","label":"Article History"}},{"order":1,"name":"Ethics","group":{"name":"EthicsHeading","label":"Declarations"}},{"value":"The authors declare that they have no conflict of interest.","order":2,"name":"Ethics","group":{"name":"EthicsHeading","label":"Conflict of interest"}},{"value":"Not applicable.","order":3,"name":"Ethics","group":{"name":"EthicsHeading","label":"Ethics approval and consent to participate"}}]}}