{"status":"ok","message-type":"work","message-version":"1.0.0","message":{"indexed":{"date-parts":[[2026,3,20]],"date-time":"2026-03-20T00:05:26Z","timestamp":1773965126060,"version":"3.50.1"},"reference-count":31,"publisher":"Springer Science and Business Media LLC","issue":"14","license":[{"start":{"date-parts":[[2023,10,16]],"date-time":"2023-10-16T00:00:00Z","timestamp":1697414400000},"content-version":"tdm","delay-in-days":0,"URL":"https:\/\/www.springernature.com\/gp\/researchers\/text-and-data-mining"},{"start":{"date-parts":[[2023,10,16]],"date-time":"2023-10-16T00:00:00Z","timestamp":1697414400000},"content-version":"vor","delay-in-days":0,"URL":"https:\/\/www.springernature.com\/gp\/researchers\/text-and-data-mining"}],"funder":[{"DOI":"10.13039\/501100001809","name":"National Natural Science Foundation of China","doi-asserted-by":"publisher","award":["No.\u00a061602161"],"award-info":[{"award-number":["No.\u00a061602161"]}],"id":[{"id":"10.13039\/501100001809","id-type":"DOI","asserted-by":"publisher"}]},{"DOI":"10.13039\/501100001809","name":"National Natural Science Foundation of China","doi-asserted-by":"publisher","award":["61772180"],"award-info":[{"award-number":["61772180"]}],"id":[{"id":"10.13039\/501100001809","id-type":"DOI","asserted-by":"publisher"}]},{"name":"Hubei Province Science and Technology Support Project","award":["No:2020BAB012"],"award-info":[{"award-number":["No:2020BAB012"]}]},{"name":"The\u00a0Fundamental\u00a0Research\u00a0Funds\u00a0for\u00a0the\u00a0Research\u00a0Fund\u00a0of\u00a0Hubei\u00a0University\u00a0of\u00a0Technology","award":["HBUT:\u00a02021046"],"award-info":[{"award-number":["HBUT:\u00a02021046"]}]},{"name":"The\u00a0Fundamental\u00a0Research\u00a0Funds\u00a0for\u00a0the\u00a0Research\u00a0Fund\u00a0of\u00a0Hubei\u00a0University\u00a0of\u00a0Technology","award":["21060"],"award-info":[{"award-number":["21060"]}]},{"name":"The\u00a0Fundamental\u00a0Research\u00a0Funds\u00a0for\u00a0the\u00a0Research\u00a0Fund\u00a0of\u00a0Hubei\u00a0University\u00a0of\u00a0Technology","award":["21066"],"award-info":[{"award-number":["21066"]}]}],"content-domain":{"domain":["link.springer.com"],"crossmark-restriction":false},"short-container-title":["Multimed Tools Appl"],"DOI":"10.1007\/s11042-023-17373-8","type":"journal-article","created":{"date-parts":[[2023,10,16]],"date-time":"2023-10-16T07:02:16Z","timestamp":1697439736000},"page":"42189-42206","update-policy":"https:\/\/doi.org\/10.1007\/springer_crossmark_policy","source":"Crossref","is-referenced-by-count":5,"title":["Strategies for inserting attention in computer vision"],"prefix":"10.1007","volume":"83","author":[{"given":"Jun","family":"Wu","sequence":"first","affiliation":[],"role":[{"role":"author","vocabulary":"crossref"}]},{"given":"Xin","family":"Liu","sequence":"additional","affiliation":[],"role":[{"role":"author","vocabulary":"crossref"}]},{"ORCID":"https:\/\/orcid.org\/0000-0001-7805-3100","authenticated-orcid":false,"given":"Jiaming","family":"Dong","sequence":"additional","affiliation":[],"role":[{"role":"author","vocabulary":"crossref"}]}],"member":"297","published-online":{"date-parts":[[2023,10,16]]},"reference":[{"issue":"3","key":"17373_CR1","doi-asserted-by":"publisher","first-page":"194","DOI":"10.1038\/35058500","volume":"2","author":"L Itti","year":"2001","unstructured":"Itti L, Koch C (2001) Computational modelling of visual attention[J]. Nat Rev Neurosci 2(3):194\u2013203","journal-title":"Nat Rev Neurosci"},{"key":"17373_CR2","doi-asserted-by":"crossref","unstructured":"Zhang Q, Wu YN, Zhu SC (2018) Interpretable convolutional neural networks. Proceedings of the IEEE conference on computer vision and pattern recognition(CVPR). pp. 8827\u20138836.\u00a0https:\/\/openaccess.thecvf.com\/content_cvpr_2018\/html\/Zhang_Interpretable_Convolutional_Neural_CVPR_2018_paper.html","DOI":"10.1109\/CVPR.2018.00920"},{"issue":"6","key":"17373_CR3","doi-asserted-by":"publisher","first-page":"1245","DOI":"10.1109\/TMM.2017.2648498","volume":"19","author":"B Zhao","year":"2017","unstructured":"Zhao B, Wu X, Feng J et al (2017) Diversified visual attention networks for fine-grained object classification[J]. IEEE Trans Multimedia 19(6):1245\u20131256","journal-title":"IEEE Trans Multimedia"},{"key":"17373_CR4","doi-asserted-by":"crossref","unstructured":"Wang F, Jiang M, Qian C et al (2017) Residual attention network for image classification. Proceedings of the IEEE conference on computer vision and pattern recognition (CVPR). pp. 3156\u20133164.\u00a0https:\/\/openaccess.thecvf.com\/content_cvpr_2017\/html\/Wang_Residual_Attention_Network_CVPR_2017_paper.html","DOI":"10.1109\/CVPR.2017.683"},{"key":"17373_CR5","doi-asserted-by":"publisher","first-page":"104179","DOI":"10.1016\/j.imavis.2021.104179","volume":"110","author":"D Cores","year":"2021","unstructured":"Cores D, Brea VM, Mucientes M (2021) Short-term anchor linking and long-term self-guided attention for video object detection[J]. Image Vis Comput 110:104179","journal-title":"Image Vis Comput"},{"key":"17373_CR6","doi-asserted-by":"publisher","first-page":"126","DOI":"10.1016\/j.cag.2020.06.001","volume":"90","author":"Z Hu","year":"2020","unstructured":"Hu Z, Zhang D, Li S et al (2020) Attention-based relation and context modeling for point cloud semantic segmentation[J]. Comput Graph 90:126\u2013134","journal-title":"Comput Graph"},{"key":"17373_CR7","doi-asserted-by":"publisher","first-page":"11","DOI":"10.1016\/j.cag.2020.05.003","volume":"90","author":"C Li","year":"2020","unstructured":"Li C, Tan Y, Chen W et al (2020) ANU-Net: Attention-based Nested U-Net to exploit full resolution features for medical image segmentation[J]. Comput Graph 90:11\u201320","journal-title":"Comput Graph"},{"key":"17373_CR8","doi-asserted-by":"publisher","first-page":"104120","DOI":"10.1016\/j.imavis.2021.104120","volume":"108","author":"K Zhou","year":"2021","unstructured":"Zhou K, Hui B, Wang J et al (2021) A study on attention-based LSTM for abnormal behavior recognition with variable pooling[J]. Image Vis Comput 108:104120","journal-title":"Image Vis Comput"},{"issue":"6","key":"17373_CR9","doi-asserted-by":"publisher","first-page":"1245","DOI":"10.1109\/TMM.2017.2648498","volume":"19","author":"B Zhao","year":"2017","unstructured":"Zhao B et al (2017) Diversified visual attention networks for fine-grained object classification. IEEE Trans Multimed 19(6):1245\u20131256","journal-title":"IEEE Trans Multimed"},{"key":"17373_CR10","unstructured":"Jaderberg M, Simonyan K, Zisserman A (2015) Spatial transformer networks[J]. Advances in neural information processing systems, 28.\u00a0https:\/\/proceedings.neurips.cc\/paper_files\/paper\/2015\/hash\/33ceb07bf4eeb3da587e268d663aba1a-Abstract.html"},{"key":"17373_CR11","unstructured":"Mai J, Xu X, Xiao G et al (2020) PGCA-Net: Progressively Aggregating Hierarchical Features with the Pyramid Guided Channel Attention for Saliency Detection[J]. Intelligent Automation & Soft Computing, 2020, 26(4).\u00a0https:\/\/pdfs.semanticscholar.org\/19aa\/a2d3dbf49005ae598f5f8cd7dc34fecb861a.pdf"},{"issue":"3","key":"17373_CR12","doi-asserted-by":"publisher","first-page":"331","DOI":"10.1007\/s41095-022-0271-y","volume":"8","author":"MH Guo","year":"2022","unstructured":"Guo MH, Xu TX, Liu JJ et al (2022) Attention mechanisms in computer vision: A survey[J]. Comput Vis Media 8(3):331\u2013368","journal-title":"Comput Vis Media"},{"key":"17373_CR13","unstructured":"Mnih V, Heess N, Graves A (2014) Recurrent models of visual attention. Advances in neural information processing systems, 27.\u00a0https:\/\/proceedings.neurips.cc\/paper_files\/paper\/2014\/hash\/09c6c3783b4a70054da74f2538ed47c6-Abstract.html"},{"key":"17373_CR14","doi-asserted-by":"crossref","unstructured":"Hu J, Shen L, Sun G (2018) Squeeze-and-excitation networks. Proceedings of the IEEE conference on computer vision and pattern recognition(CVPR). pp. 7132\u20137141.\u00a0https:\/\/openaccess.thecvf.com\/content_cvpr_2018\/html\/Hu_Squeeze-and-Excitation_Networks_CVPR_2018_paper.html","DOI":"10.1109\/CVPR.2018.00745"},{"key":"17373_CR15","doi-asserted-by":"crossref","unstructured":"Woo S, Park J, Lee JY et al (2018) Cbam: Convolutional block attention module. Proceedings of the European conference on computer vision (ECCV). pp. 3\u201319.\u00a0https:\/\/openaccess.thecvf.com\/content_ECCV_2018\/html\/Sanghyun_Woo_Convolutional_Block_Attention_ECCV_2018_paper.html","DOI":"10.1007\/978-3-030-01234-2_1"},{"key":"17373_CR16","doi-asserted-by":"crossref","unstructured":"Hou Q, Zhou D, Feng J (2021) Coordinate attention for efficient mobile network design. Proceedings of the IEEE\/CVF conference on computer vision and pattern recognition(CVPR). pp. 13713\u201313722.\u00a0https:\/\/openaccess.thecvf.com\/content\/CVPR2021\/html\/Hou_Coordinate_Attention_for_Efficient_Mobile_Network_Design_CVPR_2021_paper.html","DOI":"10.1109\/CVPR46437.2021.01350"},{"key":"17373_CR17","doi-asserted-by":"crossref","unstructured":"Yang L, Zhong J, Zhang Y et al (2022) An Improving Faster-RCNN With Multi-Attention ResNet for Small Target Detection in Intelligent Autonomous Transport With 6G. in IEEE Transactions on Intelligent Transportation Systems, vol. 24, no. 7, pp. 7717-7725.\u00a0https:\/\/ieeexplore.ieee.org\/abstract\/document\/9847011","DOI":"10.1109\/TITS.2022.3193909"},{"issue":"5","key":"17373_CR18","doi-asserted-by":"publisher","first-page":"7567","DOI":"10.1007\/s11042-022-13251-x","volume":"82","author":"Y Li","year":"2023","unstructured":"Li Y, Li J, Meng P (2023) Attention-YOLOV4: a real-time and high-accurate traffic sign detection algorithm[J]. Multimedia Tools Appl 82(5):7567\u20137582","journal-title":"Multimedia Tools Appl"},{"issue":"21","key":"17373_CR19","doi-asserted-by":"publisher","first-page":"8577","DOI":"10.3390\/s22218577","volume":"22","author":"J Yao","year":"2022","unstructured":"Yao J, Fan X, Li B et al (2022) Adverse weather target detection algorithm based on adaptive color levels and improved YOLOv5[J]. Sensors 22(21):8577","journal-title":"Sensors"},{"issue":"22","key":"17373_CR20","doi-asserted-by":"publisher","first-page":"3735","DOI":"10.3390\/electronics11223735","volume":"11","author":"J Shi","year":"2022","unstructured":"Shi J, Yang J, Zhang Y (2022) Research on steel surface defect detection based on YOLOv5 with attention mechanism[J]. Electronics 11(22):3735","journal-title":"Electronics"},{"issue":"1","key":"17373_CR21","doi-asserted-by":"publisher","first-page":"2155614","DOI":"10.1080\/09540091.2022.2155614","volume":"35","author":"J Wu","year":"2023","unstructured":"Wu J, Zhu J, Tong X et al (2023) Dynamic activation and enhanced image contour features for object detection[J]. Connect Sci 35(1):2155614","journal-title":"Connect Sci"},{"issue":"1","key":"17373_CR22","doi-asserted-by":"publisher","first-page":"98","DOI":"10.1007\/s11263-014-0733-5","volume":"111","author":"M Everingham","year":"2015","unstructured":"Everingham M, Eslami SM, Van Gool L et al (2015) The pascal visual object classes challenge: a retrospective[J]. Int J Comput Vision 111(1):98\u2013136","journal-title":"Int J Comput Vision"},{"issue":"1","key":"17373_CR23","first-page":"1","volume":"14","author":"Z Zheng","year":"2017","unstructured":"Zheng Z, Zheng L, Yang Y (2017) A discriminatively learned cnn embedding for person reidentification[J]. ACM Trans Multimed Comput, Commun, Appl (TOMM) 14(1):1\u201320","journal-title":"ACM Trans Multimed Comput, Commun, Appl (TOMM)"},{"issue":"1s","key":"17373_CR24","first-page":"1","volume":"16","author":"M Tanveer","year":"2020","unstructured":"Tanveer M, Richhariya B, Khan RU et al (2020) Machine learning techniques for the diagnosis of Alzheimer\u2019s disease: a review[J]. ACM Trans Multimedia Comput, Commun, Appl (TOMM) 16(1s):1\u201335","journal-title":"ACM Trans Multimedia Comput, Commun, Appl (TOMM)"},{"key":"17373_CR25","doi-asserted-by":"crossref","unstructured":"Zheng Z, Ye R, Wang P et al (2022) Localization Distillation for Dense Object Detection. Proceedings of the IEEE\/CVF Conference on Computer Vision and Pattern Recognition(CVPR). pp. 9407\u20139416.\u00a0https:\/\/openaccess.thecvf.com\/content\/CVPR2022\/html\/Zheng_Localization_Distillation_for_Dense_Object_Detection_CVPR_2022_paper.html","DOI":"10.1109\/CVPR52688.2022.00919"},{"key":"17373_CR26","doi-asserted-by":"crossref","unstructured":"Joseph KJ, Khan S, Khan FS et al (2021) Towards open world object detection. Proceedings of the IEEE\/CVF Conference on Computer Vision and Pattern Recognition(CVPR) 5830\u20135840.\u00a0https:\/\/openaccess.thecvf.com\/content\/CVPR2021\/html\/Joseph_Towards_Open_World_Object_Detection_CVPR_2021_paper.html","DOI":"10.1109\/CVPR46437.2021.00577"},{"key":"17373_CR27","doi-asserted-by":"crossref","unstructured":"Chen Q, Wang Y, Yang T et al (2021) You only look one-level feature. Proceedings of the IEEE\/CVF conference on computer vision and pattern recognition(CVPR). pp 13039\u201313048.\u00a0https:\/\/openaccess.thecvf.com\/content\/CVPR2021\/html\/Chen_You_Only_Look_One-Level_Feature_CVPR_2021_paper.html","DOI":"10.1109\/CVPR46437.2021.01284"},{"issue":"1","key":"17373_CR28","doi-asserted-by":"publisher","first-page":"3","DOI":"10.1145\/1198302.1198305","volume":"3","author":"BT Truong","year":"2007","unstructured":"Truong BT, Venkatesh S (2007) Video abstraction: A systematic review and classification[J]. ACM Trans Multimed Comput, Commun, Appl (TOMM) 3(1):3-es","journal-title":"ACM Trans Multimed Comput, Commun, Appl (TOMM)"},{"key":"17373_CR29","doi-asserted-by":"publisher","first-page":"28347","DOI":"10.1007\/s11042-022-12715-4","volume":"81","author":"M Othmani","year":"2022","unstructured":"Othmani M (2022) A vehicle detection and tracking method for traffic video based on faster R-CNN. Multimed Tools Appl 81:28347\u201328365.\u00a0https:\/\/link.springer.com\/article\/10.1007\/s11042-022-12715-4","journal-title":"Multimed Tools Appl"},{"issue":"3","key":"17373_CR30","doi-asserted-by":"publisher","first-page":"1746","DOI":"10.3390\/app13031746","volume":"13","author":"J Wu","year":"2023","unstructured":"Wu J, Dong J, Nie W et al (2023) A lightweight YOLOv5 optimization of coordinate attention[J]. Appl Sci 13(3):1746","journal-title":"Appl Sci"},{"issue":"4","key":"17373_CR31","doi-asserted-by":"publisher","first-page":"4797","DOI":"10.1007\/s11042-021-11138-x","volume":"81","author":"S Pang","year":"2022","unstructured":"Pang S, Chen Z, Yin F (2022) Lightweight multi-scale aggregated residual attention networks for image super-resolution[J]. Multimed Tools Appl 81(4):4797\u20134819","journal-title":"Multimed Tools Appl"}],"container-title":["Multimedia Tools and Applications"],"original-title":[],"language":"en","link":[{"URL":"https:\/\/link.springer.com\/content\/pdf\/10.1007\/s11042-023-17373-8.pdf","content-type":"application\/pdf","content-version":"vor","intended-application":"text-mining"},{"URL":"https:\/\/link.springer.com\/article\/10.1007\/s11042-023-17373-8\/fulltext.html","content-type":"text\/html","content-version":"vor","intended-application":"text-mining"},{"URL":"https:\/\/link.springer.com\/content\/pdf\/10.1007\/s11042-023-17373-8.pdf","content-type":"application\/pdf","content-version":"vor","intended-application":"similarity-checking"}],"deposited":{"date-parts":[[2024,4,4]],"date-time":"2024-04-04T13:53:37Z","timestamp":1712238817000},"score":1,"resource":{"primary":{"URL":"https:\/\/link.springer.com\/10.1007\/s11042-023-17373-8"}},"subtitle":[],"short-title":[],"issued":{"date-parts":[[2023,10,16]]},"references-count":31,"journal-issue":{"issue":"14","published-online":{"date-parts":[[2024,4]]}},"alternative-id":["17373"],"URL":"https:\/\/doi.org\/10.1007\/s11042-023-17373-8","relation":{},"ISSN":["1573-7721"],"issn-type":[{"value":"1573-7721","type":"electronic"}],"subject":[],"published":{"date-parts":[[2023,10,16]]},"assertion":[{"value":"26 June 2022","order":1,"name":"received","label":"Received","group":{"name":"ArticleHistory","label":"Article History"}},{"value":"18 May 2023","order":2,"name":"revised","label":"Revised","group":{"name":"ArticleHistory","label":"Article History"}},{"value":"1 October 2023","order":3,"name":"accepted","label":"Accepted","group":{"name":"ArticleHistory","label":"Article History"}},{"value":"16 October 2023","order":4,"name":"first_online","label":"First Online","group":{"name":"ArticleHistory","label":"Article History"}},{"order":1,"name":"Ethics","group":{"name":"EthicsHeading","label":"Declarations"}},{"value":"The authors declare that there is no conflict of interest.","order":2,"name":"Ethics","group":{"name":"EthicsHeading","label":"Competing interests"}}]}}