{"status":"ok","message-type":"work","message-version":"1.0.0","message":{"indexed":{"date-parts":[[2026,3,2]],"date-time":"2026-03-02T00:16:31Z","timestamp":1772410591114,"version":"3.50.1"},"reference-count":69,"publisher":"Springer Science and Business Media LLC","issue":"4","license":[{"start":{"date-parts":[[2024,7,17]],"date-time":"2024-07-17T00:00:00Z","timestamp":1721174400000},"content-version":"tdm","delay-in-days":0,"URL":"https:\/\/www.springernature.com\/gp\/researchers\/text-and-data-mining"},{"start":{"date-parts":[[2024,7,17]],"date-time":"2024-07-17T00:00:00Z","timestamp":1721174400000},"content-version":"vor","delay-in-days":0,"URL":"https:\/\/www.springernature.com\/gp\/researchers\/text-and-data-mining"}],"funder":[{"DOI":"10.13039\/501100001809","name":"National Natural Science Foundation of China","doi-asserted-by":"crossref","award":["U22A2012, 62173098, 62104047"],"award-info":[{"award-number":["U22A2012, 62173098, 62104047"]}],"id":[{"id":"10.13039\/501100001809","id-type":"DOI","asserted-by":"crossref"}]},{"name":"Guangdong Provincial Key Laboratory of Cyber-Physical System","award":["2020B1212060069"],"award-info":[{"award-number":["2020B1212060069"]}]}],"content-domain":{"domain":["link.springer.com"],"crossmark-restriction":false},"short-container-title":["Multimedia Systems"],"published-print":{"date-parts":[[2024,8]]},"DOI":"10.1007\/s00530-024-01410-z","type":"journal-article","created":{"date-parts":[[2024,7,17]],"date-time":"2024-07-17T09:01:55Z","timestamp":1721206915000},"update-policy":"https:\/\/doi.org\/10.1007\/springer_crossmark_policy","source":"Crossref","is-referenced-by-count":19,"title":["Underwater small and occlusion object detection with feature fusion and global context decoupling head-based YOLO"],"prefix":"10.1007","volume":"30","author":[{"given":"Lei","family":"Deng","sequence":"first","affiliation":[]},{"given":"Shaojuan","family":"Luo","sequence":"additional","affiliation":[]},{"given":"Chunhua","family":"He","sequence":"additional","affiliation":[]},{"given":"Huapan","family":"Xiao","sequence":"additional","affiliation":[]},{"given":"Heng","family":"Wu","sequence":"additional","affiliation":[]}],"member":"297","published-online":{"date-parts":[[2024,7,17]]},"reference":[{"issue":"9","key":"1410_CR1","doi-asserted-by":"publisher","first-page":"959","DOI":"10.3390\/electronics8090959","volume":"8","author":"L Qi","year":"2019","unstructured":"Qi, L., Li, B., Chen, L., Wang, W., Dong, L., Jia, X., Huang, J., Ge, C., Xue, G., Wang, D.: Ship target detection algorithm based on improved faster R-CNN. Electronics 8(9), 959 (2019)","journal-title":"Electronics"},{"key":"1410_CR2","doi-asserted-by":"crossref","unstructured":"Yang, P., Yu, Y., Yao, P.: An Automatic Detection System for Marine Ranch Biological Targets Based on Deep Learning. In: 2021 3rd International Conference on Machine Learning, Big Data and Business Intelligence (MLBDBI), pp. 696\u2013699. IEEE (2021)","DOI":"10.1109\/MLBDBI54094.2021.00137"},{"issue":"9","key":"1410_CR3","doi-asserted-by":"publisher","first-page":"3335","DOI":"10.3390\/s22093335","volume":"22","author":"R Chen","year":"2022","unstructured":"Chen, R., Li, T., Memon, I., Shi, Y., Ullah, I., Memon, S.A.: Multi-sonar distributed fusion for target detection and tracking in marine environment. Sensors 22(9), 3335 (2022)","journal-title":"Sensors"},{"issue":"3","key":"1410_CR4","doi-asserted-by":"publisher","first-page":"677","DOI":"10.3390\/jmse11030677","volume":"11","author":"K Liu","year":"2023","unstructured":"Liu, K., Sun, Q., Sun, D., Peng, L., Yang, M., Wang, N.: Underwater target detection based on improved YOLOv7. J. Mar. Sci. Eng. 11(3), 677 (2023)","journal-title":"J. Mar. Sci. Eng."},{"key":"1410_CR5","unstructured":"Eken, \u0130.C., \u00c7etin, Y.Y.: Underwater target detection with hyperspectral imagery for search and rescue missions. In: Algorithms and Technologies for Multispectral"},{"key":"1410_CR6","doi-asserted-by":"publisher","first-page":"759","DOI":"10.1016\/j.procs.2020.01.015","volume":"165","author":"R Priyadharsini","year":"2019","unstructured":"Priyadharsini, R., Sharmila, T.S.: Object detection in underwater acoustic images using edge based segmentation method. Procedia Comput. Sci. 165, 759\u2013765 (2019)","journal-title":"Procedia Comput. Sci."},{"issue":"4","key":"1410_CR7","first-page":"293","volume":"224","author":"Y Petillot","year":"2010","unstructured":"Petillot, Y., Maurelli, F., Valeyrie, N., Mallios, A., Ridao, P., Aulinas, J., Salvi, J.: Acoustic-based techniques for autonomous underwater vehicle localization. Proc. Inst. Mech. Eng. Part M: J. Eng. Marit. Environ. 224(4), 293\u2013307 (2010)","journal-title":"Proc. Inst. Mech. Eng. Part M: J. Eng. Marit. Environ."},{"key":"1410_CR8","doi-asserted-by":"publisher","DOI":"10.1016\/j.comnet.2020.107447","volume":"181","author":"Y Bai","year":"2020","unstructured":"Bai, Y., Lu, L., Cheng, J., Liu, J., Chen, Y., Yu, J.: Acoustic-based sensing and applications: a survey. Comput. Netw. 181, 107447 (2020)","journal-title":"Comput. Netw."},{"issue":"2","key":"1410_CR9","doi-asserted-by":"publisher","first-page":"1437","DOI":"10.1109\/TETCI.2024.3349464","volume":"8","author":"J Zhang","year":"2024","unstructured":"Zhang, J., Lv, Y., Tao, J., Huang, F., Zhang, J.: A robust real-time anchor-free traffic sign detector with one-level feature. IEEE Trans. Emerg. Top. Comput. Intell. 8(2), 1437\u20131451 (2024)","journal-title":"IEEE Trans. Emerg. Top. Comput. Intell."},{"key":"1410_CR10","doi-asserted-by":"publisher","first-page":"5","DOI":"10.22967\/HCIS.2022.12.023","volume":"7","author":"J Zhang","year":"2022","unstructured":"Zhang, J., Zou, X., Kuang, L., Wang, J., Sherratt, R.S., Yu, X.: CCTSDB a more comprehensive traffic sign detection benchmark. Human-Centric Comput. Inf. Sci. 7, 5 (2022). https:\/\/doi.org\/10.22967\/HCIS.2022.12.023","journal-title":"Human-Centric Comput. Inf. Sci."},{"key":"1410_CR11","doi-asserted-by":"publisher","first-page":"85","DOI":"10.1016\/j.neunet.2023.12.008","volume":"171","author":"X Kong","year":"2024","unstructured":"Kong, X., Yu, F., Yao, W., Cai, S., Zhang, J., Lin, H.: Memristor-induced hyperchaos, multiscroll and extreme multistability in fractional-order HNN: Image encryption and FPGA implementation. Neural Netw. 171, 85\u2013103 (2024)","journal-title":"Neural Netw."},{"key":"1410_CR12","doi-asserted-by":"publisher","DOI":"10.1016\/j.eswa.2023.123111","volume":"245","author":"Y Chen","year":"2024","unstructured":"Chen, Y., Xia, R., Yang, K., Zou, K.: MICU: Image super-resolution via multi-level information compensation and U-net. Expert Syst. Appl. 245, 123111 (2024)","journal-title":"Expert Syst. Appl."},{"issue":"4","key":"1410_CR13","doi-asserted-by":"publisher","first-page":"317","DOI":"10.3233\/AIS-220038","volume":"14","author":"J Zhang","year":"2022","unstructured":"Zhang, J., Zheng, Z., Xie, X., Gui, Y., Kim, G.: ReYOLO: a traffic sign detector based on network reparameterization and features adaptive weighting. J. Ambient Intell. Smart Environ. 14(4), 317\u2013334 (2022)","journal-title":"J. Ambient Intell. Smart Environ."},{"issue":"12","key":"1410_CR14","doi-asserted-by":"publisher","first-page":"4861","DOI":"10.1109\/TCSVT.2019.2963772","volume":"30","author":"R Liu","year":"2020","unstructured":"Liu, R., Fan, X., Zhu, M., Hou, M., Luo, Z.: Real-world underwater enhancement: challenges, benchmarks, and solutions under natural light. IEEE Trans. Circuits Syst. Video Technol. 30(12), 4861\u20134875 (2020)","journal-title":"IEEE Trans. Circuits Syst. Video Technol."},{"key":"1410_CR15","doi-asserted-by":"crossref","unstructured":"Lourens, J. G.: Classification of ships using underwater radiated noise. In: COMSIG 88@ m_Southern African Conference on Communications and Signal Processing. Proceedings, pp. 130\u2013134. IEEE (1988)","DOI":"10.1109\/COMSIG.1988.49315"},{"issue":"4","key":"1410_CR16","doi-asserted-by":"publisher","first-page":"2242","DOI":"10.1121\/1.4920186","volume":"137","author":"Q Meng","year":"2015","unstructured":"Meng, Q., Yang, S.: A wave structure based method for recognition of marine acoustic target signals. J. Acoust. Soc. America 137(4), 2242 (2015)","journal-title":"J. Acoust. Soc. America"},{"issue":"6","key":"1410_CR17","doi-asserted-by":"publisher","first-page":"1738133683","DOI":"10.1177\/1729881420976307","volume":"17","author":"B Teng","year":"2020","unstructured":"Teng, B., Zhao, H.: Underwater target recognition methods based on the framework of deep learning: a survey. Int. J. Adv. Robot. Syst. 17(6), 1738133683 (2020)","journal-title":"Int. J. Adv. Robot. Syst."},{"issue":"3","key":"1410_CR18","doi-asserted-by":"publisher","first-page":"310","DOI":"10.3390\/jmse10030310","volume":"10","author":"F Lei","year":"2022","unstructured":"Lei, F., Tang, F., Li, S.: Underwater target detection algorithm based on improved YOLOv5. J. Mar. Sci. Eng. 10(3), 310 (2022)","journal-title":"J. Mar. Sci. Eng."},{"key":"1410_CR19","doi-asserted-by":"crossref","unstructured":"Moniruzzaman, M., Islam, S.M.S., Bennamoun, M., Lavery, P.: Deep learning on underwater marine object detection: a survey. In: Advanced Concepts for Intelligent Vision Systems: 18th International Conference, ACIVS 2017, Antwerp, Belgium, September 18\u201321, 2017, Proceedings 18, pp. 150\u2013160. Springer (2017)","DOI":"10.1007\/978-3-319-70353-4_13"},{"issue":"6","key":"1410_CR20","doi-asserted-by":"publisher","first-page":"1155","DOI":"10.1007\/s11554-022-01252-w","volume":"19","author":"J Zhang","year":"2022","unstructured":"Zhang, J., Ye, Z.I., Jin, X., Wang, J., Zhang, J.: Real-time traffic sign detection based on multiscale attention and spatial information aggregator. J. Real-Time Image Process. 19(6), 1155\u20131167 (2022)","journal-title":"J. Real-Time Image Process."},{"key":"1410_CR21","doi-asserted-by":"publisher","first-page":"29742","DOI":"10.1109\/ACCESS.2020.2972338","volume":"8","author":"J Zhang","year":"2020","unstructured":"Zhang, J., Xie, Z., Sun, J., Zou, X., Wang, J.: A cascaded R-CNN with multiscale attention and imbalanced samples for traffic sign detection. IEEE Access 8, 29742\u201329754 (2020)","journal-title":"IEEE Access"},{"key":"1410_CR22","doi-asserted-by":"crossref","unstructured":"Liang, X., Song, P.: Excavating roi attention for underwater object detection. In: 2022 IEEE International Conference on Image Processing (ICIP), pp. 2651\u20132655. IEEE (2022)","DOI":"10.1109\/ICIP46576.2022.9897515"},{"key":"1410_CR23","doi-asserted-by":"crossref","unstructured":"Girshick, R., Donahue, J., Darrell, T., Malik, J.: Rich feature hierarchies for accurate object detection and semantic segmentation. In: Proceedings of the IEEE conference on computer vision and pattern recognition, pp. 580\u2013587 (2014)","DOI":"10.1109\/CVPR.2014.81"},{"key":"1410_CR24","doi-asserted-by":"crossref","unstructured":"Girshick, R.: Fast r-cnn. In: Proceedings of the IEEE international conference on computer vision, pp. 1440\u20131448 (2015)","DOI":"10.1109\/ICCV.2015.169"},{"key":"1410_CR25","unstructured":"Ren, S., He, K., Girshick, R., Sun, J.: Faster r-cnn: Towards real-time object detection with region proposal networks. Advances in neural information processing systems 28 (2015)"},{"key":"1410_CR26","doi-asserted-by":"crossref","unstructured":"He, K., Gkioxari, G., Doll\u00e1r, P., Girshick, R.: Mask r-cnn. In: Proceedings of the IEEE international conference on computer vision, pp. 2961\u20132969 (2017)","DOI":"10.1109\/ICCV.2017.322"},{"key":"1410_CR27","doi-asserted-by":"crossref","unstructured":"Cai, Z., Vasconcelos, N.: Cascade r-cnn: Delving into high quality object detection. In: Proceedings of the IEEE conference on computer vision and pattern recognition, pp. 6154\u20136162 (2018)","DOI":"10.1109\/CVPR.2018.00644"},{"key":"1410_CR28","doi-asserted-by":"crossref","unstructured":"Liu, W., Anguelov, D., Erhan, D., Szegedy, C., Reed, S., Fu, C., Berg, A.C.: Ssd: Single shot multibox detector. In: Computer Vision\u2013ECCV 2016: 14th European Conference, Amsterdam, The Netherlands, October 11\u201314, 2016, Proceedings, Part I 14, pp. 21\u201337, Springer (2016)","DOI":"10.1007\/978-3-319-46448-0_2"},{"key":"1410_CR29","doi-asserted-by":"crossref","unstructured":"Redmon, J., Divvala, S., Girshick, R., Farhadi, A.: You only look once: Unified, real-time object detection. In: Proceedings of the IEEE conference on computer vision and pattern recognition, pp. 779\u2013788 (2016)","DOI":"10.1109\/CVPR.2016.91"},{"issue":"5","key":"1410_CR30","doi-asserted-by":"publisher","first-page":"56","DOI":"10.1109\/MCE.2021.3096376","volume":"11","author":"QM Ul Haq","year":"2021","unstructured":"Ul Haq, Q.M., Ruan, S., Haq, M.A., Karam, S., Shieh, J.L., Chondro, P., Gao, D.: An incremental learning of YOLOv3 without catastrophic forgetting for smart city applications. IEEE Consum. Electron. Mag. 11(5), 56\u201363 (2021)","journal-title":"IEEE Consum. Electron. Mag."},{"key":"1410_CR31","doi-asserted-by":"crossref","unstructured":"Wang, C., Bochkovskiy, A., Liao, H.M.: YOLOv7: Trainable bag-of-freebies sets new state-of-the-art for real-time object detectors. In: Proceedings of the IEEE\/CVF Conference on Computer Vision and Pattern Recognition, pp. 7464\u20137475 (2023)","DOI":"10.1109\/CVPR52729.2023.00721"},{"key":"1410_CR32","unstructured":"Ge, Z., Liu, S., Wang, F., Li, Z., Sun, J.: Yolox: Exceeding yolo series in 2021. arXiv preprint arXiv:2107.08430 (2021)"},{"key":"1410_CR33","doi-asserted-by":"publisher","first-page":"249","DOI":"10.1016\/j.neucom.2018.10.089","volume":"391","author":"Z Chen","year":"2020","unstructured":"Chen, Z., Gao, H., Zhang, Z., Zhou, H., Wang, X., Tian, Y.: Underwater salient object detection by combining 2D and 3D visual features. Neurocomputing 391, 249\u2013259 (2020)","journal-title":"Neurocomputing"},{"key":"1410_CR34","unstructured":"Chen, L., Zhou, F., Wang, S., Dong, J., Li, N., Ma, H., Wang, X., Zhou, H.: SWIPENET: Object detection in noisy underwater images, arXiv preprint arXiv:2010.10006 (2020)"},{"key":"1410_CR35","doi-asserted-by":"crossref","unstructured":"Lin, W., Zhong, J., Liu, S., Li, T., Li, G.: Roimix: Proposal-fusion among multiple images for underwater object detection. In: ICASSP 2020\u20132020 IEEE International Conference on Acoustics, Speech and Signal Processing (ICASSP), pp. 2588\u20132592. IEEE (2020)","DOI":"10.1109\/ICASSP40776.2020.9053829"},{"key":"1410_CR36","doi-asserted-by":"crossref","unstructured":"Lin, T., Goyal, P., Girshick, R., He, K., Doll\u00e1r, P.: Focal loss for dense object detection. In: Proceedings of the IEEE international conference on computer vision, pp. 2980\u20132988 (2017)","DOI":"10.1109\/ICCV.2017.324"},{"key":"1410_CR37","doi-asserted-by":"publisher","DOI":"10.1016\/j.oceaneng.2020.108415","volume":"219","author":"W Qiao","year":"2021","unstructured":"Qiao, W., Khishe, M., Ravakhah, S.: Underwater targets classification using local wavelet acoustic pattern and multi-layer perceptron neural network optimized by modified whale optimization algorithm. Ocean Eng. 219, 108415 (2021)","journal-title":"Ocean Eng."},{"key":"1410_CR38","doi-asserted-by":"crossref","unstructured":"Fan, B., Chen, W., Cong, Y., Tian, J.: Dual refinement underwater object detection network. In: Computer Vision\u2013ECCV 2020: 16th European Conference, Glasgow, UK, August 23\u201328, 2020, Proceedings, Part XX 16, pp. 275\u2013291. Springer (2020)","DOI":"10.1007\/978-3-030-58565-5_17"},{"key":"1410_CR39","doi-asserted-by":"publisher","first-page":"150","DOI":"10.1016\/j.neucom.2023.01.088","volume":"530","author":"P Song","year":"2023","unstructured":"Song, P., Li, P., Dai, L., Wang, T., Chen, Z.: Boosting R-CNN: reweighting R-CNN samples by RPN\u2019s error for underwater object detection. Neurocomputing 530, 150\u2013164 (2023)","journal-title":"Neurocomputing"},{"issue":"17","key":"1410_CR40","doi-asserted-by":"publisher","first-page":"14881","DOI":"10.1007\/s00521-022-07264-8","volume":"34","author":"F Xu","year":"2022","unstructured":"Xu, F., Wang, H., Sun, X., Fu, X.: Refined marine object detector with attention-based spatial pyramid pooling networks and bidirectional feature fusion strategy. Neural Comput. Appl. 34(17), 14881\u201314894 (2022)","journal-title":"Neural Comput. Appl."},{"key":"1410_CR41","doi-asserted-by":"publisher","first-page":"3637","DOI":"10.1007\/s00521-020-05217-7","volume":"33","author":"F Xu","year":"2021","unstructured":"Xu, F., Wang, H., Peng, J., Fu, X.: Scale-aware feature pyramid architecture for marine object detection. Neural Comput. Appl. 33, 3637\u20133653 (2021)","journal-title":"Neural Comput. Appl."},{"key":"1410_CR42","doi-asserted-by":"crossref","unstructured":"Qi, S., Du, J., Wu, M., Yi, H., Tang, L., Qian, T., Wang, X.: Underwater small target detection based on deformable convolutional pyramid. In: ICASSP 2022\u20132022 IEEE International Conference on Acoustics, Speech and Signal Processing (ICASSP), pp. 2784\u20132788. IEEE (2022)","DOI":"10.1109\/ICASSP43922.2022.9746575"},{"key":"1410_CR43","first-page":"1","volume":"60","author":"T Zhou","year":"2022","unstructured":"Zhou, T., Si, J., Wang, L., Xu, C., Yu, X.: Automatic detection of underwater small targets using forward-looking sonar images. IEEE Trans. Geosci. Remote Sens. 60, 1\u201312 (2022)","journal-title":"IEEE Trans. Geosci. Remote Sens."},{"key":"1410_CR44","doi-asserted-by":"publisher","DOI":"10.1016\/j.engappai.2021.104190","volume":"100","author":"L Zeng","year":"2021","unstructured":"Zeng, L., Sun, B., Zhu, D.: Underwater target detection based on Faster R-CNN and adversarial occlusion network. Eng. Appl. Artif. Intell. 100, 104190 (2021)","journal-title":"Eng. Appl. Artif. Intell."},{"key":"1410_CR45","doi-asserted-by":"crossref","unstructured":"Chen, L., Liu, Z., Tong, L., Jiang, Z., Wang, S., Dong, J., Zhou, H., Underwater object detection using Invert Multi-Class Adaboost with deep learning. In: 2020 International Joint Conference on Neural Networks (IJCNN), pp. 1\u20138. IEEE (2020)","DOI":"10.1109\/IJCNN48605.2020.9207506"},{"key":"1410_CR46","doi-asserted-by":"crossref","unstructured":"Cai, Z., Fan, Q., Feris, R.S., Vasconcelos, N.: A unified multi-scale deep convolutional neural network for fast object detection. In: Computer Vision\u2013ECCV 2016: 14th European Conference, Amsterdam, The Netherlands, October 11\u201314, 2016, Proceedings, Part IV 14, pp. 354\u2013370. Springer (2016)","DOI":"10.1007\/978-3-319-46493-0_22"},{"key":"1410_CR47","doi-asserted-by":"crossref","unstructured":"Lin, T., Doll\u00e1r, P., Girshick, R., He, K., Hariharan, B., Belongie, S.: Feature pyramid networks for object detection. In: Proceedings of the IEEE conference on computer vision and pattern recognition, pp. 2117\u20132125 (2017)","DOI":"10.1109\/CVPR.2017.106"},{"key":"1410_CR48","doi-asserted-by":"crossref","unstructured":"Liu, S., Qi, L., Qin, H., Shi, J., Jia, J.: Path aggregation network for instance segmentation. In: Proceedings of the IEEE conference on computer vision and pattern recognition, pp. 8759\u20138768 (2018)","DOI":"10.1109\/CVPR.2018.00913"},{"issue":"4","key":"1410_CR49","doi-asserted-by":"publisher","first-page":"834","DOI":"10.1109\/TPAMI.2017.2699184","volume":"40","author":"L Chen","year":"2017","unstructured":"Chen, L., Papandreou, G., Kokkinos, I., Murphy, K., Yuille, A.L.: Deeplab: Semantic image segmentation with deep convolutional nets, atrous convolution, and fully connected crfs. IEEE Trans. Pattern Anal. Mach. Intell. 40(4), 834\u2013848 (2017)","journal-title":"IEEE Trans. Pattern Anal. Mach. Intell."},{"key":"1410_CR50","doi-asserted-by":"crossref","unstructured":"Ghiasi, G., Lin, T., Le, Q.V.: Nas-fpn: Learning scalable feature pyramid architecture for object detection. In: Proceedings of the IEEE\/CVF conference on computer vision and pattern recognition, pp. 7036\u20137045 (2019)","DOI":"10.1109\/CVPR.2019.00720"},{"key":"1410_CR51","doi-asserted-by":"crossref","unstructured":"Tan, M., Pang, R., Le, Q.V.: Efficientdet: Scalable and efficient object detection. In: Proceedings of the IEEE\/CVF conference on computer vision and pattern recognition, pp. 10781\u201310790 (2020)","DOI":"10.1109\/CVPR42600.2020.01079"},{"key":"1410_CR52","doi-asserted-by":"crossref","unstructured":"Liu, Y., Wang, Y., Wang, S., Liang, T., Zhao, Q., Tang, Z., Ling, H.: Cbnet: A novel composite backbone network architecture for object detection. In: Proceedings of the AAAI conference on artificial intelligence, pp. 11653\u201311660 (2020)","DOI":"10.1609\/aaai.v34i07.6834"},{"key":"1410_CR53","doi-asserted-by":"crossref","unstructured":"Qiao, S., Chen, L., Yuille, A.: Detectors: Detecting objects with recursive feature pyramid and switchable atrous convolution. In: Proceedings of the IEEE\/CVF conference on computer vision and pattern recognition, pp. 10213\u201310224 (2021)","DOI":"10.1109\/CVPR46437.2021.01008"},{"key":"1410_CR54","unstructured":"Liu, S., Huang, D., Wang, Y.: Learning spatial fusion for single-shot object detection, arXiv preprint arXiv:1911.09516 (2019)"},{"key":"1410_CR55","doi-asserted-by":"crossref","unstructured":"Carion, N., Massa, F., Synnaeve, G., Usunier, N., Kirillov, A., Zagoruyko, S.: End-to-end object detection with transformers. In: European conference on computer vision, pp. 213\u2013229. Springer (2020)","DOI":"10.1007\/978-3-030-58452-8_13"},{"key":"1410_CR56","unstructured":"Li, C., Li, L., Jiang, H., Weng, K., Geng, Y., Li, L., Ke, Z., Li, Q., Cheng, M., Nie, W.: YOLOv6: A single-stage object detection framework for industrial applications, arXiv preprint arXiv:2209.02976 (2022)"},{"key":"1410_CR57","unstructured":"Bochkovskiy, A., Wang, C., Liao, H.M.: Yolov4: Optimal speed and accuracy of object detection, arXiv preprint arXiv:2004.10934 (2020)"},{"key":"1410_CR58","doi-asserted-by":"crossref","unstructured":"Wang, C., Liao, H.M., Wu, Y., Chen, P., Hsieh, J., Yeh, I.: CSPNet: A new backbone that can enhance learning capability of CNN. In: Proceedings of the IEEE\/CVF conference on computer vision and pattern recognition workshops, pp. 390\u2013391 (2020)","DOI":"10.1109\/CVPRW50498.2020.00203"},{"key":"1410_CR59","doi-asserted-by":"crossref","unstructured":"Woo, S., Park, J., Lee, J., Kweon, I.S.: Cbam: Convolutional block attention module. In: Proceedings of the European conference on computer vision (ECCV), pp. 3\u201319 (2018)","DOI":"10.1007\/978-3-030-01234-2_1"},{"issue":"3","key":"1410_CR60","doi-asserted-by":"publisher","first-page":"1415","DOI":"10.1007\/s00371-023-02858-2","volume":"40","author":"X Shen","year":"2023","unstructured":"Shen, X., Wang, H., Cui, T., Guo, Z., Fu, X.: Multiple information perception-based attention in YOLO for underwater object detection. Vis. Comput. 40(3), 1415\u20131438 (2023)","journal-title":"Vis. Comput."},{"issue":"7","key":"1410_CR61","doi-asserted-by":"publisher","first-page":"3367","DOI":"10.3390\/s23073367","volume":"23","author":"G Wen","year":"2023","unstructured":"Wen, G., Li, S., Liu, F., Luo, X., Er, M., Mahmud, M., Wu, T.: YOLOv5s-CA: a modified YOLOv5s network with coordinate attention for underwater target detection. Sensors 23(7), 3367 (2023)","journal-title":"Sensors"},{"key":"1410_CR62","doi-asserted-by":"crossref","unstructured":"Ouyang, W., Wei, Y., Wang, D.: YOLOX-DC: A small target detection network up to underwater scenes. In: OCEANS 2022, Hampton Roads, pp. 1\u20136. IEEE (2022)","DOI":"10.1109\/OCEANS47191.2022.9977017"},{"key":"1410_CR63","unstructured":"Vaswani, A., Shazeer, N., Parmar, N., Uszkoreit, J., Jones, L., Gomez, A.N., Kaiser, \u0141., Polosukhin, I.: Attention is all you need. In: Advances in neural information processing systems 30 (2017)"},{"key":"1410_CR64","doi-asserted-by":"crossref","unstructured":"Wang, X., Girshick, R., Gupta, A., He, K.: Non-local neural networks. In Proceedings of the IEEE conference on computer vision and pattern recognition, pp. 7794\u20137803 (2018)","DOI":"10.1109\/CVPR.2018.00813"},{"key":"1410_CR65","doi-asserted-by":"crossref","unstructured":"Hu, J., Shen, L., Sun, G.: Squeeze-and-excitation networks. In: Proceedings of the IEEE conference on computer vision and pattern recognition, pp. 7132\u20137141 (2018)","DOI":"10.1109\/CVPR.2018.00745"},{"key":"1410_CR66","doi-asserted-by":"crossref","unstructured":"Noh, H., Hong, S., Han, B.: Learning deconvolution network for semantic segmentation. In: Proceedings of the IEEE international conference on computer vision, pp. 1520\u20131528 (2015)","DOI":"10.1109\/ICCV.2015.178"},{"key":"1410_CR67","doi-asserted-by":"crossref","unstructured":"Shi, W., Caballero, J., Husz\u00e1r, F., Totz, J., Aitken, A.P., Bishop, R., Rueckert, D., Wang, Z.: Real-time single image and video super-resolution using an efficient sub-pixel convolutional neural network. In: Proceedings of the IEEE conference on computer vision and pattern recognition, pp. 1874\u20131883 (2016)","DOI":"10.1109\/CVPR.2016.207"},{"key":"1410_CR68","doi-asserted-by":"crossref","unstructured":"Wang, J., Chen, K., Xu, R., Liu, Z., Loy, C.C., Lin, D.: Carafe: Content-aware reassembly of features. In: Proceedings of the IEEE\/CVF international conference on computer vision, pp. 3007\u20133016 (2019)","DOI":"10.1109\/ICCV.2019.00310"},{"key":"1410_CR69","unstructured":"Chang, D.: CDNet is all you need: Cascade DCN based underwater object detection RCNN. arXiv preprint arXiv:2111.12982 (2021)"}],"container-title":["Multimedia Systems"],"original-title":[],"language":"en","link":[{"URL":"https:\/\/link.springer.com\/content\/pdf\/10.1007\/s00530-024-01410-z.pdf","content-type":"application\/pdf","content-version":"vor","intended-application":"text-mining"},{"URL":"https:\/\/link.springer.com\/article\/10.1007\/s00530-024-01410-z\/fulltext.html","content-type":"text\/html","content-version":"vor","intended-application":"text-mining"},{"URL":"https:\/\/link.springer.com\/content\/pdf\/10.1007\/s00530-024-01410-z.pdf","content-type":"application\/pdf","content-version":"vor","intended-application":"similarity-checking"}],"deposited":{"date-parts":[[2024,11,24]],"date-time":"2024-11-24T08:01:39Z","timestamp":1732435299000},"score":1,"resource":{"primary":{"URL":"https:\/\/link.springer.com\/10.1007\/s00530-024-01410-z"}},"subtitle":[],"short-title":[],"issued":{"date-parts":[[2024,7,17]]},"references-count":69,"journal-issue":{"issue":"4","published-print":{"date-parts":[[2024,8]]}},"alternative-id":["1410"],"URL":"https:\/\/doi.org\/10.1007\/s00530-024-01410-z","relation":{},"ISSN":["0942-4962","1432-1882"],"issn-type":[{"value":"0942-4962","type":"print"},{"value":"1432-1882","type":"electronic"}],"subject":[],"published":{"date-parts":[[2024,7,17]]},"assertion":[{"value":"23 January 2024","order":1,"name":"received","label":"Received","group":{"name":"ArticleHistory","label":"Article History"}},{"value":"8 July 2024","order":2,"name":"accepted","label":"Accepted","group":{"name":"ArticleHistory","label":"Article History"}},{"value":"17 July 2024","order":3,"name":"first_online","label":"First Online","group":{"name":"ArticleHistory","label":"Article History"}},{"order":1,"name":"Ethics","group":{"name":"EthicsHeading","label":"Declarations"}},{"value":"The authors declare no conflicts of interest.","order":2,"name":"Ethics","group":{"name":"EthicsHeading","label":"Conflict of interest"}}],"article-number":"208"}}