{"status":"ok","message-type":"work","message-version":"1.0.0","message":{"indexed":{"date-parts":[[2026,3,5]],"date-time":"2026-03-05T22:39:39Z","timestamp":1772750379277,"version":"3.50.1"},"reference-count":48,"publisher":"Springer Science and Business Media LLC","issue":"1","license":[{"start":{"date-parts":[[2022,9,15]],"date-time":"2022-09-15T00:00:00Z","timestamp":1663200000000},"content-version":"tdm","delay-in-days":0,"URL":"https:\/\/www.springernature.com\/gp\/researchers\/text-and-data-mining"},{"start":{"date-parts":[[2022,9,15]],"date-time":"2022-09-15T00:00:00Z","timestamp":1663200000000},"content-version":"vor","delay-in-days":0,"URL":"https:\/\/www.springernature.com\/gp\/researchers\/text-and-data-mining"}],"funder":[{"DOI":"10.13039\/501100001809","name":"National Natural Science Foundation of China","doi-asserted-by":"publisher","award":["61971078"],"award-info":[{"award-number":["61971078"]}],"id":[{"id":"10.13039\/501100001809","id-type":"DOI","asserted-by":"publisher"}]},{"DOI":"10.13039\/501100001809","name":"National Natural Science Foundation of China","doi-asserted-by":"publisher","award":["61501070"],"award-info":[{"award-number":["61501070"]}],"id":[{"id":"10.13039\/501100001809","id-type":"DOI","asserted-by":"publisher"}]},{"DOI":"10.13039\/501100007957","name":"Chongqing Municipal Education Commission","doi-asserted-by":"publisher","award":["CYS21478"],"award-info":[{"award-number":["CYS21478"]}],"id":[{"id":"10.13039\/501100007957","id-type":"DOI","asserted-by":"publisher"}]}],"content-domain":{"domain":["link.springer.com"],"crossmark-restriction":false},"short-container-title":["Multimedia Systems"],"published-print":{"date-parts":[[2023,2]]},"DOI":"10.1007\/s00530-022-00995-7","type":"journal-article","created":{"date-parts":[[2022,9,15]],"date-time":"2022-09-15T03:30:25Z","timestamp":1663212625000},"page":"323-332","update-policy":"https:\/\/doi.org\/10.1007\/springer_crossmark_policy","source":"Crossref","is-referenced-by-count":8,"title":["Development of outdoor swimmers detection system with small object detection method based on deep learning"],"prefix":"10.1007","volume":"29","author":[{"given":"Hanguang","family":"Xiao","sequence":"first","affiliation":[]},{"ORCID":"https:\/\/orcid.org\/0000-0001-5192-6717","authenticated-orcid":false,"given":"Yuewei","family":"Li","sequence":"additional","affiliation":[]},{"given":"Yu","family":"Xiu","sequence":"additional","affiliation":[]},{"given":"Qingling","family":"Xia","sequence":"additional","affiliation":[]}],"member":"297","published-online":{"date-parts":[[2022,9,15]]},"reference":[{"key":"995_CR1","doi-asserted-by":"publisher","unstructured":"Chatterjee, R., Chatterjee, A., Islam, S., Khan, M.K.: An object detection-based few-shot learning approach for multimedia quality assessment. Multimed. Syst. 1\u201314 (2022). https:\/\/doi.org\/10.1007\/s00530-021-00881-8. Accessed 29 Jan 2022","DOI":"10.1007\/s00530-021-00881-8"},{"issue":"6","key":"995_CR2","doi-asserted-by":"publisher","first-page":"2523","DOI":"10.1007\/s42835-019-00255-1","volume":"14","author":"SD Chua","year":"2019","unstructured":"Chua, S.D., Lim, S., Lai, S., Chang, T.: Development of a child detection system with artificial intelligence using object detection method. J. Electr. Eng. Technol. 14(6), 2523\u20132529 (2019)","journal-title":"J. Electr. Eng. Technol."},{"key":"995_CR3","unstructured":"Zou, Z., Shi, Z., Guo, Y., Ye J.: Object detection in 20 years: a survey. (2019). arXiv preprint arXiv:1905.05055"},{"issue":"4","key":"995_CR4","first-page":"4186","volume":"6","author":"A Vahab","year":"2019","unstructured":"Vahab, A., Naik, M.S., Raikar, P.G.: Applications of object detection system. Int. Res. J. Eng. Technol. 6(4), 4186\u20134192 (2019)","journal-title":"Int. Res. J. Eng. Technol."},{"key":"995_CR5","doi-asserted-by":"crossref","unstructured":"Pranav, M V., Shreyas Madhav, A V., Meena, J.: DeepRecog: threefold underwater image deblurring and object recognition framework for AUV vision systems. Multimed. Syst. 28(2), 583\u2013593 (2021)","DOI":"10.1007\/s00530-021-00851-0"},{"key":"995_CR6","doi-asserted-by":"crossref","unstructured":"Heo, S., Cho, S., Kim, Y.: Real-time object detection system with multi-path neural networks. In: 2020 IEEE Real-Time and Embedded Technology and Applications Symposium (RTAS), pp. 174\u2013187 (2020)","DOI":"10.1109\/RTAS48715.2020.000-8"},{"key":"995_CR7","doi-asserted-by":"publisher","first-page":"114602","DOI":"10.1016\/j.eswa.2021.114602","volume":"172","author":"Y Liu","year":"2021","unstructured":"Liu, Y., Sun, P., Wergeles, N.: A survey and performance evaluation of deep learning methods for small object detection. Expert Syst. Appl. 172, 114602 (2021)","journal-title":"Expert Syst. Appl."},{"issue":"2","key":"995_CR8","doi-asserted-by":"publisher","first-page":"137","DOI":"10.1023\/B:VISI.0000013087.49260.fb","volume":"57","author":"P Viola","year":"2004","unstructured":"Viola, P., Jones, M.J.: Robust real-time face detection. Int. J. Comput. Vis. 57(2), 137\u2013154 (2004)","journal-title":"Int. J. Comput. Vis."},{"key":"995_CR9","doi-asserted-by":"crossref","unstructured":"Dalal, N., Triggs, B.: Histograms of oriented gradients for human detection. In: 2005 IEEE computer society conference on computer vision and pattern recognition (CVPR\u201905), pp. 886\u2013893 (2005)","DOI":"10.1109\/CVPR.2005.177"},{"issue":"5","key":"995_CR10","doi-asserted-by":"publisher","first-page":"694","DOI":"10.1109\/TPAMI.2006.104","volume":"28","author":"Z Sun","year":"2006","unstructured":"Sun, Z., Bebis, G., Miller, R.: On-road vehicle detection: a review. IEEE Trans. Pattern Anal. Mach. Intell. 28(5), 694\u2013711 (2006)","journal-title":"IEEE Trans. Pattern Anal. Mach. Intell."},{"key":"995_CR11","unstructured":"Eng, H.-L., Wang, J., Kam, A. H., Yau, W.-Y.: Novel region-based modeling for human detection within highly dynamic aquatic environment. In: Proceedings of the 2004 IEEE Computer Society Conference on Computer Vision and Pattern Recognition (CVPR\u2019 04), p. II (2004)"},{"issue":"6","key":"995_CR12","doi-asserted-by":"publisher","first-page":"1583","DOI":"10.1109\/TIP.2006.871119","volume":"15","author":"H-L Eng","year":"2006","unstructured":"Eng, H.-L., Wang, J., Wah, A.S., Yau, W.-Y.: Robust human detection within a highly dynamic aquatic environment in real time. IEEE Trans. Image Process. 15(6), 1583\u20131600 (2006)","journal-title":"IEEE Trans. Image Process."},{"key":"#cr-split#-995_CR13.1","doi-asserted-by":"crossref","unstructured":"Zecha, D., Greif, T., Lienhart, R.: Swimmer detection and pose estimation for continuous stroke-rate determination. In: Multimedia on Mobile Devices 2012","DOI":"10.1117\/12.908309"},{"key":"#cr-split#-995_CR13.2","unstructured":"and Multimedia Content Access: Algorithms and Systems VI, p. 830410 (2012)"},{"issue":"2","key":"995_CR14","doi-asserted-by":"publisher","first-page":"196","DOI":"10.1109\/TCSVT.2007.913960","volume":"18","author":"H-L Eng","year":"2008","unstructured":"Eng, H.-L., Toh, K.-A., Yau, W.-Y., Wang, J.: DEWS: a live visual surveillance system for early drowning detection at pool. IEEE Trans. Circuits Syst. Video Technol. 18(2), 196\u2013210 (2008)","journal-title":"IEEE Trans. Circuits Syst. Video Technol."},{"issue":"1","key":"995_CR15","doi-asserted-by":"publisher","first-page":"75","DOI":"10.1007\/s00138-012-0419-3","volume":"24","author":"KL Chan","year":"2013","unstructured":"Chan, K.L.: Detection of swimmer using dense optical flow motion map and intensity information. Mach. Vis. Appl. 24(1), 75\u2013101 (2013)","journal-title":"Mach. Vis. Appl."},{"issue":"12","key":"995_CR16","first-page":"79","volume":"22","author":"D Hong","year":"2017","unstructured":"Hong, D., Kim, Y.: Efficient swimmer detection algorithm using CNN-based SVM. J. Korean Inf. Sci. Soc. 22(12), 79\u201385 (2017)","journal-title":"J. Korean Inf. Sci. Soc."},{"key":"995_CR17","doi-asserted-by":"publisher","first-page":"103910","DOI":"10.1016\/j.imavis.2020.103910","volume":"97","author":"K Tong","year":"2020","unstructured":"Tong, K., Wu, Y., Zhou, F.: Recent advances in small object detection based on deep learning: a review. Image Vis. Comput. 97, 103910 (2020)","journal-title":"Image Vis. Comput."},{"key":"995_CR18","doi-asserted-by":"publisher","first-page":"53040","DOI":"10.1109\/ACCESS.2019.2912200","volume":"7","author":"A Shrestha","year":"2019","unstructured":"Shrestha, A., Mahmood, A.: Review of deep learning algorithms and architectures. IEEE Access 7, 53040\u201353065 (2019)","journal-title":"IEEE Access"},{"key":"995_CR19","unstructured":"Shrivastava, A., Sukthankar, R., Malik, J., Gupta, A.: Beyond skip connections: top-down modulation for object detection. (2016). arXiv preprint arXiv:06851"},{"key":"995_CR20","doi-asserted-by":"crossref","unstructured":"Bell, S., Zitnick, C. L., Bala, K., Girshick, R.: Inside\u2013outside net: detecting objects in context with skip pooling and recurrent neural network. In: Proceedings of the IEEE Conference on Computer Vision and Pattern Recognition, pp. 2874\u20132883 (2016)","DOI":"10.1109\/CVPR.2016.314"},{"key":"995_CR21","doi-asserted-by":"crossref","unstructured":"Lin, T.-Y., Doll\u00e1r, P., Girshick, R., He, K., Hariharan, B., Belongie, S.: Feature pyramid networks for object detection. In: Proceedings of the IEEE Conference on Computer Vision and Pattern Recognition, pp. 2117\u20132125 (2017)","DOI":"10.1109\/CVPR.2017.106"},{"key":"995_CR22","unstructured":"Dai, J., Li, Y., He, K., Sun, J.: R-fcn: object detection via region-based fully convolutional networks. (2016). arXiv preprint arXiv:06409"},{"key":"995_CR23","doi-asserted-by":"crossref","unstructured":"He, K., Gkioxari, G., Doll\u00e1r, P., Girshick, R.: Mask r-cnn. In: Proceedings of the Ieee International Conference on Computer Vision, pp. 2961\u20132969 (2017)","DOI":"10.1109\/ICCV.2017.322"},{"issue":"7","key":"995_CR24","doi-asserted-by":"publisher","first-page":"1476","DOI":"10.1109\/TPAMI.2016.2601099","volume":"39","author":"S Ren","year":"2016","unstructured":"Ren, S., He, K., Girshick, R., Zhang, X., Sun, J.: Object detection networks on convolutional feature maps. IEEE Trans. Pattern Anal. Mach. Intell. 39(7), 1476\u20131481 (2016)","journal-title":"IEEE Trans. Pattern Anal. Mach. Intell."},{"key":"995_CR25","unstructured":"Ren, S., He, K., Girshick, R., Sun, J.: Faster r-cnn: towards real-time object detection with region proposal networks. (2015). arXiv preprint arXiv:01497"},{"key":"995_CR26","doi-asserted-by":"crossref","unstructured":"Yang, F., Choi, W., Lin, Y.: Exploit all the layers: fast and accurate cnn object detector with scale dependent pooling and cascaded rejection classifiers. In: Proceedings of the IEEE Conference on Computer Vision and Pattern Recognition, pp. 2129\u20132137 (2016)","DOI":"10.1109\/CVPR.2016.234"},{"issue":"19","key":"995_CR27","doi-asserted-by":"publisher","first-page":"6391","DOI":"10.3390\/s21196391","volume":"21","author":"H Deng","year":"2021","unstructured":"Deng, H., Ergu, D., Liu, F., Ma, B., Cai, Y.: An embeddable algorithm for automatic garbage detection based on complex marine environment. Sensors 21(19), 6391 (2021)","journal-title":"Sensors"},{"key":"995_CR28","unstructured":"Li, X., Shang, M., Qin, H., Chen, L.: Fast accurate fish detection and recognition of underwater images with fast r-cnn. In: OCEANS 2015-MTS\/IEEE Washington, pp. 1\u20135 (2015)"},{"key":"995_CR29","doi-asserted-by":"crossref","unstructured":"Girshick, R.: Fast r-cnn. In: Proceedings of the IEEE International Conference on Computer Vision, pp. 1440\u20131448 (2015)","DOI":"10.1109\/ICCV.2015.169"},{"key":"995_CR30","doi-asserted-by":"crossref","unstructured":"Redmon, J., Farhadi, A.: YOLO9000: better, faster, stronger. In: Proceedings of the IEEE Conference on Computer Vision and Pattern Recognition, pp. 7263\u20137271 (2017)","DOI":"10.1109\/CVPR.2017.690"},{"key":"995_CR31","unstructured":"Redmon, J., Farhadi, A.: Yolov3: An incremental improvement. (2018). arXiv preprint arXiv:02767"},{"key":"995_CR32","unstructured":"Bochkovskiy, A., Wang, C.-Y., Liao, H.-Y. M.: Yolov4: optimal speed and accuracy of object detection. (2020). arXiv preprint arXiv:10934"},{"key":"995_CR33","doi-asserted-by":"crossref","unstructured":"Redmon, J., Divvala, S., Girshick, R., Farhadi, A.: You only look once: unified, real-time object detection. In: Proceedings of the IEEE Conference on Computer Vision and Pattern Recognition, pp. 779\u2013788 (2016)","DOI":"10.1109\/CVPR.2016.91"},{"key":"995_CR34","doi-asserted-by":"crossref","unstructured":"Liu, W., Anguelov, D., Erhan, D., Szegedy, C., Reed, S., Fu, C.-Y., Berg, A. C.: Ssd: single shot multibox detector. In: European Conference on Computer Vision, pp. 21\u201337 (2016)","DOI":"10.1007\/978-3-319-46448-0_2"},{"key":"995_CR35","doi-asserted-by":"crossref","unstructured":"Lin, T.-Y., Maire, M., Belongie, S., Hays, J., Perona, P., Ramanan, D., Doll\u00e1r, P., Zitnick, C.L.: Microsoft coco: common objects in context. In: European Conference on Computer Vision, pp. 740\u2013755 (2014)","DOI":"10.1007\/978-3-319-10602-1_48"},{"key":"995_CR36","doi-asserted-by":"crossref","unstructured":"He, K., Zhang, X., Ren, S., Sun, J.: Deep residual learning for image recognition. In: Proceedings of the IEEE Conference on Computer Vision and Pattern Recognition, pp. 770\u2013778 (2016)","DOI":"10.1109\/CVPR.2016.90"},{"issue":"9","key":"995_CR37","doi-asserted-by":"publisher","first-page":"1904","DOI":"10.1109\/TPAMI.2015.2389824","volume":"37","author":"K He","year":"2015","unstructured":"He, K., Zhang, X., Ren, S., Sun, J.: Spatial pyramid pooling in deep convolutional networks for visual recognition. IEEE Trans Pattern Anal Mach Intell 37(9), 1904\u20131916 (2015)","journal-title":"IEEE Trans Pattern Anal Mach Intell"},{"key":"995_CR38","doi-asserted-by":"crossref","unstructured":"Liu, S., Qi, L., Qin, H., Shi, J., Jia, J.: Path aggregation network for instance segmentation. In: Proceedings of the IEEE Conference on Computer Vision and Pattern Recognition, pp. 8759\u20138768 (2018)","DOI":"10.1109\/CVPR.2018.00913"},{"key":"995_CR39","doi-asserted-by":"publisher","unstructured":"Misra, D.: Mish: a self regularized non-monotonic neural activation function. (2019). https:\/\/doi.org\/10.48550\/arXiv.1908.08681. arXiv:1605.06409","DOI":"10.48550\/arXiv.1908.08681"},{"key":"995_CR40","doi-asserted-by":"crossref","unstructured":"Xu, J., Li, Z., Du, B.: Reluplex made more practical: leaky ReLU. In: 2020 IEEE Symposium on Computers and Communications (ISCC), pp. 1\u20137 (2020)","DOI":"10.1109\/ISCC50000.2020.9219587"},{"key":"995_CR41","doi-asserted-by":"publisher","unstructured":"Ghiasi, G., Lin, T.-Y., Le, Q. V.: Dropblock: a regularization method for convolutional networks. (2018). https:\/\/doi.org\/10.48550\/arXiv.1810.12890. arXiv:1810.12890","DOI":"10.48550\/arXiv.1810.12890"},{"issue":"1","key":"995_CR42","first-page":"1929","volume":"15","author":"N Srivastava","year":"2014","unstructured":"Srivastava, N., Hinton, G., Krizhevsky, A., Sutskever, I., Salakhutdinov, R.: Dropout: a simple way to prevent neural networks from overfitting. J. Mach. Learn. Res. 15(1), 1929\u20131958 (2014)","journal-title":"J. Mach. Learn. Res."},{"issue":"4","key":"995_CR43","first-page":"985","volume":"20","author":"J Li","year":"2017","unstructured":"Li, J., Liang, X., Shen, S., Xu, T., Feng, J., Yan, S.: Scale-aware fast R-CNN for pedestrian detection. IEEE Trans. Multimed. 20(4), 985\u2013996 (2017)","journal-title":"IEEE Trans. Multimed."},{"issue":"2","key":"995_CR44","doi-asserted-by":"publisher","first-page":"303","DOI":"10.1007\/s11263-009-0275-4","volume":"88","author":"M Everingham","year":"2010","unstructured":"Everingham, M., Van Gool, L., Williams, C.K., Winn, J., Zisserman, A.: The pascal visual object classes (voc) challenge. Int. J. Comput. Vis. 88(2), 303\u2013338 (2010)","journal-title":"Int. J. Comput. Vis."},{"key":"995_CR45","doi-asserted-by":"crossref","unstructured":"Deng, J., Dong, W., Socher, R., Li, L.-J., Li, K., Fei-Fei, L.: Imagenet: a large-scale hierarchical image database. In: 2009 IEEE Conference on Computer Vision and Pattern Recognition, pp. 248\u2013255 (2009)","DOI":"10.1109\/CVPR.2009.5206848"},{"key":"995_CR46","doi-asserted-by":"crossref","unstructured":"Yu, J., Jiang, Y., Wang, Z., Cao, Z., Huang, T.: Unitbox: an advanced object detection network. In: Proceedings of the 24th ACM International Conference on Multimedia, pp. 516\u2013520 (2016)","DOI":"10.1145\/2964284.2967274"},{"key":"995_CR47","doi-asserted-by":"crossref","unstructured":"Zheng, Z., Wang, P., Liu, W., Li, J., Ye, R., Ren, D.: Distance-IoU loss: faster and better learning for bounding box regression. In: Proceedings of the AAAI Conference on Artificial Intelligence, pp. 12993\u201313000 (2020)","DOI":"10.1609\/aaai.v34i07.6999"}],"container-title":["Multimedia Systems"],"original-title":[],"language":"en","link":[{"URL":"https:\/\/link.springer.com\/content\/pdf\/10.1007\/s00530-022-00995-7.pdf","content-type":"application\/pdf","content-version":"vor","intended-application":"text-mining"},{"URL":"https:\/\/link.springer.com\/article\/10.1007\/s00530-022-00995-7\/fulltext.html","content-type":"text\/html","content-version":"vor","intended-application":"text-mining"},{"URL":"https:\/\/link.springer.com\/content\/pdf\/10.1007\/s00530-022-00995-7.pdf","content-type":"application\/pdf","content-version":"vor","intended-application":"similarity-checking"}],"deposited":{"date-parts":[[2024,10,3]],"date-time":"2024-10-03T22:09:02Z","timestamp":1727993342000},"score":1,"resource":{"primary":{"URL":"https:\/\/link.springer.com\/10.1007\/s00530-022-00995-7"}},"subtitle":[],"short-title":[],"issued":{"date-parts":[[2022,9,15]]},"references-count":48,"journal-issue":{"issue":"1","published-print":{"date-parts":[[2023,2]]}},"alternative-id":["995"],"URL":"https:\/\/doi.org\/10.1007\/s00530-022-00995-7","relation":{},"ISSN":["0942-4962","1432-1882"],"issn-type":[{"value":"0942-4962","type":"print"},{"value":"1432-1882","type":"electronic"}],"subject":[],"published":{"date-parts":[[2022,9,15]]},"assertion":[{"value":"15 October 2021","order":1,"name":"received","label":"Received","group":{"name":"ArticleHistory","label":"Article History"}},{"value":"19 August 2022","order":2,"name":"accepted","label":"Accepted","group":{"name":"ArticleHistory","label":"Article History"}},{"value":"15 September 2022","order":3,"name":"first_online","label":"First Online","group":{"name":"ArticleHistory","label":"Article History"}}]}}