{"status":"ok","message-type":"work","message-version":"1.0.0","message":{"indexed":{"date-parts":[[2026,5,4]],"date-time":"2026-05-04T07:18:53Z","timestamp":1777879133966,"version":"3.51.4"},"reference-count":169,"publisher":"Springer Science and Business Media LLC","issue":"41","license":[{"start":{"date-parts":[[2024,3,26]],"date-time":"2024-03-26T00:00:00Z","timestamp":1711411200000},"content-version":"tdm","delay-in-days":0,"URL":"https:\/\/www.springernature.com\/gp\/researchers\/text-and-data-mining"},{"start":{"date-parts":[[2024,3,26]],"date-time":"2024-03-26T00:00:00Z","timestamp":1711411200000},"content-version":"vor","delay-in-days":0,"URL":"https:\/\/www.springernature.com\/gp\/researchers\/text-and-data-mining"}],"content-domain":{"domain":["link.springer.com"],"crossmark-restriction":false},"short-container-title":["Multimed Tools Appl"],"DOI":"10.1007\/s11042-024-18866-w","type":"journal-article","created":{"date-parts":[[2024,3,26]],"date-time":"2024-03-26T06:19:47Z","timestamp":1711433987000},"page":"88645-88680","update-policy":"https:\/\/doi.org\/10.1007\/springer_crossmark_policy","source":"Crossref","is-referenced-by-count":26,"title":["Small object detection in diverse application landscapes: a survey"],"prefix":"10.1007","volume":"83","author":[{"family":"Iqra","sequence":"first","affiliation":[]},{"ORCID":"https:\/\/orcid.org\/0000-0001-8792-5011","authenticated-orcid":false,"given":"Kaisar J.","family":"Giri","sequence":"additional","affiliation":[]},{"given":"Mohammed","family":"Javed","sequence":"additional","affiliation":[]}],"member":"297","published-online":{"date-parts":[[2024,3,26]]},"reference":[{"key":"18866_CR1","first-page":"1","volume-title":"Object detection","author":"Y Amit","year":"2020","unstructured":"Amit Y, Felzenszwalb P, Girshick R (2020) Object detection. A Reference Guide, Computer Vision, pp 1\u20139"},{"key":"18866_CR2","doi-asserted-by":"crossref","first-page":"103514","DOI":"10.1016\/j.dsp.2022.103514","volume":"126","author":"SSA Zaidi","year":"2022","unstructured":"Zaidi SSA, Ansari MS, Aslam A, Kanwal N, Asghar M, Lee B (2022) A survey of modern deep learning based object detection models. Digit Signal Process 126:103514","journal-title":"Digit Signal Process"},{"key":"18866_CR3","doi-asserted-by":"crossref","first-page":"114602","DOI":"10.1016\/j.eswa.2021.114602","volume":"172","author":"Y Liu","year":"2021","unstructured":"Liu Y, Sun P, Wergeles N, Shang Y (2021) A survey and performance evaluation of deep learning methods for small object detection. Expert Syst Appl 172:114602","journal-title":"Expert Syst Appl"},{"key":"18866_CR4","doi-asserted-by":"crossref","unstructured":"Wang Q,\u00a0Zhang L,\u00a0Bertinetto L,\u00a0Hu W, Torr PH (2019) Fast online object tracking and segmentation: a unifying approach. In: Proceedings of the IEEE\/CVF conference on computer vision and pattern recognition, pp 1328\u20131338","DOI":"10.1109\/CVPR.2019.00142"},{"issue":"6","key":"18866_CR5","doi-asserted-by":"crossref","first-page":"1","DOI":"10.1145\/3295748","volume":"51","author":"MZ Hossain","year":"2019","unstructured":"Hossain MZ, Sohel F, Shiratuddin MF, Laga H (2019) A comprehensive survey of deep learning for image captioning. ACM Comput Surv (CsUR) 51(6):1\u201336","journal-title":"ACM Comput Surv (CsUR)"},{"key":"18866_CR6","doi-asserted-by":"crossref","unstructured":"Cordts M,\u00a0Omran M,\u00a0Ramos S,\u00a0Rehfeld T,\u00a0Enzweiler M,\u00a0Benenson R,\u00a0Franke U,\u00a0Roth S,\u00a0Schiele B (2016) The cityscapes dataset for semantic urban scene understanding. In: Proceedings of the IEEE conference on computer vision and pattern recognition, pp 3213\u20133223","DOI":"10.1109\/CVPR.2016.350"},{"key":"18866_CR7","unstructured":"Gould S,\u00a0Baumstarck P,\u00a0Quigley M, Ng AY,\u00a0Koller D (2008) Integrating visual and range data for robotic object detection. In: Workshop on multi-camera and multi-modal sensor fusion algorithms and applications-M2SFA2, 2008"},{"key":"18866_CR8","unstructured":"Zhu P,\u00a0Wen L,\u00a0Du D,\u00a0Bian X,\u00a0Ling H,\u00a0Hu Q,\u00a0Nie Q,\u00a0Cheng H,\u00a0Liu C,\u00a0Liu X et\u00a0al (2018) Visdrone-det2018: the vision meets drone object detection in image challenge results. In: Proceedings of the european conference on computer vision (ECCV) workshops, pp 0\u20130"},{"issue":"6","key":"18866_CR9","doi-asserted-by":"crossref","first-page":"1747","DOI":"10.1016\/j.cja.2020.02.024","volume":"33","author":"L Yundong","year":"2020","unstructured":"Yundong L, Han D, Hongguang L, Zhang X, Zhang B, Zhifeng X (2020) Multi-block ssd based on small object detection for uav railway scene surveillance. Chin J Aeronaut 33(6):1747\u20131755","journal-title":"Chin J Aeronaut"},{"key":"18866_CR10","doi-asserted-by":"crossref","first-page":"103910","DOI":"10.1016\/j.imavis.2020.103910","volume":"97","author":"K Tong","year":"2020","unstructured":"Tong K, Wu Y, Zhou F (2020) Recent advances in small object detection based on deep learning: a review. Image Vis Comput 97:103910","journal-title":"Image Vis Comput"},{"key":"18866_CR11","doi-asserted-by":"crossref","unstructured":"Cheng G,\u00a0Yuan X,\u00a0Yao X,\u00a0Yan K,\u00a0Zeng Q,\u00a0Xie X,\u00a0Han J (2023) Towards large-scale small object detection: Survey and benchmarks. IEEE Trans Pattern Anal Mach Intell","DOI":"10.1109\/TPAMI.2023.3290594"},{"key":"18866_CR12","doi-asserted-by":"crossref","unstructured":"Lin T-Y,\u00a0Maire M,\u00a0Belongie S,\u00a0Hays J,\u00a0Perona P,\u00a0Ramanan D,\u00a0Doll\u00e1r P, Zitnick CL (2014) Microsoft coco: common objects in context. In: Computer Vision\u2013ECCV 2014: 13th European Conference, Zurich, Switzerland, September 6-12, 2014, Proceedings, Part V 13. Springer, pp 740\u2013755","DOI":"10.1007\/978-3-319-10602-1_48"},{"key":"18866_CR13","doi-asserted-by":"crossref","unstructured":"Lee J,\u00a0Bang J, Yang S-I (2017) Object detection with sliding window in images including multiple similar objects. In: 2017 international conference on information and communication technology convergence (ICTC). IEEE, pp 803\u2013806","DOI":"10.1109\/ICTC.2017.8190786"},{"key":"18866_CR14","unstructured":"Hashemi NS, Aghdam RB, Ghiasi ASB,\u00a0Fatemi P (2016) Template matching advances and applications in image analysis. arXiv:1610.07231"},{"key":"18866_CR15","doi-asserted-by":"crossref","unstructured":"Choi C, Christensen HI (2012) 3d textureless object detection and tracking: an edge-based approach. In: 2012 IEEE\/RSJ International conference on intelligent robots and systems. IEEE, pp 3877\u20133884","DOI":"10.1109\/IROS.2012.6386065"},{"key":"18866_CR16","doi-asserted-by":"publisher","unstructured":"Jeelani Z,\u00a0Qadir F (2022) Cellular automata-based approach for salt-and-pepper noise filtration. J King Saud University - Comp Inf Sci 34(2):365\u2013374. https:\/\/doi.org\/10.1016\/j.jksuci.2018.12.006","DOI":"10.1016\/j.jksuci.2018.12.006"},{"key":"18866_CR17","doi-asserted-by":"publisher","unstructured":"Jeelani Z,\u00a0Gani G,\u00a0Qadir F (2023) Linear cellular automata-based impulse noise identification and filtration of degraded images. SIViP 17(6):2679\u20132687. https:\/\/doi.org\/10.1007\/s11760-023-02484-4","DOI":"10.1007\/s11760-023-02484-4"},{"key":"18866_CR18","doi-asserted-by":"crossref","unstructured":"Papageorgiou CP,\u00a0Oren M,\u00a0Poggio T (1998) A general framework for object detection. In: Sixth international conference on computer vision (IEEE Cat. No. 98CH36271). IEEE, pp 555\u2013562","DOI":"10.1109\/ICCV.1998.710772"},{"key":"18866_CR19","doi-asserted-by":"crossref","unstructured":"Dalal N,\u00a0Triggs B (2005) Histograms of oriented gradients for human detection. In: 2005 IEEE computer society conference on computer vision and pattern recognition (CVPR\u201905), vol\u00a01. Ieee, pp 886\u2013893","DOI":"10.1109\/CVPR.2005.177"},{"issue":"8","key":"18866_CR20","doi-asserted-by":"crossref","first-page":"573","DOI":"10.1016\/j.imavis.2012.06.004","volume":"30","author":"P Piccinini","year":"2012","unstructured":"Piccinini P, Prati A, Cucchiara R (2012) Real-time object detection and localization with sift-based clustering. Image Vis Comput 30(8):573\u2013587","journal-title":"Image Vis Comput"},{"key":"18866_CR21","doi-asserted-by":"publisher","unstructured":"Viola P,\u00a0Jones M (2001) Rapid object detection using a boosted cascade of simple features. In: Proceedings of the 2001 IEEE computer society conference on computer vision and pattern recognition. CVPR. IEEE Comput Soc. https:\/\/doi.org\/10.1109\/cvpr.2001.990517","DOI":"10.1109\/cvpr.2001.990517"},{"key":"18866_CR22","doi-asserted-by":"crossref","unstructured":"Malisiewicz T,\u00a0Gupta A, Efros AA (2011) Ensemble of exemplar-svms for object detection and beyond. In: 2011 International conference on computer vision. IEEE, pp 89\u201396","DOI":"10.1109\/ICCV.2011.6126229"},{"issue":"6","key":"18866_CR23","doi-asserted-by":"crossref","first-page":"1243","DOI":"10.1109\/TPAMI.2015.2474388","volume":"38","author":"S Paisitkriangkrai","year":"2015","unstructured":"Paisitkriangkrai S, Shen C, van den Hengel A (2015) Pedestrian detection with spatially pooled features and structured ensemble learning. IEEE Trans Pattern Anal Mach Intell 38(6):1243\u20131257","journal-title":"IEEE Trans Pattern Anal Mach Intell"},{"key":"18866_CR24","doi-asserted-by":"crossref","unstructured":"Rashid Y, Bhat JI (2023) Topological to deep learning era for identifying influencers in online social networks: a systematic review. Multimed Tools Appl 1\u201344","DOI":"10.1007\/s11042-023-16002-8"},{"issue":"25","key":"18866_CR25","doi-asserted-by":"crossref","first-page":"1857","DOI":"10.17485\/IJST\/v16i25.841","volume":"16","author":"Y Rashid","year":"2023","unstructured":"Rashid Y, Iqbal Bhat J (2023) Unlocking the power of social networks with community detection techniques for isolated and overlapped communities: a review. Indian J Sci Technol 16(25):1857\u20131871","journal-title":"Indian J Sci Technol"},{"key":"18866_CR26","doi-asserted-by":"publisher","unstructured":"Redmon J,\u00a0Divvala S,\u00a0Girshick R,\u00a0Farhadi A (2016) You only look once: unified, real-time object detection. In: 2016 IEEE conference on computer vision and pattern recognition (CVPR). IEEE. [Online]. Available: https:\/\/doi.org\/10.1109\/cvpr.2016.91","DOI":"10.1109\/cvpr.2016.91"},{"issue":"10","key":"18866_CR27","doi-asserted-by":"crossref","first-page":"2323","DOI":"10.3390\/electronics12102323","volume":"12","author":"H Lou","year":"2023","unstructured":"Lou H, Duan X, Guo J, Liu H, Gu J, Bi L, Chen H (2023) Dc-yolov8: small-size object detection algorithm based on camera sensor. Electronics 12(10):2323","journal-title":"Electronics"},{"key":"18866_CR28","doi-asserted-by":"publisher","unstructured":"Girshick R (2015) Fast r-CNN. In: 2015 IEEE international conference on computer vision (ICCV). IEEE. https:\/\/doi.org\/10.1109\/iccv.2015.169","DOI":"10.1109\/iccv.2015.169"},{"issue":"2","key":"18866_CR29","doi-asserted-by":"crossref","first-page":"1425","DOI":"10.1007\/s42835-021-00960-w","volume":"17","author":"J Meng","year":"2022","unstructured":"Meng J, Jiang P, Wang J, Wang K (2022) A mobilenet-ssd model with fpn for waste detection. J Electr Engineer Technol 17(2):1425\u20131431","journal-title":"J Electr Engineer Technol"},{"key":"18866_CR30","doi-asserted-by":"crossref","first-page":"107929","DOI":"10.1016\/j.patcog.2021.107929","volume":"116","author":"B Bosquet","year":"2021","unstructured":"Bosquet B, Mucientes M, Brea VM (2021) Stdnet-st: spatio-temporal convnet for small object detection. Pattern Recog 116:107929","journal-title":"Pattern Recog"},{"key":"18866_CR31","doi-asserted-by":"crossref","unstructured":"Bai Y,\u00a0Zhang Y,\u00a0Ding M,\u00a0Ghanem B (2018) Sod-mtgan: small object detection via multi-task generative adversarial network. In: Proceedings of the European conference on computer vision (ECCV), pp 206\u2013221","DOI":"10.1007\/978-3-030-01261-8_13"},{"key":"18866_CR32","doi-asserted-by":"crossref","unstructured":"Xu X,\u00a0Zhang H,\u00a0Ma Y,\u00a0Liu K,\u00a0Bao H,\u00a0Qian X (2023) Transdet: toward effective transfer learning for small-object detection. Remote Sens 15(14)3525","DOI":"10.3390\/rs15143525"},{"key":"18866_CR33","unstructured":"Tang Y-P, Wei X-S,\u00a0Zhao B, Huang S-J (2021) Qbox: partial transfer learning with active querying for object detection. IEEE transactions on neural networks and learning systems"},{"key":"18866_CR34","doi-asserted-by":"crossref","unstructured":"Carion N,\u00a0Massa F,\u00a0Synnaeve G,\u00a0Usunier N,\u00a0Kirillov A,\u00a0Zagoruyko S (2020) End-to-end object detection with transformers. In: European conference on computer vision. Springer, pp 213\u2013229","DOI":"10.1007\/978-3-030-58452-8_13"},{"key":"18866_CR35","unstructured":"Dosovitskiy A,\u00a0Beyer L,\u00a0Kolesnikov A,\u00a0Weissenborn D,\u00a0Zhai X,\u00a0Unterthiner T,\u00a0Dehghani M,\u00a0Minderer M,\u00a0Heigold G,\u00a0Gelly S et\u00a0al (2020) An image is worth 16x16 words: transformers for image recognition at scale. arXiv:2010.11929"},{"issue":"12","key":"18866_CR36","doi-asserted-by":"crossref","first-page":"2861","DOI":"10.3390\/rs14122861","volume":"14","author":"H Gong","year":"2022","unstructured":"Gong H, Mu T, Li Q, Dai H, Li C, He Z, Wang W, Han F, Tuniyazi A, Li H et al (2022) Swin-transformer-enabled yolov5 with attention mechanism for small object detection on satellite images. Remote Sens 14(12):2861","journal-title":"Remote Sens"},{"issue":"2","key":"18866_CR37","doi-asserted-by":"crossref","first-page":"936","DOI":"10.1109\/TSMC.2020.3005231","volume":"52","author":"G Chen","year":"2020","unstructured":"Chen G, Wang H, Chen K, Li Z, Song Z, Liu Y, Chen W, Knoll A (2020) A survey of the four pillars for small object detection: multiscale representation, contextual information, super-resolution, and region proposal. IEEE Trans Syst Man Cybern Syst 52(2):936\u2013953","journal-title":"IEEE Trans Syst Man Cybern Syst"},{"issue":"1","key":"18866_CR38","first-page":"615","volume":"25","author":"S Mushtaq","year":"2024","unstructured":"Mushtaq S, Singh O (2024) Convolution neural networks for disease prediction: applications and challenges. Scalable Comput: Pract Experience 25(1):615\u2013636","journal-title":"Scalable Comput: Pract Experience"},{"key":"18866_CR39","doi-asserted-by":"crossref","unstructured":"Tan K,\u00a0Ding S,\u00a0Wu S,\u00a0Tian K,\u00a0Ren J et\u00a0al (2023) A small object detection network based on multiple feature enhancement and feature fusion. Sci Program 2023","DOI":"10.1155\/2023\/5500078"},{"key":"18866_CR40","doi-asserted-by":"crossref","unstructured":"Modegi T (2008) Small object recognition techniques based on structured template matching for high-resolution satellite images. In: 2008 SICE Annual Conference. IEEE, pp 2168\u20132173","DOI":"10.1109\/SICE.2008.4655022"},{"key":"18866_CR41","doi-asserted-by":"crossref","unstructured":"Nagaraj S,\u00a0Muthiyan B,\u00a0Ravi S,\u00a0Menezes V,\u00a0Kapoor K,\u00a0Jeon H (2017) Edge-based street object detection. In: 2017 IEEE SmartWorld, Ubiquitous Intelligence & Computing, Advanced & Trusted Computed, Scalable Computing & Communications, Cloud & Big Data Computing, Internet of People and Smart City Innovation (SmartWorld\/SCALCOM\/UIC\/ATC\/CBDCom\/IOP\/SCI). IEEE, pp 1\u20134","DOI":"10.1109\/UIC-ATC.2017.8397675"},{"key":"18866_CR42","doi-asserted-by":"crossref","unstructured":"Arunmozhi A,\u00a0Park J (2018) Comparison of hog, lbp and haar-like features for on-road vehicle detection. In: 2018 IEEE international conference on Electro\/Information Technology (EIT). IEEE, pp 0362\u20130367","DOI":"10.1109\/EIT.2018.8500159"},{"issue":"5","key":"18866_CR43","doi-asserted-by":"crossref","first-page":"813","DOI":"10.3390\/app8050813","volume":"8","author":"Y Ren","year":"2018","unstructured":"Ren Y, Zhu C, Xiao S (2018) Small object detection in optical remote sensing images via modified faster r-cnn. Appl Sci 8(5):813","journal-title":"Appl Sci"},{"key":"18866_CR44","doi-asserted-by":"crossref","unstructured":"Kisantal M,\u00a0Wojna Z,\u00a0Murawski J,\u00a0Naruniec J,\u00a0Cho K (2019) Augmentation for small object detection. arXiv:1902.07296","DOI":"10.5121\/csit.2019.91713"},{"key":"18866_CR45","doi-asserted-by":"crossref","unstructured":"Lim J-S,\u00a0Astrid M, Yoon H-J, Lee S-I (2021) Small object detection using context and attention. In: 2021 International conference on artificial intelligence in information and communication (ICAIIC). IEEE, pp 181\u2013186","DOI":"10.1109\/ICAIIC51459.2021.9415217"},{"key":"18866_CR46","doi-asserted-by":"crossref","first-page":"364","DOI":"10.1109\/TIP.2022.3228497","volume":"32","author":"X Wu","year":"2022","unstructured":"Wu X, Hong D, Chanussot J (2022) Uiu-net: U-net in u-net for infrared small object detection. IEEE transactions on image processing 32:364\u2013376","journal-title":"IEEE transactions on image processing"},{"key":"18866_CR47","doi-asserted-by":"crossref","first-page":"115","DOI":"10.1016\/j.patrec.2023.03.009","volume":"168","author":"B Mahaur","year":"2023","unstructured":"Mahaur B, Mishra K (2023) Small-object detection based on yolov5 in autonomous driving systems. Pattern Recogn Lett 168:115\u2013122","journal-title":"Pattern Recogn Lett"},{"issue":"3","key":"18866_CR48","doi-asserted-by":"crossref","first-page":"339","DOI":"10.3390\/rs11030339","volume":"11","author":"C Chen","year":"2019","unstructured":"Chen C, Gong W, Chen Y, Li W (2019) Object detection in remote sensing images based on a scene-contextual feature pyramid network. Remote Sens 11(3):339","journal-title":"Remote Sens"},{"key":"18866_CR49","doi-asserted-by":"crossref","first-page":"287","DOI":"10.1016\/j.neucom.2020.12.093","volume":"433","author":"J Leng","year":"2021","unstructured":"Leng J, Ren Y, Jiang W, Sun X, Wang Y (2021) Realize your surroundings: exploiting context information for small object detection. Neurocomputing 433:287\u2013299","journal-title":"Neurocomputing"},{"key":"18866_CR50","doi-asserted-by":"crossref","unstructured":"Hamdi A, Chan YK, Koo VC (2021) A new image enhancement and super resolution technique for license plate recognition. Heliyon 7(11)","DOI":"10.1016\/j.heliyon.2021.e08341"},{"key":"18866_CR51","doi-asserted-by":"crossref","unstructured":"Li J,\u00a0Liang X,\u00a0Wei Y,\u00a0Xu T,\u00a0Feng J,\u00a0Yan S (2017) Perceptual generative adversarial networks for small object detection. In: Proceedings of the IEEE conference on computer vision and pattern recognition, pp 1222\u20131230","DOI":"10.1109\/CVPR.2017.211"},{"key":"18866_CR52","doi-asserted-by":"crossref","unstructured":"Krishna H,\u00a0Jawahar C (2017) Improving small object detection. In: 2017 4th IAPR Asian conference on pattern recognition (ACPR). IEEE, pp 340\u2013345","DOI":"10.1109\/ACPR.2017.149"},{"key":"18866_CR53","doi-asserted-by":"crossref","unstructured":"Li C,\u00a0Zhang Y,\u00a0Gao G,\u00a0Liu Z,\u00a0Liao L (2022) Context-aware cross-level attention fusion network for infrared small target detection. J Appl Remote Sens 16(4):046\u00a0506\u2013046\u00a0506","DOI":"10.1117\/1.JRS.16.046506"},{"key":"18866_CR54","doi-asserted-by":"crossref","unstructured":"Hoiem D,\u00a0Chodpathumwan Y,\u00a0Dai Q (2012) Diagnosing error in object detectors. In: European conference on computer vision. Springer, pp 340\u2013353","DOI":"10.1007\/978-3-642-33712-3_25"},{"key":"18866_CR55","unstructured":"Huang J,\u00a0Murphy K (2015) Efficient inference in occlusion-aware generative models of images. arXiv:1511.06362"},{"key":"18866_CR56","doi-asserted-by":"crossref","unstructured":"Chen Y-T,\u00a0Liu X, Yang M-H (2015) Multi-instance object segmentation with occlusion handling. In: Proceedings of the IEEE conference on computer vision and pattern recognition, pp 3470\u20133478","DOI":"10.1109\/CVPR.2015.7298969"},{"key":"18866_CR57","doi-asserted-by":"crossref","unstructured":"Zoph B, Cubuk ED,\u00a0Ghiasi G, Lin T-Y,\u00a0Shlens J, Le QV (2020) Learning data augmentation strategies for object detection. In: Computer Vision\u2013ECCV 2020: 16th European conference, Glasgow, UK, August 23\u201328, 2020, proceedings, Part XXVII 16. Springer, pp 566\u2013583","DOI":"10.1007\/978-3-030-58583-9_34"},{"key":"18866_CR58","doi-asserted-by":"crossref","first-page":"94","DOI":"10.1016\/j.neucom.2022.11.039","volume":"520","author":"S Deepak","year":"2023","unstructured":"Deepak S, Ameer P (2023) Brain tumor categorization from imbalanced mri dataset using weighted loss and deep feature fusion. Neurocomputing 520:94\u2013102","journal-title":"Neurocomputing"},{"issue":"3","key":"18866_CR59","doi-asserted-by":"crossref","first-page":"315","DOI":"10.1007\/s10032-019-00335-y","volume":"22","author":"Z Zhong","year":"2019","unstructured":"Zhong Z, Sun L, Huo Q (2019) An anchor-free region proposal network for faster r-cnn-based text detection approaches. Int J Doc Anal Recognit (IJDAR) 22(3):315\u2013327","journal-title":"Int J Doc Anal Recognit (IJDAR)"},{"key":"18866_CR60","unstructured":"Zhang H,\u00a0Li F,\u00a0Liu S,\u00a0Zhang L,\u00a0Su H,\u00a0Zhu J, Ni LM, Shum H-Y (2022) Dino: Detr with improved denoising anchor boxes for end-to-end object detection. arXiv:2203.03605"},{"key":"18866_CR61","doi-asserted-by":"publisher","unstructured":"Doon R, Rawat TK,\u00a0Gautam S (2018) Cifar-10 classification using deep convolutional neural network. In: 2018 IEEE Punecon. IEEE. https:\/\/doi.org\/10.1109\/punecon.2018.8745428","DOI":"10.1109\/punecon.2018.8745428"},{"key":"18866_CR62","doi-asserted-by":"crossref","unstructured":"Truong T-D, Nguyen V-T, Tran M-T (2018) Lightweight deep convolutional network for tiny object recognition. In: ICPRAM, pp 675\u2013682","DOI":"10.5220\/0006752006750682"},{"key":"18866_CR63","doi-asserted-by":"publisher","unstructured":"Mogelmose A,\u00a0Liu D, Trivedi MM (2015) Detection of u.s. traffic signs. IEEE Trans Intell Transp Syst 16(6):3116\u20133125. https:\/\/doi.org\/10.1109\/tits.2015.2433019","DOI":"10.1109\/tits.2015.2433019"},{"key":"18866_CR64","doi-asserted-by":"publisher","unstructured":"Kuznetsova A,\u00a0Rom H,\u00a0Alldrin N,\u00a0Uijlings J,\u00a0Krasin I,\u00a0Pont-Tuset J,\u00a0Kamali S,\u00a0Popov S,\u00a0Malloci M,\u00a0Kolesnikov A,\u00a0Duerig T,\u00a0Ferrari V (2020) The open images dataset v4. Int J Comput Vis 128(7):1956\u20131981. https:\/\/doi.org\/10.1007\/s11263-020-01316-z","DOI":"10.1007\/s11263-020-01316-z"},{"key":"18866_CR65","doi-asserted-by":"publisher","unstructured":"Lin T-Y,\u00a0Maire M,\u00a0Belongie S,\u00a0Hays J,\u00a0Perona P,\u00a0Ramanan D,\u00a0Doll\u00e1r P, Zitnick CL (2014) Microsoft COCO: common objects in context. In: Computer vision \u2013 ECCV 2014. Springer International Publishing, pp 740\u2013755. https:\/\/doi.org\/10.1007\/978-3-319-10602-1_48","DOI":"10.1007\/978-3-319-10602-1_48"},{"key":"18866_CR66","doi-asserted-by":"publisher","unstructured":"Loh YP, Chan CS (2019) Getting to know low-light images with the exclusively dark dataset. Comp Vision Image Underst 178:30\u201342. https:\/\/doi.org\/10.1016\/j.cviu.2018.10.010","DOI":"10.1016\/j.cviu.2018.10.010"},{"key":"18866_CR67","doi-asserted-by":"publisher","unstructured":"Wang X,\u00a0Yang M,\u00a0Zhu S,\u00a0Lin Y (2013) Regionlets for generic object detection. In: 2013 IEEE international conference on computer vision. IEEE. https:\/\/doi.org\/10.1109\/iccv.2013.10","DOI":"10.1109\/iccv.2013.10"},{"key":"18866_CR68","doi-asserted-by":"publisher","unstructured":"Yu F,\u00a0Chen H,\u00a0Wang X,\u00a0Xian W,\u00a0Chen Y,\u00a0Liu F,\u00a0Madhavan V,\u00a0Darrell T (2020) BDD100k: a diverse driving dataset for heterogeneous multitask learning. In: 2020 IEEE\/CVF conference on computer vision and pattern recognition (CVPR). IEEE. https:\/\/doi.org\/10.1109\/cvpr42600.2020.00271","DOI":"10.1109\/cvpr42600.2020.00271"},{"key":"18866_CR69","doi-asserted-by":"publisher","unstructured":"Xia G-S,\u00a0Bai X,\u00a0Ding J,\u00a0Zhu Z,\u00a0Belongie S,\u00a0Luo J,\u00a0Datcu M,\u00a0Pelillo M,\u00a0Zhang L (2018) DOTA: a large-scale dataset for object detection in aerial images. In: 2018 IEEE\/CVF conference on computer vision and pattern recognition. IEEE. https:\/\/doi.org\/10.1109\/cvpr.2018.00418","DOI":"10.1109\/cvpr.2018.00418"},{"key":"18866_CR70","unstructured":"Krizhevsky A,\u00a0Hinton G (2010) Convolutional deep belief networks on cifar-10. Unpublished manuscript 40(7):1\u20139"},{"key":"18866_CR71","unstructured":"Recht B,\u00a0Roelofs R,\u00a0Schmidt L,\u00a0Shankar V (2018) Do cifar-10 classifiers generalize to cifar-10? arXiv:1806.00451"},{"key":"18866_CR72","doi-asserted-by":"crossref","unstructured":"M\u00f8gelmose A,\u00a0Liu D, Trivedi MM (2014) Traffic sign detection for us roads: remaining challenges and a case for tracking. In: 17th International IEEE conference on intelligent transportation systems (ITSC). IEEE, pp 1394\u20131399","DOI":"10.1109\/ITSC.2014.6957882"},{"issue":"4","key":"18866_CR73","doi-asserted-by":"crossref","first-page":"043008","DOI":"10.1103\/PhysRevD.75.043008","volume":"75","author":"J Crowder","year":"2007","unstructured":"Crowder J, Cornish NJ (2007) Solution to the galactic foreground problem for Lisa. Phys Rev D 75(4):043008","journal-title":"Phys Rev D"},{"key":"18866_CR74","doi-asserted-by":"crossref","unstructured":"Lin T-Y,\u00a0Maire M,\u00a0Belongie S,\u00a0Hays J,\u00a0Perona P,\u00a0Ramanan D,\u00a0Doll\u00e1r P, Zitnick CL (2014) Microsoft coco: common objects in context. In: Computer vision\u2013ECCV 2014: 13th European Conference, Zurich, Switzerland, September 6-12, 2014, proceedings, Part V 13. Springer, pp 740\u2013755","DOI":"10.1007\/978-3-319-10602-1_48"},{"key":"18866_CR75","unstructured":"Barbu A,\u00a0Mayo D,\u00a0Alverio J,\u00a0Luo W,\u00a0Wang C,\u00a0Gutfreund D,\u00a0Tenenbaum J,\u00a0Katz B (2019) Objectnet: a large-scale bias-controlled dataset for pushing the limits of object recognition models. Adv Neural Inf Process Syst 32"},{"key":"18866_CR76","doi-asserted-by":"crossref","unstructured":"Dabov K,\u00a0Foi A,\u00a0Katkovnik V,\u00a0Egiazarian K (2006) Image denoising with block-matching and 3d filtering. In: Image processing: algorithms and systems, neural networks, and machine learning, vol 6064. SPIE, pp 354\u2013365","DOI":"10.1117\/12.643267"},{"key":"18866_CR77","doi-asserted-by":"crossref","first-page":"30","DOI":"10.1016\/j.cviu.2018.10.010","volume":"178","author":"YP Loh","year":"2019","unstructured":"Loh YP, Chan CS (2019) Getting to know low-light images with the exclusively dark dataset. Comp Vision Image Underst 178:30\u201342","journal-title":"Comp Vision Image Underst"},{"key":"18866_CR78","doi-asserted-by":"crossref","unstructured":"Deng J,\u00a0Dong W,\u00a0Socher R, Li L-J,\u00a0Li K,\u00a0Fei-Fei L (2009) Imagenet: a large-scale hierarchical image database. In: 2009 IEEE conference on computer vision and pattern recognition. Ieee, pp 248\u2013255","DOI":"10.1109\/CVPR.2009.5206848"},{"key":"18866_CR79","unstructured":"Barbu A,\u00a0Mayo D,\u00a0Alverio J,\u00a0Luo W,\u00a0Wang C,\u00a0Gutfreund D,\u00a0Tenenbaum J,\u00a0Katz B (2019) Objectnet: a large-scale bias-controlled dataset for pushing the limits of object recognition models. Adv Neural Inf Process Syst 32"},{"key":"18866_CR80","doi-asserted-by":"crossref","unstructured":"Yu F,\u00a0Chen H,\u00a0Wang X,\u00a0Xian W,\u00a0Chen Y,\u00a0Liu F,\u00a0Madhavan V,\u00a0Darrell T (2020) Bdd100k: a diverse driving dataset for heterogeneous multitask learning. In: Proceedings of the IEEE\/CVF conference on computer vision and pattern recognition, pp 2636\u20132645","DOI":"10.1109\/CVPR42600.2020.00271"},{"key":"18866_CR81","doi-asserted-by":"crossref","unstructured":"Haris M,\u00a0Glowacz A (2021) Road object detection: a comparative study of deep learning-based algorithms. Electronics 10(16):1932","DOI":"10.3390\/electronics10161932"},{"key":"18866_CR82","doi-asserted-by":"crossref","unstructured":"Xia G-S,\u00a0Bai X,\u00a0Ding J,\u00a0Zhu Z,\u00a0Belongie S,\u00a0Luo J,\u00a0Datcu M,\u00a0Pelillo M,\u00a0Zhang L (2018) Dota: A large-scale dataset for object detection in aerial images. In: Proceedings of the IEEE conference on computer vision and pattern recognition, pp 3974\u20133983","DOI":"10.1109\/CVPR.2018.00418"},{"key":"18866_CR83","doi-asserted-by":"crossref","first-page":"79","DOI":"10.1016\/j.isprsjprs.2022.06.002","volume":"190","author":"C Xu","year":"2022","unstructured":"Xu C, Wang J, Yang W, Yu H, Yu L, Xia G-S (2022) Detecting tiny objects in aerial images: a normalized wasserstein distance and a new benchmark. ISPRS J Photogramm Remote Sens 190:79\u201393","journal-title":"ISPRS J Photogramm Remote Sens"},{"key":"18866_CR84","doi-asserted-by":"crossref","first-page":"79","DOI":"10.1016\/j.isprsjprs.2022.06.002","volume":"190","author":"C Xu","year":"2022","unstructured":"Xu C, Wang J, Yang W, Yu H, Yu L, Xia G-S (2022) Detecting tiny objects in aerial images: A normalized wasserstein distance and a new benchmark. ISPRS J Photogramm Remote Sens 190:79\u201393","journal-title":"ISPRS J Photogramm Remote Sens"},{"key":"18866_CR85","doi-asserted-by":"crossref","unstructured":"Yu X,\u00a0Gong Y,\u00a0Jiang N,\u00a0Ye Q,\u00a0Han Z (2020) Scale match for tiny person detection. In: Proceedings of the IEEE\/CVF winter conference on applications of computer vision, pp 1257\u20131265","DOI":"10.1109\/WACV45572.2020.9093394"},{"key":"18866_CR86","doi-asserted-by":"crossref","unstructured":"Yu X,\u00a0Han Z,\u00a0Gong Y,\u00a0Jan N,\u00a0Zhao J,\u00a0Ye Q,\u00a0Chen J,\u00a0Feng Y,\u00a0Zhang B,\u00a0Wang X et\u00a0al (2020) The 1st tiny object detection challenge: methods and results. In: Computer vision\u2013ECCV 2020 workshops: Glasgow, UK, August 23\u201328, 2020, proceedings, Part V 16. Springer, 315\u2013323","DOI":"10.1007\/978-3-030-68238-5_23"},{"issue":"7","key":"18866_CR87","doi-asserted-by":"crossref","first-page":"1956","DOI":"10.1007\/s11263-020-01316-z","volume":"128","author":"A Kuznetsova","year":"2020","unstructured":"Kuznetsova A, Rom H, Alldrin N, Uijlings J, Krasin I, Pont-Tuset J, Kamali S, Popov S, Malloci M, Kolesnikov A et al (2020) The open images dataset v4: unified image classification, object detection, and visual relationship detection at scale. Int J Comput Vis 128(7):1956\u20131981","journal-title":"Int J Comput Vis"},{"key":"18866_CR88","doi-asserted-by":"crossref","unstructured":"Du D,\u00a0Qi Y,\u00a0Yu H,\u00a0Yang Y,\u00a0Duan K,\u00a0Li G,\u00a0Zhang W,\u00a0Huang Q,\u00a0Tian Q (2018) The unmanned aerial vehicle benchmark: object detection and tracking. In: Proceedings of the European conference on computer vision (ECCV), pp 370\u2013386","DOI":"10.1007\/978-3-030-01249-6_23"},{"key":"18866_CR89","doi-asserted-by":"crossref","unstructured":"Yu W,\u00a0Yang T,\u00a0Chen C (2021) Towards resolving the challenge of long-tail distribution in uav images for object detection. In: Proceedings of the IEEE\/CVF winter conference on applications of computer vision, pp 3258\u20133267","DOI":"10.1109\/WACV48630.2021.00330"},{"key":"18866_CR90","doi-asserted-by":"crossref","unstructured":"Wang J,\u00a0Yang W,\u00a0Guo H,\u00a0Zhang R, Xia G-S (2021) Tiny object detection in aerial images. In: 2020 25th international conference on pattern recognition (ICPR). IEEE, pp 3791\u20133798","DOI":"10.1109\/ICPR48806.2021.9413340"},{"key":"18866_CR91","doi-asserted-by":"crossref","unstructured":"Du D,\u00a0Qi Y,\u00a0Yu H,\u00a0Yang Y,\u00a0Duan K,\u00a0Li G,\u00a0Zhang W,\u00a0Huang Q,\u00a0Tian Q (2018) The unmanned aerial vehicle benchmark: object detection and tracking. In: Proceedings of the European conference on computer vision (ECCV), pp 370\u2013386","DOI":"10.1007\/978-3-030-01249-6_23"},{"key":"18866_CR92","doi-asserted-by":"crossref","first-page":"296","DOI":"10.1016\/j.isprsjprs.2019.11.023","volume":"159","author":"K Li","year":"2020","unstructured":"Li K, Wan G, Cheng G, Meng L, Han J (2020) Object detection in optical remote sensing images: a survey and a new benchmark. ISPRS J Photogramm Remote Sens 159:296\u2013307","journal-title":"ISPRS J Photogramm Remote Sens"},{"key":"18866_CR93","doi-asserted-by":"crossref","unstructured":"Yang S,\u00a0Luo P, Loy C-C,\u00a0Tang X (2016) Wider face: a face detection benchmark. In: Proceedings of the IEEE conference on computer vision and pattern recognition, pp 5525\u20135533","DOI":"10.1109\/CVPR.2016.596"},{"key":"18866_CR94","doi-asserted-by":"publisher","unstructured":"Prasad S,\u00a0Li Y,\u00a0Lin D,\u00a0Sheng D (2021) maskedFaceNet: a progressive semi-supervised masked face detector. In: 2021 IEEE Winter conference on applications of computer vision (WACV). IEEE. https:\/\/doi.org\/10.1109\/wacv48630.2021.00343","DOI":"10.1109\/wacv48630.2021.00343"},{"key":"18866_CR95","doi-asserted-by":"crossref","first-page":"105585","DOI":"10.1016\/j.compag.2020.105585","volume":"175","author":"Q-J Wang","year":"2020","unstructured":"Wang Q-J, Zhang S-Y, Dong S-F, Zhang G-C, Yang J, Li R, Wang H-Q (2020) Pest24: a large-scale very small object data set of agricultural pests for multi-target detection. Comput Electron Agric 175:105585","journal-title":"Comput Electron Agric"},{"key":"18866_CR96","doi-asserted-by":"publisher","unstructured":"Liu W,\u00a0Anguelov D,\u00a0Erhan D,\u00a0Szegedy C,\u00a0Reed S, Fu C-Y, Berg AC (2016) SSD: single shot MultiBox detector. In: Computer vision \u2013 ECCV 2016. Springer International Publishing, pp 21\u201337. https:\/\/doi.org\/10.1007\/978-3-319-46448-0_2","DOI":"10.1007\/978-3-319-46448-0_2"},{"key":"18866_CR97","doi-asserted-by":"crossref","unstructured":"Cai Z,\u00a0Vasconcelos N (2018) Cascade r-cnn: Delving into high quality object detection. In: Proceedings of the IEEE conference on computer vision and pattern recognition, pp 6154\u20136162","DOI":"10.1109\/CVPR.2018.00644"},{"key":"18866_CR98","unstructured":"Farhadi A,\u00a0Redmon J (2018) Yolov3: an incremental improvement. In: Computer vision and pattern recognition, pp 1804\u201302\u00a0767"},{"key":"18866_CR99","unstructured":"Donahue J,\u00a0Jia Y,\u00a0Vinyals O,\u00a0Hoffman J,\u00a0Zhang N,\u00a0Tzeng E,\u00a0Darrell T (2014) Decaf: a deep convolutional activation feature for generic visual recognition. In: International conference on machine learning. PMLR, pp 647\u2013655"},{"key":"18866_CR100","doi-asserted-by":"crossref","unstructured":"Mathew MP, Mahesh TY (2022) Leaf-based disease detection in bell pepper plant using yolo v5. SIViP 1\u20137","DOI":"10.1007\/s11760-021-02024-y"},{"key":"18866_CR101","doi-asserted-by":"crossref","first-page":"638182","DOI":"10.3389\/fonc.2021.638182","volume":"11","author":"R Yang","year":"2021","unstructured":"Yang R, Yu Y (2021) Artificial convolutional neural network in object detection and semantic segmentation for medical imaging analysis. Front Oncol 11:638182","journal-title":"Front Oncol"},{"key":"18866_CR102","doi-asserted-by":"crossref","unstructured":"Shah SNA,\u00a0Parveen R (2023) An extensive review on lung cancer diagnosis using machine learning techniques on radiological data: state-of-the-art and perspectives. Arch Comput Meth Engineer 1\u201314","DOI":"10.1007\/s11831-023-09964-3"},{"issue":"1","key":"18866_CR103","doi-asserted-by":"crossref","first-page":"1","DOI":"10.12785\/ijcds\/140101","volume":"14","author":"S Mushtaq","year":"2023","unstructured":"Mushtaq S, Singh O (2023) Implementing image processing and deep learning techniques to analyze skin cancer images. Int J Comput Digit Syst 14(1):1\u2013xx","journal-title":"Int J Comput Digit Syst"},{"key":"18866_CR104","doi-asserted-by":"crossref","unstructured":"Sushanki S, Bhandari AK, Singh AK (2023) A review on computational methods for breast cancer detection in ultrasound images using multi-image modalities. Arch Comput Meth Engineer 1\u201320","DOI":"10.1007\/s11831-023-10015-0"},{"issue":"22","key":"18866_CR105","doi-asserted-by":"crossref","first-page":"8834","DOI":"10.3390\/s22228834","volume":"22","author":"PK Sahoo","year":"2022","unstructured":"Sahoo PK, Mishra S, Panigrahi R, Bhoi AK, Barsocchi P (2022) An improvised deep-learning-based mask r-cnn model for laryngeal cancer detection using ct images. Sensors 22(22):8834","journal-title":"Sensors"},{"key":"18866_CR106","doi-asserted-by":"crossref","unstructured":"He K,\u00a0Gkioxari G,\u00a0Doll\u00e1r P,\u00a0Girshick R (2017) Mask r-cnn. In: Proceedings of the IEEE international conference on computer vision, pp 2961\u20132969","DOI":"10.1109\/ICCV.2017.322"},{"key":"18866_CR107","doi-asserted-by":"crossref","unstructured":"Abhisheka B, Biswas SK,\u00a0Purkayastha B (2023) A comprehensive review on breast cancer detection, classification and segmentation using deep learning. Arch Comput Meth Engineer 1\u201330","DOI":"10.1007\/s11831-023-09968-z"},{"key":"18866_CR108","doi-asserted-by":"crossref","unstructured":"Khosravan N,\u00a0Bagci U (2018) S4nd: Single-shot single-scale lung nodule detection. In: Medical image computing and computer assisted intervention\u2013MICCAI 2018: 21st International Conference, Granada, Spain, September 16-20, 2018, Proceedings, Part II 11. Springer, pp 794\u2013802","DOI":"10.1007\/978-3-030-00934-2_88"},{"key":"18866_CR109","unstructured":"Van\u00a0Etten A (2018) You only look twice: rapid multi-scale object detection in satellite imagery. arXiv:1805.09512"},{"key":"18866_CR110","doi-asserted-by":"crossref","unstructured":"Nina W,\u00a0Condori W,\u00a0Machaca V,\u00a0Villegas J,\u00a0Castro E (2020) Small ship detection on optical satellite imagery with yolo and yolt. In: Advances in information and communication: proceedings of the 2020 future of information and communication conference (FICC), vol 2. Springer, pp 664\u2013677","DOI":"10.1007\/978-3-030-39442-4_49"},{"key":"18866_CR111","doi-asserted-by":"crossref","unstructured":"Wang J,\u00a0Yang W,\u00a0Guo H,\u00a0Zhang R, Xia G-S (2021) Tiny object detection in aerial images. In: 2020 25th international conference on pattern recognition (ICPR). IEEE, pp 3791\u20133798","DOI":"10.1109\/ICPR48806.2021.9413340"},{"issue":"16","key":"18866_CR112","doi-asserted-by":"crossref","first-page":"7190","DOI":"10.3390\/s23167190","volume":"23","author":"G Wang","year":"2023","unstructured":"Wang G, Chen Y, An P, Hong H, Hu J, Huang T (2023) Uav-yolov8: a small-object-detection model based on improved yolov8 for uav aerial photography scenarios. Sensors 23(16):7190","journal-title":"Sensors"},{"issue":"1","key":"18866_CR113","doi-asserted-by":"crossref","first-page":"117","DOI":"10.3390\/su16010117","volume":"16","author":"I Javid","year":"2023","unstructured":"Javid I, Ghazali R, Saeed W, Batool T, Al-Wajih E (2023) Cnn with new spatial pyramid pooling and advanced filter-based techniques: revolutionizing traffic monitoring via aerial images. Sustainability 16(1):117","journal-title":"Sustainability"},{"issue":"17","key":"18866_CR114","doi-asserted-by":"crossref","first-page":"3664","DOI":"10.3390\/electronics12173664","volume":"12","author":"X Zhai","year":"2023","unstructured":"Zhai X, Huang Z, Li T, Liu H, Wang S (2023) Yolo-drone: an optimized yolov8 network for tiny uav object detection. Electronics 12(17):3664","journal-title":"Electronics"},{"key":"18866_CR115","doi-asserted-by":"crossref","unstructured":"Sun W,\u00a0Dai L,\u00a0Zhang X,\u00a0Chang P,\u00a0He X (2021) Rsod: real-time small object detection algorithm in uav-based traffic monitoring. Appl Intell 1\u201316","DOI":"10.1007\/s10489-021-02893-3"},{"key":"18866_CR116","unstructured":"Gould S,\u00a0Baumstarck P,\u00a0Quigley M, Ng AY,\u00a0Koller D (2008) Integrating visual and range data for robotic object detection. In: Workshop on multi-camera and multi-modal sensor fusion algorithms and applications-M2SFA2 2008"},{"key":"18866_CR117","doi-asserted-by":"crossref","first-page":"103945","DOI":"10.1016\/j.robot.2021.103945","volume":"149","author":"Y Wang","year":"2022","unstructured":"Wang Y, Sun Q, Liu Z, Gu L (2022) Visual detection and tracking algorithms for minimally invasive surgical instruments: a comprehensive review of the state-of-the-art. Robot Auton Syst 149:103945","journal-title":"Robot Auton Syst"},{"issue":"2","key":"18866_CR118","doi-asserted-by":"crossref","first-page":"50","DOI":"10.1109\/MRA.2021.3066040","volume":"28","author":"M Koskinopoulou","year":"2021","unstructured":"Koskinopoulou M, Raptopoulos F, Papadopoulos G, Mavrakis N, Maniadakis M (2021) Robotic waste sorting technology: toward a vision-based categorization system for the industrial robotic separation of recyclable waste. IEEE Robot Autom Mag 28(2):50\u201360","journal-title":"IEEE Robot Autom Mag"},{"key":"18866_CR119","doi-asserted-by":"crossref","unstructured":"Farooq AS,\u00a0Zhang P (2022) A comprehensive review on the prospects of next-generation wearable electronics for individualized health monitoring, assistive robotics, and communication. Sensors Actuators A Phys 113715","DOI":"10.1016\/j.sna.2022.113715"},{"key":"18866_CR120","doi-asserted-by":"crossref","unstructured":"Kulik S,\u00a0Shtanko A (2020) Experiments with neural net object detection system yolo on small training datasets for intelligent robotics. In: Advanced technologies in robotics and intelligent systems: proceedings of ITR 2019. Springer, pp 57\u2013162","DOI":"10.1007\/978-3-030-33491-8_19"},{"issue":"15","key":"18866_CR121","doi-asserted-by":"crossref","first-page":"3296","DOI":"10.3390\/electronics12153296","volume":"12","author":"Y Liu","year":"2023","unstructured":"Liu Y, Li W, Tan L, Huang X, Zhang H, Jiang X (2023) Db-yolov5: a uav object detection model based on dual backbone network for security surveillance. Electronics 12(15):3296","journal-title":"Electronics"},{"issue":"7","key":"18866_CR122","doi-asserted-by":"crossref","first-page":"1359","DOI":"10.1109\/TIFS.2015.2408263","volume":"10","author":"K Lin","year":"2015","unstructured":"Lin K, Chen S-C, Chen C-S, Lin D-T, Hung Y-P (2015) Abandoned object detection via temporal consistency modeling and back-tracing verification for visual surveillance. IEEE Trans Inf Forensic Secur 10(7):1359\u20131370","journal-title":"IEEE Trans Inf Forensic Secur"},{"key":"18866_CR123","doi-asserted-by":"crossref","unstructured":"Xu S,\u00a0Zhang M,\u00a0Song W,\u00a0Mei H,\u00a0He Q,\u00a0Liotta A (2023) A systematic review and analysis of deep learning-based underwater object detection. Neurocomputing","DOI":"10.1016\/j.neucom.2023.01.056"},{"key":"18866_CR124","doi-asserted-by":"crossref","first-page":"246","DOI":"10.1016\/j.dsp.2015.09.020","volume":"48","author":"A Gunes","year":"2016","unstructured":"Gunes A, Guldogan MB (2016) Joint underwater target detection and tracking with the bernoulli filter using an acoustic vector sensor. Digit Signal Process 48:246\u2013258","journal-title":"Digit Signal Process"},{"key":"18866_CR125","doi-asserted-by":"crossref","first-page":"108926","DOI":"10.1016\/j.patcog.2022.108926","volume":"132","author":"L Chen","year":"2022","unstructured":"Chen L, Zhou F, Wang S, Dong J, Li N, Ma H, Wang X, Zhou H (2022) Swipenet: object detection in noisy underwater scenes. Pattern Recog 132:108926","journal-title":"Pattern Recog"},{"issue":"4","key":"18866_CR126","doi-asserted-by":"crossref","first-page":"1076","DOI":"10.3390\/rs15041076","volume":"15","author":"G Chen","year":"2023","unstructured":"Chen G, Mao Wang K, Shen J (2023) Htdet: a hybrid transformer-based approach for underwater small object detection. Remote Sens 15(4):1076","journal-title":"Remote Sens"},{"issue":"1","key":"18866_CR127","doi-asserted-by":"crossref","first-page":"1","DOI":"10.1186\/s40537-019-0197-0","volume":"6","author":"C Shorten","year":"2019","unstructured":"Shorten C, Khoshgoftaar TM (2019) A survey on image data augmentation for deep learning. J Big Data 6(1):1\u201348","journal-title":"J Big Data"},{"key":"18866_CR128","first-page":"1","volume":"70","author":"Y Cai","year":"2021","unstructured":"Cai Y, Luan T, Gao H, Wang H, Chen L, Li Y, Sotelo MA, Li Z (2021) Yolov4-5d: an effective and efficient object detector for autonomous driving. IEEE Trans Instrum Meas 70:1\u201313","journal-title":"IEEE Trans Instrum Meas"},{"key":"18866_CR129","doi-asserted-by":"crossref","unstructured":"Dipu MTA, Hossain SS,\u00a0Arafat Y, Rafiq FB (2021) Real-time driver drowsiness detection using deep learning. Int J Adv Comput Sci Appl 12(7)","DOI":"10.14569\/IJACSA.2021.0120794"},{"key":"18866_CR130","unstructured":"Malkoff DB, Oliver WR (2000) Hyperspectral imaging applied to forensic medicine. In: Spectral imaging: instrumentation, applications, and analysis 3920. SPIE, pp 108\u2013116"},{"issue":"2","key":"18866_CR131","doi-asserted-by":"crossref","first-page":"445","DOI":"10.1016\/j.ifacol.2018.03.076","volume":"51","author":"E Wetzer","year":"2018","unstructured":"Wetzer E, Lohninger H (2018) Image processing using color space models for forensic fiber detection. IFAC-PapersOnLine 51(2):445\u2013450","journal-title":"IFAC-PapersOnLine"},{"key":"18866_CR132","doi-asserted-by":"crossref","unstructured":"Turtiainen H,\u00a0Costin A,\u00a0H\u00e4m\u00e4l\u00e4inen T,\u00a0Lahtinen T,\u00a0Sintonen L (2022) Cctvcv: computer vision model\/dataset supporting cctv forensics and privacy applications. In: 2022 IEEE international conference on trust, security and privacy in computing and communications (TrustCom). IEEE, pp 1219\u20131226","DOI":"10.1109\/TrustCom56396.2022.00169"},{"key":"18866_CR133","doi-asserted-by":"crossref","unstructured":"Akyon FC, Altinuc SO,\u00a0Temizel A (2022) Slicing aided hyper inference and fine-tuning for small object detection. In: 2022 IEEE international conference on image processing (ICIP). IEEE, pp 966\u2013970","DOI":"10.1109\/ICIP46576.2022.9897990"},{"key":"18866_CR134","doi-asserted-by":"crossref","unstructured":"Wang S (2011) A review of gradient-based and edge-based feature extraction methods for object detection. In: 2011 IEEE 11th international conference on computer and information technology. IEEE, pp 277\u2013282","DOI":"10.1109\/CIT.2011.51"},{"key":"18866_CR135","doi-asserted-by":"crossref","unstructured":"Choi C, Christensen HI (2012) 3d textureless object detection and tracking: an edge-based approach. In: 2012 IEEE\/RSJ international conference on intelligent robots and systems. IEEE, pp 3877\u20133884","DOI":"10.1109\/IROS.2012.6386065"},{"key":"18866_CR136","doi-asserted-by":"crossref","first-page":"128","DOI":"10.5201\/ipol.2014.104","volume":"4","author":"Y-Q Wang","year":"2014","unstructured":"Wang Y-Q (2014) An analysis of the viola-jones face detection algorithm. Image Process Line 4:128\u2013148","journal-title":"Image Process Line"},{"issue":"4","key":"18866_CR137","doi-asserted-by":"crossref","first-page":"62","DOI":"10.21275\/v5i4.NOV162465","volume":"5","author":"MK Dabhi","year":"2016","unstructured":"Dabhi MK, Pancholi BK (2016) Face detection system based on viola-jones algorithm. Int J Sci Res (IJSR) 5(4):62\u201364","journal-title":"Int J Sci Res (IJSR)"},{"key":"18866_CR138","doi-asserted-by":"crossref","unstructured":"Ebrahimzadeh R,\u00a0Jampour M (2014) Efficient handwritten digit recognition based on histogram of oriented gradients and svm. Int J Comp Appl 104(9)","DOI":"10.5120\/18229-9167"},{"issue":"2","key":"18866_CR139","doi-asserted-by":"crossref","first-page":"322","DOI":"10.1109\/TITS.2010.2042714","volume":"11","author":"AP Psyllos","year":"2010","unstructured":"Psyllos AP, Anagnostopoulos C-NE, Kayafas E (2010) Vehicle logo recognition using a sift-based enhanced matching scheme. IEEE Trans Intell Transp Syst 11(2):322\u2013328","journal-title":"IEEE Trans Intell Transp Syst"},{"key":"18866_CR140","doi-asserted-by":"publisher","unstructured":"Felzenszwalb P,\u00a0McAllester D,\u00a0Ramanan D (2008) A discriminatively trained, multiscale, deformable part model. In: 2008 IEEE conference on computer vision and pattern recognition. IEEE. https:\/\/doi.org\/10.1109\/cvpr.2008.4587597","DOI":"10.1109\/cvpr.2008.4587597"},{"key":"18866_CR141","doi-asserted-by":"crossref","unstructured":"Uric\u00e1r M,\u00a0Franc V,\u00a0Hlav\u00e1c V (2015) Facial landmark tracking by tree-based deformable part model based detector. In: Proceedings of the IEEE international conference on computer vision workshops, pp 10\u201317","DOI":"10.1109\/ICCVW.2015.127"},{"key":"18866_CR142","doi-asserted-by":"publisher","unstructured":"Girshick R,\u00a0Donahue J,\u00a0Darrell T,\u00a0Malik J (2014) Rich feature hierarchies for accurate object detection and semantic segmentation. In: 2014 IEEE conference on computer vision and pattern recognition. IEEE. https:\/\/doi.org\/10.1109\/cvpr.2014.81","DOI":"10.1109\/cvpr.2014.81"},{"issue":"6","key":"18866_CR143","doi-asserted-by":"crossref","first-page":"631","DOI":"10.3390\/rs11060631","volume":"11","author":"S Zhang","year":"2019","unstructured":"Zhang S, Wu R, Xu K, Wang J, Sun W (2019) R-cnn-based ship detection from high resolution remote sensing imagery. Remote Sens 11(6):631","journal-title":"Remote Sens"},{"issue":"4","key":"18866_CR144","first-page":"985","volume":"20","author":"J Li","year":"2017","unstructured":"Li J, Liang X, Shen S, Xu T, Feng J, Yan S (2017) Scale-aware fast r-cnn for pedestrian detection. IEEE Trans Multimed Comput 20(4):985\u2013996","journal-title":"IEEE Trans Multimed Comput"},{"key":"18866_CR145","doi-asserted-by":"publisher","unstructured":"Ren S,\u00a0He K,\u00a0Girshick R,\u00a0Sun J (2017) Faster r-CNN: towards real-time object detection with region proposal networks. IEEE transactions on pattern analysis and machine intelligence 39(6):1137\u20131149. [Online]. Available: https:\/\/doi.org\/10.1109\/tpami.2016.2577031","DOI":"10.1109\/tpami.2016.2577031"},{"key":"18866_CR146","doi-asserted-by":"crossref","first-page":"105866","DOI":"10.1016\/j.cmpb.2020.105866","volume":"200","author":"Y Su","year":"2021","unstructured":"Su Y, Li D, Chen X (2021) Lung nodule detection based on faster r-cnn framework. Comput Methods Prog Biomed 200:105866","journal-title":"Comput Methods Prog Biomed"},{"key":"18866_CR147","doi-asserted-by":"crossref","unstructured":"Liu W,\u00a0Anguelov D,\u00a0Erhan D,\u00a0Szegedy C,\u00a0Reed S, Fu C-Y, Berg AC (2016) Ssd: single shot multibox detector. In: Computer vision\u2013ECCV 2016: 14th European conference, Amsterdam, The Netherlands, October 11\u201314, 2016, proceedings, Part I 14. Springer, pp 21\u201337","DOI":"10.1007\/978-3-319-46448-0_2"},{"key":"18866_CR148","doi-asserted-by":"crossref","first-page":"102692","DOI":"10.1016\/j.scs.2020.102692","volume":"66","author":"P Nagrath","year":"2021","unstructured":"Nagrath P, Jain R, Madan A, Arora R, Kataria P, Hemanth J (2021) Ssdmnv2: A real time dnn-based face mask detection system using single shot multibox detector and mobilenetv2. Sustain Cities Soc 66:102692","journal-title":"Sustain Cities Soc"},{"key":"18866_CR149","doi-asserted-by":"crossref","first-page":"831","DOI":"10.1016\/j.procs.2018.07.112","volume":"133","author":"S Shinde","year":"2018","unstructured":"Shinde S, Kothari A, Gupta V (2018) Yolo based human action recognition and localization. Procedia Comput Sci 133:831\u2013838","journal-title":"Procedia Comput Sci"},{"key":"18866_CR150","doi-asserted-by":"publisher","unstructured":"Redmon J,\u00a0Farhadi A (2017) Yolo9000: better, faster, stronger. In: 2017 IEEE conference on computer vision and pattern recognition (CVPR). IEEE. https:\/\/doi.org\/10.1109\/cvpr.2017.690","DOI":"10.1109\/cvpr.2017.690"},{"key":"18866_CR151","doi-asserted-by":"crossref","unstructured":"Wu X,\u00a0Sun S,\u00a0Chen N,\u00a0Fu M,\u00a0Hou X (2020) Real-time vehicle color recognition based on yolo9000. In: Communications, signal processing, and systems: proceedings of the 2018 CSPS Volume II: Signal Processing 7th. Springer, pp 82\u201389","DOI":"10.1007\/978-981-13-6504-1_11"},{"key":"18866_CR152","doi-asserted-by":"crossref","first-page":"1347","DOI":"10.1007\/s10044-021-00989-7","volume":"24","author":"C Xianbao","year":"2021","unstructured":"Xianbao C, Guihua Q, Yu J, Zhaomin Z (2021) An improved small object detection method based on yolo v3. Pattern Anal Applic 24:1347\u20131355","journal-title":"Pattern Anal Applic"},{"issue":"1","key":"18866_CR153","doi-asserted-by":"crossref","first-page":"1447","DOI":"10.1038\/s41598-021-81216-5","volume":"11","author":"MO Lawal","year":"2021","unstructured":"Lawal MO (2021) Tomato detection based on modified yolov3 framework. Sci Rep 11(1):1447","journal-title":"Sci Rep"},{"issue":"10","key":"18866_CR154","doi-asserted-by":"crossref","first-page":"3374","DOI":"10.3390\/s21103374","volume":"21","author":"H Liu","year":"2021","unstructured":"Liu H, Fan K, Ouyang Q, Li N (2021) Real-time small drones detection based on pruned yolov4. Sensors 21(10):3374","journal-title":"Sensors"},{"key":"18866_CR155","doi-asserted-by":"crossref","first-page":"106135","DOI":"10.1016\/j.compag.2021.106135","volume":"185","author":"X Hu","year":"2021","unstructured":"Hu X, Liu Y, Zhao Z, Liu J, Yang X, Sun C, Chen S, Li B, Zhou C (2021) Real-time detection of uneaten feed pellets in underwater images for aquaculture using an improved yolo-v4 network. Comput Electron Agric 185:106135","journal-title":"Comput Electron Agric"},{"issue":"10","key":"18866_CR156","doi-asserted-by":"crossref","first-page":"e0259283","DOI":"10.1371\/journal.pone.0259283","volume":"16","author":"W Wu","year":"2021","unstructured":"Wu W, Liu H, Li L, Long Y, Wang X, Wang Z, Li J, Chang Y (2021) Application of local fully convolutional neural network combined with yolo v5 algorithm in small target detection of remote sensing image. PloS one 16(10):e0259283","journal-title":"PloS one"},{"issue":"10","key":"18866_CR157","doi-asserted-by":"crossref","first-page":"e0259283","DOI":"10.1371\/journal.pone.0259283","volume":"16","author":"W Wu","year":"2021","unstructured":"Wu W, Liu H, Li L, Long Y, Wang X, Wang Z, Li J, Chang Y (2021) Application of local fully convolutional neural network combined with yolo v5 algorithm in small target detection of remote sensing image. PloS one 16(10):e0259283","journal-title":"PloS one"},{"key":"18866_CR158","unstructured":"Li C,\u00a0Li L,\u00a0Jiang H,\u00a0Weng K,\u00a0Geng Y,\u00a0Li L,\u00a0Ke Z,\u00a0Li Q,\u00a0Cheng M,\u00a0Nie W et\u00a0al (2022) Yolov6: a single-stage object detection framework for industrial applications. arXiv:2209.02976"},{"issue":"6","key":"18866_CR159","doi-asserted-by":"crossref","first-page":"3161","DOI":"10.3390\/s23063161","volume":"23","author":"S Norkobil Saydirasulovich","year":"2023","unstructured":"Norkobil Saydirasulovich S, Abdusalomov A, Jamil MK, Nasimov R, Kozhamzharova D, Cho Y-I (2023) A yolov6-based improved fire detection approach for smart city environments. Sensors 23(6):3161","journal-title":"Sensors"},{"key":"18866_CR160","doi-asserted-by":"crossref","unstructured":"Zhao H,\u00a0Zhang H,\u00a0Zhao Y (2023) Yolov7-sea: object detection of maritime uav images based on improved yolov7. In: Proceedings of the IEEE\/CVF winter conference on applications of computer vision, pp 233\u2013238","DOI":"10.1109\/WACVW58289.2023.00029"},{"issue":"17","key":"18866_CR161","doi-asserted-by":"crossref","first-page":"3612","DOI":"10.3390\/electronics12173612","volume":"12","author":"G Wei","year":"2023","unstructured":"Wei G, Wan F, Zhou W, Xu C, Ye Z, Liu W, Lei G, Xu L (2023) Bfd-yolo: a yolov7-based detection method for building fa\u00e7ade defects. Electronics 12(17):3612","journal-title":"Electronics"},{"key":"18866_CR162","doi-asserted-by":"crossref","unstructured":"Sohan M,\u00a0Sai\u00a0Ram T,\u00a0Reddy R,\u00a0Venkata C (2024) A review on yolov8 and its advancements. In: International conference on data intelligence and cognitive informatics. Springer, pp 529\u2013545","DOI":"10.1007\/978-981-99-7962-2_39"},{"issue":"7","key":"18866_CR163","doi-asserted-by":"crossref","first-page":"226","DOI":"10.4236\/jcc.2023.117014","volume":"11","author":"Z Huang","year":"2023","unstructured":"Huang Z, Li L, Krizek GC, Sun L (2023) Research on traffic sign detection based on improved yolov8. J Comput Commun 11(7):226\u2013232","journal-title":"J Comput Commun"},{"key":"18866_CR164","doi-asserted-by":"crossref","unstructured":"Yi H,\u00a0Liu B,\u00a0Zhao B,\u00a0Liu E (2023) Small object detection algorithm based on improved yolov8 for remote sensing. IEEE J Sel Top Appl Earth Obs Remote Sens","DOI":"10.1109\/JSTARS.2023.3339235"},{"issue":"6","key":"18866_CR165","first-page":"561","volume":"63","author":"A Chaturvedi","year":"2020","unstructured":"Chaturvedi A, Rajpoot V (2020) An optimized deep vision framework. Solid State Technol 63(6):561\u2013569","journal-title":"Solid State Technol"},{"key":"18866_CR166","unstructured":"Lin M,\u00a0Li C,\u00a0Bu X,\u00a0Sun M,\u00a0Lin C,\u00a0Yan J,\u00a0Ouyang W,\u00a0Deng Z (2020) Detr for crowd pedestrian detection. arXiv:2012.06785"},{"issue":"22","key":"18866_CR167","doi-asserted-by":"crossref","first-page":"7057","DOI":"10.1080\/01431161.2023.2277167","volume":"44","author":"M Sivapriya","year":"2023","unstructured":"Sivapriya M, Suresh S (2023) Vit-dexinet: a vision transformer-based edge detection operator for small object detection in sar images. Int J Remote Sens 44(22):7057\u20137084","journal-title":"Int J Remote Sens"},{"key":"18866_CR168","doi-asserted-by":"crossref","unstructured":"Liu Z,\u00a0Lin Y,\u00a0Cao Y,\u00a0Hu H,\u00a0Wei Y,\u00a0Zhang Z,\u00a0Lin S,\u00a0Guo B (2021) Swin transformer: hierarchical vision transformer using shifted windows. In: Proceedings of the IEEE\/CVF international conference on computer vision, pp 10\u00a0012\u201310\u00a0022","DOI":"10.1109\/ICCV48922.2021.00986"},{"key":"18866_CR169","doi-asserted-by":"crossref","first-page":"103689","DOI":"10.1016\/j.compind.2022.103689","volume":"140","author":"L Gao","year":"2022","unstructured":"Gao L, Zhang J, Yang C, Zhou Y (2022) Cas-vswin transformer: a variant swin transformer for surface-defect detection. Comput Ind 140:103689","journal-title":"Comput Ind"}],"container-title":["Multimedia Tools and Applications"],"original-title":[],"language":"en","link":[{"URL":"https:\/\/link.springer.com\/content\/pdf\/10.1007\/s11042-024-18866-w.pdf","content-type":"application\/pdf","content-version":"vor","intended-application":"text-mining"},{"URL":"https:\/\/link.springer.com\/article\/10.1007\/s11042-024-18866-w\/fulltext.html","content-type":"text\/html","content-version":"vor","intended-application":"text-mining"},{"URL":"https:\/\/link.springer.com\/content\/pdf\/10.1007\/s11042-024-18866-w.pdf","content-type":"application\/pdf","content-version":"vor","intended-application":"similarity-checking"}],"deposited":{"date-parts":[[2024,12,23]],"date-time":"2024-12-23T12:12:18Z","timestamp":1734955938000},"score":1,"resource":{"primary":{"URL":"https:\/\/link.springer.com\/10.1007\/s11042-024-18866-w"}},"subtitle":[],"short-title":[],"issued":{"date-parts":[[2024,3,26]]},"references-count":169,"journal-issue":{"issue":"41","published-online":{"date-parts":[[2024,12]]}},"alternative-id":["18866"],"URL":"https:\/\/doi.org\/10.1007\/s11042-024-18866-w","relation":{},"ISSN":["1573-7721"],"issn-type":[{"value":"1573-7721","type":"electronic"}],"subject":[],"published":{"date-parts":[[2024,3,26]]},"assertion":[{"value":"2 January 2024","order":1,"name":"received","label":"Received","group":{"name":"ArticleHistory","label":"Article History"}},{"value":"13 February 2024","order":2,"name":"revised","label":"Revised","group":{"name":"ArticleHistory","label":"Article History"}},{"value":"3 March 2024","order":3,"name":"accepted","label":"Accepted","group":{"name":"ArticleHistory","label":"Article History"}},{"value":"26 March 2024","order":4,"name":"first_online","label":"First Online","group":{"name":"ArticleHistory","label":"Article History"}},{"order":1,"name":"Ethics","group":{"name":"EthicsHeading","label":"Declarations"}},{"value":"There are no conflicts of interest to disclose.","order":2,"name":"Ethics","group":{"name":"EthicsHeading","label":"Conflicts of interest"}}]}}