{"status":"ok","message-type":"work","message-version":"1.0.0","message":{"indexed":{"date-parts":[[2026,6,3]],"date-time":"2026-06-03T00:48:55Z","timestamp":1780447735561,"version":"3.54.1"},"reference-count":407,"publisher":"Springer Science and Business Media LLC","issue":"4","license":[{"start":{"date-parts":[[2023,6,24]],"date-time":"2023-06-24T00:00:00Z","timestamp":1687564800000},"content-version":"tdm","delay-in-days":0,"URL":"https:\/\/www.springernature.com\/gp\/researchers\/text-and-data-mining"},{"start":{"date-parts":[[2023,6,24]],"date-time":"2023-06-24T00:00:00Z","timestamp":1687564800000},"content-version":"vor","delay-in-days":0,"URL":"https:\/\/www.springernature.com\/gp\/researchers\/text-and-data-mining"}],"content-domain":{"domain":["link.springer.com"],"crossmark-restriction":false},"short-container-title":["Multimed Tools Appl"],"published-print":{"date-parts":[[2024,1]]},"DOI":"10.1007\/s11042-023-15981-y","type":"journal-article","created":{"date-parts":[[2023,6,24]],"date-time":"2023-06-24T11:46:34Z","timestamp":1687607194000},"page":"12253-12338","update-policy":"https:\/\/doi.org\/10.1007\/springer_crossmark_policy","source":"Crossref","is-referenced-by-count":57,"title":["A systematic review of object detection from images using deep learning"],"prefix":"10.1007","volume":"83","author":[{"ORCID":"https:\/\/orcid.org\/0000-0001-8819-7327","authenticated-orcid":false,"given":"Jaskirat","family":"Kaur","sequence":"first","affiliation":[],"role":[{"vocabulary":"crossref","role":"author"}]},{"given":"Williamjeet","family":"Singh","sequence":"additional","affiliation":[],"role":[{"vocabulary":"crossref","role":"author"}]}],"member":"297","published-online":{"date-parts":[[2023,6,24]]},"reference":[{"issue":"3","key":"15981_CR1","doi-asserted-by":"publisher","first-page":"1421","DOI":"10.1007\/s13369-019-03969-6","volume":"45","author":"M Ahmadi","year":"2020","unstructured":"Ahmadi M, Ouarda W, Alimi AM (2020) Efficient and Fast Objects Detection Technique for Intelligent Video Surveillance Using Transfer Learning and Fine-Tuning. Arab J Sci Eng 45(3):1421\u20131433. https:\/\/doi.org\/10.1007\/s13369-019-03969-6","journal-title":"Arab J Sci Eng"},{"issue":"1","key":"15981_CR2","doi-asserted-by":"publisher","first-page":"98","DOI":"10.1007\/s13177-019-00178-1","volume":"18","author":"A Alam","year":"2020","unstructured":"Alam A, Jaffery ZA (2020) Indian Traffic Sign Detection and Recognition. Int J Intell Transp Syst Res 18(1):98\u2013112. https:\/\/doi.org\/10.1007\/s13177-019-00178-1","journal-title":"Int J Intell Transp Syst Res"},{"key":"15981_CR3","unstructured":"Alom MZ, Taha TM, Yakopcic C, et al 2018 The History Began from AlexNet: A Comprehensive Survey on Deep Learning Approaches"},{"issue":"2s","key":"15981_CR4","doi-asserted-by":"publisher","first-page":"1","DOI":"10.1145\/3441656","volume":"17","author":"N An","year":"2021","unstructured":"An N, Qi Yan W (2021) Multitarget Tracking Using Siamese Neural Networks. ACM Trans Multimed Comput Commun Appl 17(2s):1\u201316. https:\/\/doi.org\/10.1145\/3441656","journal-title":"ACM Trans Multimed Comput Commun Appl"},{"key":"15981_CR5","doi-asserted-by":"publisher","unstructured":"Andrianov DE, Eremeev SV and Kuptsov KV 2015 The Review of Spatial Objects Recognition Models and Algorithms. Procedia Eng 129374\u2013379. https:\/\/doi.org\/10.1016\/j.proeng.2015.12.126","DOI":"10.1016\/j.proeng.2015.12.126"},{"key":"15981_CR6","doi-asserted-by":"crossref","unstructured":"Antioquia AMC, Tan DS, Azcarraga A, et al 2018 ZipNet: ZFNet-level Accuracy with 48\u00d7 Fewer Parameters. In: VCIP 2018 - IEEE International Conference on Visual Communications and Image Processing. IEEE, 1\u20134","DOI":"10.1109\/VCIP.2018.8698672"},{"issue":"10","key":"15981_CR7","doi-asserted-by":"publisher","first-page":"3782","DOI":"10.1109\/TITS.2019.2892405","volume":"20","author":"E Arnold","year":"2019","unstructured":"Arnold E, Al-Jarrah OY, Dianati M et al (2019) A Survey on 3D Object Detection Methods for Autonomous Driving Applications. IEEE Trans Intell Transp Syst 20(10):3782\u20133795. https:\/\/doi.org\/10.1109\/TITS.2019.2892405","journal-title":"IEEE Trans Intell Transp Syst"},{"key":"15981_CR8","doi-asserted-by":"publisher","unstructured":"Aslam A and Curry E 2021 A Survey on Object Detection for the Internet of Multimedia Things (IoMT) using Deep Learning and Event-based Middleware: Approaches, Challenges, and Future Directions. Image Vis Comput 106104095. https:\/\/doi.org\/10.1016\/j.imavis.2020.104095","DOI":"10.1016\/j.imavis.2020.104095"},{"key":"15981_CR9","unstructured":"Athanasiadis I, Mousouliotis P and Petrou L 2018 A framework of transfer learning in object detection for embedded systems. arXiv"},{"key":"15981_CR10","doi-asserted-by":"publisher","unstructured":"Ayalew AM, Salau AO, Abeje BT and Enyew B 2022 Detection and classification of COVID-19 disease from X-ray images using convolutional neural networks and histogram of oriented gradients. Biomed Signal Process Control 74(October 2021): 1\u201311. https:\/\/doi.org\/10.1016\/j.bspc.2022.103530","DOI":"10.1016\/j.bspc.2022.103530"},{"key":"15981_CR11","doi-asserted-by":"publisher","unstructured":"Aziz L, Salam MSBH, Sheikh UU and Ayub S 2020 Exploring deep learning-based architecture, strategies, applications and current trends in generic object detection: A comprehensive review. IEEE Access 8170461\u2013170495. https:\/\/doi.org\/10.1109\/ACCESS.2020.3021508","DOI":"10.1109\/ACCESS.2020.3021508"},{"key":"15981_CR12","first-page":"851","volume-title":"In: 2018 21st International Conference on Intelligent Transportation Systems (ITSC)","author":"M Bach","year":"2018","unstructured":"Bach M, Stumper D, Dietmayer K (2018) Deep Convolutional Traffic Light Recognition for Automated Driving. In: In: 2018 21st International Conference on Intelligent Transportation Systems (ITSC). IEEE, pp 851\u2013858"},{"key":"15981_CR13","first-page":"9365","volume-title":"In: 2019 IEEE\/CVF Conference on Computer Vision and Pattern Recognition (CVPR)","author":"Y Baek","year":"2019","unstructured":"Baek Y, Lee B, Han D et al (2019) Character Region Awareness for Text Detection. In: In: 2019 IEEE\/CVF Conference on Computer Vision and Pattern Recognition (CVPR). IEEE, pp 9365\u20139374"},{"key":"15981_CR14","doi-asserted-by":"publisher","unstructured":"Bamne B, Shrivastava N, Parashar L and Singh U 2020 Transfer learning-based Object Detection by using Convolutional Neural Networks. Proc Int Conf Electron Sustain Commun Syst ICESC 2020 (Icesc): 328\u2013332. https:\/\/doi.org\/10.1109\/ICESC48915.2020.9156060","DOI":"10.1109\/ICESC48915.2020.9156060"},{"key":"15981_CR15","doi-asserted-by":"crossref","unstructured":"Banerjee K, Notz D, Windelen J, et al 2018 Online Camera LiDAR Fusion and Object Detection on Hybrid Data for Autonomous Driving. In: 2018 IEEE Intelligent Vehicles Symposium (IV). IEEE, 1632\u20131638","DOI":"10.1109\/IVS.2018.8500699"},{"key":"15981_CR16","doi-asserted-by":"crossref","unstructured":"Behrendt K, Novak L and Botros R 2017 A deep learning approach to traffic lights: Detection, tracking, and classification. In: 2017 IEEE International Conference on Robotics and Automation (ICRA). IEEE, 1370\u20131377","DOI":"10.1109\/ICRA.2017.7989163"},{"key":"15981_CR17","doi-asserted-by":"crossref","unstructured":"Bergstrom T and Shi H 2020 Human-Object Interaction Detection: A Quick Survey and Examination of Methods Trevor. In: Proceedings of the 1st International Workshop on Human-centric Multimedia Analysis. ACM, New York, NY, USA, 63\u201371","DOI":"10.1145\/3422852.3423481"},{"issue":"3","key":"15981_CR18","doi-asserted-by":"publisher","first-page":"362","DOI":"10.1080\/16168658.2019.1611030","volume":"10","author":"D Bhamare","year":"2018","unstructured":"Bhamare D, Suryawanshi P (2018) Review on Reliable Pattern Recognition with Machine Learning Techniques. Fuzzy Inf Eng 10(3):362\u2013377. https:\/\/doi.org\/10.1080\/16168658.2019.1611030","journal-title":"Fuzzy Inf Eng"},{"key":"15981_CR19","unstructured":"Bochkovskiy A, Wang C and Liao HM 2020 YOLOv4: Optimal Speed and Accuracy of Object Detection"},{"key":"15981_CR20","doi-asserted-by":"crossref","unstructured":"Borisyuk F, Gordo A and Sivakumar V 2018 Rosetta: Large scale system for text detection and recognition in images. In: Proceedings of the 24th ACM SIGKDD International Conference on Knowledge Discovery & Data Mining. ACM, New York, NY, USA, 71\u201379","DOI":"10.1145\/3219819.3219861"},{"issue":"2","key":"15981_CR21","doi-asserted-by":"publisher","first-page":"117","DOI":"10.1007\/s41095-019-0149-9","volume":"5","author":"A Borji","year":"2019","unstructured":"Borji A, Cheng M-M, Hou Q et al (2019) Salient object detection: A survey. Comput Vis Media 5(2):117\u2013150. https:\/\/doi.org\/10.1007\/s41095-019-0149-9","journal-title":"Comput Vis Media"},{"key":"15981_CR22","doi-asserted-by":"publisher","unstructured":"Boruah A, Kakoty NM, Ali T (2018) Object Recognition based on Surface Detection-A Review. Procedia Comput Sci 13363\u201374. https:\/\/doi.org\/10.1016\/j.procs.2018.07.009","DOI":"10.1016\/j.procs.2018.07.009"},{"key":"15981_CR23","doi-asserted-by":"crossref","unstructured":"Bouras C and Michos E 2022 An online real-time face recognition system for police purposes. In: 2022 International Conference on Information Networking (ICOIN). IEEE, 62\u201367","DOI":"10.1109\/ICOIN53446.2022.9687212"},{"issue":"8","key":"15981_CR24","doi-asserted-by":"publisher","first-page":"1844","DOI":"10.1109\/TPAMI.2019.2897684","volume":"41","author":"M Braun","year":"2019","unstructured":"Braun M, Krebs S, Flohr F, Gavrila DM (2019) EuroCity Persons: A Novel Benchmark for Person Detection in Traffic Scenes. IEEE Trans Pattern Anal Mach Intell 41(8):1844\u20131861. https:\/\/doi.org\/10.1109\/TPAMI.2019.2897684","journal-title":"IEEE Trans Pattern Anal Mach Intell"},{"key":"15981_CR25","doi-asserted-by":"publisher","unstructured":"Burlina P, Pacheco KD, Joshi N, et al 2017 Comparing humans and deep learning performance for grading AMD: A study in using universal deep features and transfer learning for automated AMD analysis. Comput Biol Med 8280\u201386. https:\/\/doi.org\/10.1016\/j.compbiomed.2017.01.018","DOI":"10.1016\/j.compbiomed.2017.01.018"},{"key":"15981_CR26","doi-asserted-by":"crossref","unstructured":"Caesar H, Bankiti V, Lang AH, et al 2020 nuScenes: A Multimodal Dataset for Autonomous Driving. In: 2020 IEEE\/CVF Conference on Computer Vision and Pattern Recognition (CVPR). IEEE, 11618\u201311628","DOI":"10.1109\/CVPR42600.2020.01164"},{"key":"15981_CR27","doi-asserted-by":"crossref","unstructured":"Cao Z, Simon T, Wei S-E and Sheikh Y 2017 Realtime Multi-person 2D Pose Estimation Using Part Affinity Fields. In: 2017 IEEE Conference on Computer Vision and Pattern Recognition (CVPR). IEEE, 1302\u20131310","DOI":"10.1109\/CVPR.2017.143"},{"key":"15981_CR28","doi-asserted-by":"crossref","unstructured":"Cao Y, Peng H, Wu J, et al 2021 Knowledge-Preserving Incremental Social Event Detection via Heterogeneous GNNs. In: Proceedings of the Web Conference 2021. ACM, New York, NY, USA, 3383\u20133395","DOI":"10.1145\/3442381.3449834"},{"key":"15981_CR29","doi-asserted-by":"crossref","unstructured":"Ch\u2019ng CK and Chan CS 2017 Total-Text: A Comprehensive Dataset for Scene Text Detection and Recognition. In: 2017 14th IAPR International Conference on Document Analysis and Recognition (ICDAR). IEEE, 935\u2013942","DOI":"10.1109\/ICDAR.2017.157"},{"key":"15981_CR30","unstructured":"Chahal KS and Dey K 2018 A Survey of Modern Object Detection Literature using Deep Learning. arXiv"},{"key":"15981_CR31","doi-asserted-by":"publisher","unstructured":"Chapel MN and Bouwmans T 2020 Moving objects detection with a moving camera: A comprehensive review. Comput Sci Rev 38100310. https:\/\/doi.org\/10.1016\/j.cosrev.2020.100310","DOI":"10.1016\/j.cosrev.2020.100310"},{"key":"15981_CR32","doi-asserted-by":"publisher","unstructured":"Chen Q, Wang P, Cheng A, et al. 2020 Robust one-stage object detection with location-aware classifiers. Pattern Recognit 105. https:\/\/doi.org\/10.1016\/j.patcog.2020.107334","DOI":"10.1016\/j.patcog.2020.107334"},{"key":"15981_CR33","doi-asserted-by":"crossref","unstructured":"Chen Y, Wang W, Zhou Y, et al 2021 Self-Training for Domain Adaptive Scene Text Detection. In: 2020 25th International Conference on Pattern Recognition (ICPR). IEEE, 850\u2013857","DOI":"10.1109\/ICPR48806.2021.9412558"},{"issue":"4","key":"15981_CR34","doi-asserted-by":"publisher","first-page":"1121","DOI":"10.1007\/s11263-020-01412-0","volume":"129","author":"Z Chen","year":"2021","unstructured":"Chen Z, Ouyang W, Liu T, Tao D (2021) A Shape Transformation-based Dataset Augmentation Framework for Pedestrian Detection. Int J Comput Vis 129(4):1121\u20131138. https:\/\/doi.org\/10.1007\/s11263-020-01412-0","journal-title":"Int J Comput Vis"},{"issue":"1","key":"15981_CR35","doi-asserted-by":"publisher","first-page":"83","DOI":"10.1080\/07038992.2021.1894915","volume":"47","author":"Z Chen","year":"2021","unstructured":"Chen Z, Luo R, Li J et al (2021) U-Net Based Road Area Guidance for Crosswalks Detection from Remote Sensing Images. Can J Remote Sens 47(1):83\u201399. https:\/\/doi.org\/10.1080\/07038992.2021.1894915","journal-title":"Can J Remote Sens"},{"key":"15981_CR36","doi-asserted-by":"publisher","unstructured":"Chen J, Bai S, Wan G, Li Y (2023) Research on YOLOv7-based defect detection method for automotive running lights. Syst Sci Control Eng 11(1). https:\/\/doi.org\/10.1080\/21642583.2023.2185916","DOI":"10.1080\/21642583.2023.2185916"},{"key":"15981_CR37","doi-asserted-by":"publisher","unstructured":"Cheng G and Han J 2016 A survey on object detection in optical remote sensing images. ISPRS J Photogramm Remote Sens 11711\u201328. https:\/\/doi.org\/10.1016\/j.isprsjprs.2016.03.014","DOI":"10.1016\/j.isprsjprs.2016.03.014"},{"key":"15981_CR38","doi-asserted-by":"publisher","unstructured":"Cheng M, Su J, Li L and Zhou X 2020 A-DFPN: Adversarial Learning and Deformation Feature Pyramid Networks for Object Detection. 2020 IEEE 5th Int Conf Image, Vis Comput ICIVC 2020 11\u201318. https:\/\/doi.org\/10.1109\/ICIVC50857.2020.9177437","DOI":"10.1109\/ICIVC50857.2020.9177437"},{"key":"15981_CR39","doi-asserted-by":"publisher","unstructured":"Chetouane A, Mabrouk S, Jemili I and Mosbah M 2020 Vision-based vehicle detection for road traffic congestion classification. Concurr Comput (July): 1\u201327. https:\/\/doi.org\/10.1002\/cpe.5983","DOI":"10.1002\/cpe.5983"},{"issue":"2","key":"15981_CR40","doi-asserted-by":"publisher","first-page":"222","DOI":"10.1016\/j.icte.2021.12.016","volume":"9","author":"JD Choi","year":"2023","unstructured":"Choi JD, Kim MY (2023) A sensor fusion system with thermal infrared camera and LiDAR for autonomous vehicles and deep learning based object detection. ICT Express 9(2):222\u2013227. https:\/\/doi.org\/10.1016\/j.icte.2021.12.016","journal-title":"ICT Express"},{"issue":"2","key":"15981_CR41","doi-asserted-by":"publisher","first-page":"179","DOI":"10.1016\/j.cviu.2011.10.007","volume":"116","author":"J Choi","year":"2012","unstructured":"Choi J, Chang HJ, Yoo YJ, Choi JY (2012) Robust moving object detection against fast illumination change. Comput Vis Image Underst 116(2):179\u2013193. https:\/\/doi.org\/10.1016\/j.cviu.2011.10.007","journal-title":"Comput Vis Image Underst"},{"key":"15981_CR42","doi-asserted-by":"publisher","unstructured":"Cole JH, Poudel RPK, Tsagkrasoulis D, et al 2017 Predicting brain age with deep learning from raw imaging data results in a reliable and heritable biomarker. Neuroimage 163115\u2013124. https:\/\/doi.org\/10.1016\/j.neuroimage.2017.07.059","DOI":"10.1016\/j.neuroimage.2017.07.059"},{"key":"15981_CR43","doi-asserted-by":"crossref","unstructured":"Cordts M, Omran M, Ramos S, et al 2016 The Cityscapes Dataset for Semantic Urban Scene Understanding. In: 2016 IEEE Conference on Computer Vision and Pattern Recognition (CVPR). IEEE, 3213\u20133223","DOI":"10.1109\/CVPR.2016.350"},{"key":"15981_CR44","unstructured":"Dai J, Li Y, He K and Sun J 2016 R-FCN: Object Detection via Region-based Fully Convolutional Networks. Adv Neural Inf Process Syst 379\u2013387"},{"key":"15981_CR45","doi-asserted-by":"crossref","unstructured":"Dai J, Qi H, Xiong Y, et al 2017 Deformable Convolutional Networks. In: 2017 IEEE International Conference on Computer Vision (ICCV). IEEE, 764\u2013773","DOI":"10.1109\/ICCV.2017.89"},{"key":"15981_CR46","doi-asserted-by":"crossref","unstructured":"Dalal N and Triggs B 2005 Histograms of Oriented Gradients for Human Detection. In: 2005 IEEE Computer Society Conference on Computer Vision and Pattern Recognition (CVPR\u201905). IEEE, 886\u2013893","DOI":"10.1109\/CVPR.2005.177"},{"key":"15981_CR47","doi-asserted-by":"publisher","unstructured":"De Cesaro J\u00fanior T and Rieder R 2020 Automatic identification of insects from digital images: A survey. Comput Electron Agric 178(September): 105784. https:\/\/doi.org\/10.1016\/j.compag.2020.105784","DOI":"10.1016\/j.compag.2020.105784"},{"key":"15981_CR48","doi-asserted-by":"crossref","unstructured":"de Charette R and Nashashibi F 2009 Traffic light recognition using image processing compared to learning processes. In: 2009 IEEE\/RSJ International Conference on Intelligent Robots and Systems. IEEE, 333\u2013338","DOI":"10.1109\/IROS.2009.5353941"},{"key":"15981_CR49","doi-asserted-by":"crossref","unstructured":"Deng J, Dong W, Socher R, et al 2009 ImageNet: A large-scale hierarchical image database. In: 2009 IEEE Conference on Computer Vision and Pattern Recognition. IEEE, 248\u2013255","DOI":"10.1109\/CVPR.2009.5206848"},{"issue":"June","key":"15981_CR50","doi-asserted-by":"publisher","first-page":"1","DOI":"10.1016\/j.isprsjprs.2018.04.003","volume":"145","author":"Z Deng","year":"2018","unstructured":"Deng Z, Sun H, Zhou S et al (2018) Multi-scale object detection in remote sensing imagery with convolutional neural networks. ISPRS J Photogramm Remote Sens 145(June):1\u201321. https:\/\/doi.org\/10.1016\/j.isprsjprs.2018.04.003","journal-title":"ISPRS J Photogramm Remote Sens"},{"issue":"4","key":"15981_CR51","doi-asserted-by":"publisher","first-page":"673","DOI":"10.1049\/iet-ipr.2018.5985","volume":"13","author":"B Dey","year":"2019","unstructured":"Dey B, Kundu MK (2019) Turning video into traffic data - An application to urban intersection analysis using transfer learning. IET Image Process 13(4):673\u2013679. https:\/\/doi.org\/10.1049\/iet-ipr.2018.5985","journal-title":"IET Image Process"},{"issue":"2","key":"15981_CR52","doi-asserted-by":"publisher","first-page":"85","DOI":"10.1007\/s13748-019-00203-0","volume":"9","author":"A Dhillon","year":"2020","unstructured":"Dhillon A, Verma GK (2020) Convolutional neural network: a review of models, methodologies and applications to object detection. Prog Artif Intell 9(2):85\u2013112. https:\/\/doi.org\/10.1007\/s13748-019-00203-0","journal-title":"Prog Artif Intell"},{"issue":"June 2017","key":"15981_CR53","doi-asserted-by":"publisher","first-page":"208","DOI":"10.1016\/j.isprsjprs.2018.05.005","volume":"141","author":"P Ding","year":"2018","unstructured":"Ding P, Zhang Y, Deng W-J et al (2018) A light and faster regional convolutional neural network for object detection in optical remote sensing images. ISPRS J Photogramm Remote Sens 141(June 2017):208\u2013218. https:\/\/doi.org\/10.1016\/j.isprsjprs.2018.05.005","journal-title":"ISPRS J Photogramm Remote Sens"},{"key":"15981_CR54","doi-asserted-by":"crossref","unstructured":"Dollar P, Wojek C, Schiele B and Perona P 2009 Pedestrian detection: A benchmark. In: 2009 IEEE Conference on Computer Vision and Pattern Recognition. IEEE, 304\u2013311","DOI":"10.1109\/CVPR.2009.5206631"},{"key":"15981_CR55","doi-asserted-by":"crossref","unstructured":"Dollar P, Wojek C, Schiele B and Perona P 2012 Pedestrian Detection: An Evaluation of the State of the Art. In: IEEE Transactions on Pattern Analysis and Machine Intelligence. 743\u2013761","DOI":"10.1109\/TPAMI.2011.155"},{"key":"15981_CR56","doi-asserted-by":"crossref","unstructured":"Dominguez-Sanchez A, Orts-Escolano S, Garcia-Rodriguez J and Cazorla M 2018 A New Dataset and Performance Evaluation of a Region-based CNN for Urban Object Detection. In: 2018 International Joint Conference on Neural Networks (IJCNN). IEEE, 1\u20138","DOI":"10.1109\/IJCNN.2018.8489478"},{"issue":"22","key":"15981_CR57","doi-asserted-by":"publisher","first-page":"1","DOI":"10.1002\/cpe.4655","volume":"30","author":"M Du","year":"2018","unstructured":"Du M (2018) Mobile payment recognition technology based on face detection algorithm. Concurr Comput 30(22):1\u20139. https:\/\/doi.org\/10.1002\/cpe.4655","journal-title":"Concurr Comput"},{"issue":"00","key":"15981_CR58","doi-asserted-by":"publisher","first-page":"1","DOI":"10.1080\/17517575.2020.1791363","volume":"00","author":"F Du","year":"2020","unstructured":"Du F, Wang WL, Zhang Z (2020) Pedestrian detection based on a hybrid Gaussian model and support vector machine. Enterp Inf Syst 00(00):1\u201312. https:\/\/doi.org\/10.1080\/17517575.2020.1791363","journal-title":"Enterp Inf Syst"},{"key":"15981_CR59","doi-asserted-by":"crossref","unstructured":"Duan J, Xu Y, Kuang Z, et al 2019 Geometry Normalization Networks for Accurate Scene Text Detection. In: 2019 IEEE\/CVF International Conference on Computer Vision (ICCV). IEEE, 9137\u20139146","DOI":"10.1109\/ICCV.2019.00923"},{"issue":"8","key":"15981_CR60","doi-asserted-by":"publisher","first-page":"3329","DOI":"10.1002\/mp.13620","volume":"46","author":"MS Elmahdy","year":"2019","unstructured":"Elmahdy MS, Jagt T, Zinkstok RT et al (2019) Robust contour propagation using deep learning and image registration for online adaptive proton therapy of prostate cancer. Med Phys 46(8):3329\u20133343. https:\/\/doi.org\/10.1002\/mp.13620","journal-title":"Med Phys"},{"key":"15981_CR61","unstructured":"Ertler C, Mislej J, Ollmann T et al (2019) The Mapillary Traffic Sign Dataset for Detection and Classification on a Global Scale. Comput Vis Pattern Recognit:1\u201317"},{"issue":"1","key":"15981_CR62","doi-asserted-by":"publisher","first-page":"98","DOI":"10.1007\/s11263-014-0733-5","volume":"111","author":"M Everingham","year":"2015","unstructured":"Everingham M, Eslami SMA, Van Gool L et al (2015) The Pascal Visual Object Classes Challenge: A Retrospective. Int J Comput Vis 111(1):98\u2013136. https:\/\/doi.org\/10.1007\/s11263-014-0733-5","journal-title":"Int J Comput Vis"},{"key":"15981_CR63","doi-asserted-by":"crossref","unstructured":"Fan DP, Wang W, Cheng MM and Shen J 2019 Shifting more attention to video salient object detection. In: Proceedings of the IEEE Computer Society Conference on Computer Vision and Pattern Recognition. 8546\u20138556","DOI":"10.1109\/CVPR.2019.00875"},{"key":"15981_CR64","doi-asserted-by":"crossref","unstructured":"Fan D, Fang S, Liu X, et al 2019 A multi-scale face detection algorithm based on improved SSD model. In: Proceedings of the ACM Turing Celebration Conference - China. ACM, New York, NY, USA, 1\u20139","DOI":"10.1145\/3321408.3321419"},{"key":"15981_CR65","doi-asserted-by":"crossref","unstructured":"Fan D-P, Ji G-P, Zhou T, et al 2020 PraNet: Parallel Reverse Attention Network for Polyp Segmentation. In: The Legal Literature of Accounting. 263\u2013273","DOI":"10.1007\/978-3-030-59725-2_26"},{"issue":"8","key":"15981_CR66","doi-asserted-by":"publisher","first-page":"2626","DOI":"10.1109\/TMI.2020.2996645","volume":"39","author":"DP Fan","year":"2020","unstructured":"Fan DP, Zhou T, Ji GP et al (2020) Inf-Net: Automatic COVID-19 Lung Infection Segmentation from CT Images. IEEE Trans Med Imaging 39(8):2626\u20132637. https:\/\/doi.org\/10.1109\/TMI.2020.2996645","journal-title":"IEEE Trans Med Imaging"},{"key":"15981_CR67","doi-asserted-by":"publisher","unstructured":"Fang F, Li L, Gu Y et al (2020) A novel hybrid approach for crack detection. Pattern Recogn 107. https:\/\/doi.org\/10.1016\/j.patcog.2020.107474","DOI":"10.1016\/j.patcog.2020.107474"},{"key":"15981_CR68","doi-asserted-by":"publisher","unstructured":"Fernandes D, Silva A, N\u00e9voa R, et al 2021 Point-cloud based 3D object detection and classification methods for self-driving applications: A survey and taxonomy. Inf Fusion 68161\u2013191. https:\/\/doi.org\/10.1016\/j.inffus.2020.11.002","DOI":"10.1016\/j.inffus.2020.11.002"},{"key":"15981_CR69","doi-asserted-by":"crossref","unstructured":"Fregin A, Muller J, Krebel U and Dietmayer K 2018 The DriveU Traffic Light Dataset: Introduction and Comparison with Existing Datasets. In: 2018 IEEE International Conference on Robotics and Automation (ICRA). IEEE, 3376\u20133383","DOI":"10.1109\/ICRA.2018.8460737"},{"key":"15981_CR70","unstructured":"Fu C, Liu W, Ranga A, et al. 2017 DSSD: Deconvolutional Single Shot Detector"},{"issue":"January","key":"15981_CR71","doi-asserted-by":"publisher","first-page":"294","DOI":"10.1016\/j.isprsjprs.2020.01.025","volume":"161","author":"K Fu","year":"2020","unstructured":"Fu K, Chang Z, Zhang Y et al (2020) Rotation-aware and multi-scale convolutional neural network for object detection in remote sensing images. ISPRS J Photogramm Remote Sens 161(January):294\u2013308. https:\/\/doi.org\/10.1016\/j.isprsjprs.2020.01.025","journal-title":"ISPRS J Photogramm Remote Sens"},{"key":"15981_CR72","doi-asserted-by":"publisher","unstructured":"Gao X, Li W, Loomes M and Wang L 2017 A fused deep learning architecture for viewpoint classification of echocardiography. Inf Fusion 36103\u2013113. https:\/\/doi.org\/10.1016\/j.inffus.2016.11.007","DOI":"10.1016\/j.inffus.2016.11.007"},{"key":"15981_CR73","doi-asserted-by":"publisher","unstructured":"Gawande U, Hajari K and Golhar Y 2022 SIRA: Scale illumination rotation affine invariant mask R-CNN for pedestrian detection. Appl Intell. https:\/\/doi.org\/10.1007\/s10489-021-03073-z","DOI":"10.1007\/s10489-021-03073-z"},{"key":"15981_CR74","doi-asserted-by":"publisher","unstructured":"Gawande U, Hajari K and Golhar Y 2023 Real-Time Deep Learning Approach for Pedestrian Detection and Suspicious Activity Recognition. Procedia Comput Sci 2182438\u20132447. https:\/\/doi.org\/10.1016\/j.procs.2023.01.219","DOI":"10.1016\/j.procs.2023.01.219"},{"key":"15981_CR75","doi-asserted-by":"publisher","unstructured":"Ge C, Wang J, Wang J, et al 2020 Towards automatic visual inspection: A weakly supervised learning method for industrial applicable object detection. Comput Ind 121103232. https:\/\/doi.org\/10.1016\/j.compind.2020.103232","DOI":"10.1016\/j.compind.2020.103232"},{"key":"15981_CR76","doi-asserted-by":"publisher","unstructured":"Ge Z, Wang J, Huang X, et al 2021 LLA: Loss-aware label assignment for dense pedestrian detection. Neurocomputing 462272\u2013281. https:\/\/doi.org\/10.1016\/j.neucom.2021.07.094","DOI":"10.1016\/j.neucom.2021.07.094"},{"key":"15981_CR77","doi-asserted-by":"crossref","unstructured":"Geiger A, Lenz P and Urtasun R 2012 Are we ready for autonomous driving? The KITTI vision benchmark suite. In: 2012 IEEE Conference on Computer Vision and Pattern Recognition. IEEE, 3354\u20133361","DOI":"10.1109\/CVPR.2012.6248074"},{"key":"15981_CR78","doi-asserted-by":"crossref","unstructured":"Ghiasi G, Lin T-Y and Le Q V. 2019 NAS-FPN: Learning Scalable Feature Pyramid Architecture for Object Detection. In: 2019 IEEE\/CVF Conference on Computer Vision and Pattern Recognition (CVPR). IEEE, 7029\u20137038","DOI":"10.1109\/CVPR.2019.00720"},{"key":"15981_CR79","doi-asserted-by":"crossref","unstructured":"Girshick R 2015 Fast R-CNN. In: 2015 IEEE International Conference on Computer Vision (ICCV). IEEE, 1440\u20131448","DOI":"10.1109\/ICCV.2015.169"},{"key":"15981_CR80","doi-asserted-by":"crossref","unstructured":"Girshick R, Donahue J, Darrell T and Malik J 2014 Rich Feature Hierarchies for Accurate Object Detection and Semantic Segmentation. In: 2014 IEEE Conference on Computer Vision and Pattern Recognition. IEEE, 580\u2013587","DOI":"10.1109\/CVPR.2014.81"},{"issue":"1","key":"15981_CR81","doi-asserted-by":"publisher","first-page":"142","DOI":"10.1109\/TPAMI.2015.2437384","volume":"38","author":"R Girshick","year":"2015","unstructured":"Girshick R, Donahue J, Darrell T, Malik J (2015) Region-Based Convolutional Networks for Accurate Object Detection and Segmentation. IEEE Trans Pattern Anal Mach Intell 38(1):142\u2013158. https:\/\/doi.org\/10.1109\/TPAMI.2015.2437384","journal-title":"IEEE Trans Pattern Anal Mach Intell"},{"key":"15981_CR82","doi-asserted-by":"crossref","unstructured":"Goldman E, Herzig R, Eisenschtat A et al (2019) Precise Detection in Densely Packed Scenes. Comput Speech Lang 68101200","DOI":"10.1109\/CVPR.2019.00537"},{"key":"15981_CR83","doi-asserted-by":"crossref","unstructured":"Grosicki E, El-Abed H 2011 ICDAR 2011 - French Handwriting Recognition Competition. In: 2011 International Conference on Document Analysis and Recognition. IEEE, 1459\u20131463","DOI":"10.1109\/ICDAR.2011.290"},{"issue":"12","key":"15981_CR84","doi-asserted-by":"publisher","first-page":"2319","DOI":"10.1049\/iet-ipr.2018.5245","volume":"12","author":"WH Gu","year":"2018","unstructured":"Gu WH, Zhu Y, Chen XD et al (2018) Hierarchical CNN-based real-time fatigue detection system by visual-based technologies using MSP model. IET Image Process 12(12):2319\u20132329. https:\/\/doi.org\/10.1049\/iet-ipr.2018.5245","journal-title":"IET Image Process"},{"issue":"January","key":"15981_CR85","doi-asserted-by":"publisher","DOI":"10.1016\/j.cviu.2021.103170","volume":"204","author":"Z Guo","year":"2021","unstructured":"Guo Z, Yang G, Chen J, Sun X (2021) Fake face detection via adaptive manipulation traces extraction network. Comput Vis Image Underst 204(January):103170. https:\/\/doi.org\/10.1016\/j.cviu.2021.103170","journal-title":"Comput Vis Image Underst"},{"key":"15981_CR86","doi-asserted-by":"publisher","unstructured":"Guo Z, Liao W, Xiao Y, et al 2021 Weak segmentation supervised deep neural networks for pedestrian detection. Pattern Recognit 119108063. https:\/\/doi.org\/10.1016\/j.patcog.2021.108063","DOI":"10.1016\/j.patcog.2021.108063"},{"key":"15981_CR87","doi-asserted-by":"publisher","unstructured":"Gupta A, Anpalagan A, Guan L and Khwaja AS 2021 Deep learning for object detection and scene perception in self-driving cars: Survey, challenges, and open issues. Array 10(September 2020): 100057. https:\/\/doi.org\/10.1016\/j.array.2021.100057","DOI":"10.1016\/j.array.2021.100057"},{"issue":"3","key":"15981_CR88","doi-asserted-by":"publisher","first-page":"447","DOI":"10.1007\/s00371-020-01814-8","volume":"37","author":"S Gupta","year":"2021","unstructured":"Gupta S, Thakur K, Kumar M (2021) 2D-human face recognition using SIFT and SURF descriptors of face\u2019s feature regions. Vis Comput 37(3):447\u2013456. https:\/\/doi.org\/10.1007\/s00371-020-01814-8","journal-title":"Vis Comput"},{"key":"15981_CR89","doi-asserted-by":"crossref","unstructured":"Han K, Wang Y, Tian Q, et al. 2020 GhostNet: More Features From Cheap Operations. In: 2020 IEEE\/CVF Conference on Computer Vision and Pattern Recognition (CVPR). IEEE, 1577\u20131586","DOI":"10.1109\/CVPR42600.2020.00165"},{"key":"15981_CR90","doi-asserted-by":"crossref","unstructured":"Han J, Ding J, Xue N and Xia G-S 2021 ReDet: A Rotation-equivariant Detector for Aerial Object Detection. In: 2021 IEEE\/CVF Conference on Computer Vision and Pattern Recognition (CVPR). IEEE, 2785\u20132794","DOI":"10.1109\/CVPR46437.2021.00281"},{"key":"15981_CR91","doi-asserted-by":"publisher","unstructured":"Hangaragi S, Singh T and Neelima N 2023 Face Detection and Recognition Using Face Mesh and Deep Neural Network. Procedia Comput Sci 218741\u2013749. https:\/\/doi.org\/10.1016\/j.procs.2023.01.054","DOI":"10.1016\/j.procs.2023.01.054"},{"key":"15981_CR92","doi-asserted-by":"crossref","unstructured":"Hanyao M, Jin Y, Qian Z, et al 2021 Edge-assisted Online On-device Object Detection for Real-time Video Analytics. In: IEEE INFOCOM 2021 - IEEE Conference on Computer Communications. IEEE, 1\u201310","DOI":"10.1109\/INFOCOM42981.2021.9488741"},{"key":"15981_CR93","doi-asserted-by":"crossref","unstructured":"Hao Z, Liu Y, Qin H, et al. 2017 Scale-Aware Face Detection. In: 2017 IEEE Conference on Computer Vision and Pattern Recognition (CVPR). IEEE, 1913\u20131922","DOI":"10.1109\/CVPR.2017.207"},{"issue":"4","key":"15981_CR94","doi-asserted-by":"publisher","first-page":"443","DOI":"10.1177\/0165551517698564","volume":"44","author":"M Hasan","year":"2018","unstructured":"Hasan M, Orgun MA, Schwitter R (2018) A survey on real-time event detection from the Twitter data stream. J Inf Sci 44(4):443\u2013463. https:\/\/doi.org\/10.1177\/0165551517698564","journal-title":"J Inf Sci"},{"issue":"9","key":"15981_CR95","doi-asserted-by":"publisher","first-page":"1904","DOI":"10.1109\/TPAMI.2015.2389824","volume":"37","author":"K He","year":"2015","unstructured":"He K, Zhang X, Ren S, Sun J (2015) Spatial Pyramid Pooling in Deep Convolutional Networks for Visual Recognition. IEEE Trans Pattern Anal Mach Intell 37(9):1904\u20131916. https:\/\/doi.org\/10.1109\/TPAMI.2015.2389824","journal-title":"IEEE Trans Pattern Anal Mach Intell"},{"key":"15981_CR96","doi-asserted-by":"publisher","unstructured":"He K, Zhang X, Ren S and Sun J 2016 Deep residual learning for image recognition. Proc IEEE Comput Soc Conf Comput Vis Pattern Recognit 2016-Decem770\u2013778. https:\/\/doi.org\/10.1109\/CVPR.2016.90","DOI":"10.1109\/CVPR.2016.90"},{"key":"15981_CR97","doi-asserted-by":"crossref","unstructured":"He S, Liang G, Chen F, et al 2018 Object Recognition and 3D Pose Estimation Using Improved VGG16 Deep Neural Network in Cluttered Scenes. In: Proceedings of the International Conference on Information Technology and Electrical Engineering 2018. ACM, New York, NY, USA, pp. 1\u20137","DOI":"10.1145\/3148453.3306266"},{"issue":"2","key":"15981_CR98","doi-asserted-by":"publisher","first-page":"386","DOI":"10.1109\/TPAMI.2018.284","volume":"42","author":"K He","year":"2020","unstructured":"He K, Gkioxari G, Dollar P, Girshick R (2020) Mask R-CNN. IEEE Trans Pattern Anal Mach Intell 42(2):386\u2013397. https:\/\/doi.org\/10.1109\/TPAMI.2018.284","journal-title":"IEEE Trans Pattern Anal Mach Intell"},{"key":"15981_CR99","doi-asserted-by":"publisher","unstructured":"He W, Zhang X-Y, Yin F, et al 2020 Realtime multi-scale scene text detection with scale-based region proposal network. Pattern Recognit 981\u201314. https:\/\/doi.org\/10.1016\/j.patcog.2019.107026","DOI":"10.1016\/j.patcog.2019.107026"},{"issue":"5","key":"15981_CR100","doi-asserted-by":"publisher","first-page":"323","DOI":"10.1049\/iet-its.2019.0409","volume":"14","author":"Z He","year":"2020","unstructured":"He Z, Nan F, Li X et al (2020) Traffic sign recognition by combining global and local features based on semi-supervised classification. IET Intell Transp Syst 14(5):323\u2013330. https:\/\/doi.org\/10.1049\/iet-its.2019.0409","journal-title":"IET Intell Transp Syst"},{"key":"15981_CR101","doi-asserted-by":"crossref","unstructured":"Hechun W and Xiaohong Z 2019 Survey of Deep Learning Based Object Detection. In: Proceedings of the 2nd International Conference on Big Data Technologies - ICBDT2019. ACM Press, New York, New York, USA, pp. 149\u2013153","DOI":"10.1145\/3358528.3358574"},{"key":"15981_CR102","first-page":"30","volume-title":"European Conference on Computer Vision","author":"G Heitz","year":"2008","unstructured":"Heitz G, Koller D (2008) Learning Spatial Context: Using Stuff to Find Things. In: European Conference on Computer Vision. Springer, Berlin, Heidelberg, pp 30\u201343"},{"key":"15981_CR103","first-page":"282","volume":"1","author":"GE Hinton","year":"1986","unstructured":"Hinton GE, Sejnowski TE (1986) Learning and relearning in Boltzmann machines. In Parallel Distributed Processing. Parallel Distrib Process 1:282\u2013317","journal-title":"Parallel Distrib Process"},{"issue":"1","key":"15981_CR104","doi-asserted-by":"publisher","first-page":"129","DOI":"10.1007\/s00779-020-01419-x","volume":"25","author":"HA Hosni Mahmoud","year":"2021","unstructured":"Hosni Mahmoud HA, Mengash HA (2021) A novel technique for automated concealed face detection in surveillance videos. Pers Ubiquit Comput 25(1):129\u2013140. https:\/\/doi.org\/10.1007\/s00779-020-01419-x","journal-title":"Pers Ubiquit Comput"},{"key":"15981_CR105","doi-asserted-by":"crossref","unstructured":"Houben S, Stallkamp J, Salmen J, et al 2013 Detection of traffic signs in real-world images: The German traffic sign detection benchmark. In: The 2013 International Joint Conference on Neural Networks (IJCNN). IEEE, 1\u20138","DOI":"10.1109\/IJCNN.2013.6706807"},{"key":"15981_CR106","doi-asserted-by":"crossref","unstructured":"Hu P and Ramanan D 2017 Finding Tiny Faces. In: 2017 IEEE Conference on Computer Vision and Pattern Recognition (CVPR). IEEE, pp. 1522\u20131530","DOI":"10.1109\/CVPR.2017.166"},{"key":"15981_CR107","doi-asserted-by":"publisher","unstructured":"Hu K, Yang W and Gao X 2017 Microcalcification diagnosis in digital mammography using extreme learning machine based on hidden Markov tree model of dual-tree complex wavelet transform. Expert Syst Appl 86135\u2013144. https:\/\/doi.org\/10.1016\/j.eswa.2017.05.062","DOI":"10.1016\/j.eswa.2017.05.062"},{"key":"15981_CR108","doi-asserted-by":"crossref","unstructured":"Hu Y, Wu X, Zheng G and Liu X 2019 Object Detection of UAV for Anti-UAV Based on Improved YOLO v3. In: 2019 Chinese Control Conference (CCC). IEEE, pp. 8386\u20138390","DOI":"10.23919\/ChiCC.2019.8865525"},{"issue":"8","key":"15981_CR109","doi-asserted-by":"publisher","first-page":"2011","DOI":"10.1109\/TPAMI.2019.2913372","volume":"42","author":"J Hu","year":"2020","unstructured":"Hu J, Shen L, Albanie S et al (2020) Squeeze-and-Excitation Networks. IEEE Trans Pattern Anal Mach Intell 42(8):2011\u20132023. https:\/\/doi.org\/10.1109\/TPAMI.2019.2913372","journal-title":"IEEE Trans Pattern Anal Mach Intell"},{"key":"15981_CR110","doi-asserted-by":"crossref","unstructured":"Hu J, Zhao Y and Zhang X 2020 Application of Transfer Learning in Infrared Pedestrian Detection. In: 2020 IEEE 5th International Conference on Image, Vision and Computing (ICIVC). IEEE, pp. 1\u20134","DOI":"10.1109\/ICIVC50857.2020.9177438"},{"key":"15981_CR111","doi-asserted-by":"publisher","unstructured":"Hua X, Wang X, Rui T, et al 2020 A fast self-attention cascaded network for object detection in large scene remote sensing images. Appl Soft Comput 94106495. https:\/\/doi.org\/10.1016\/j.asoc.2020.106495","DOI":"10.1016\/j.asoc.2020.106495"},{"key":"15981_CR112","doi-asserted-by":"crossref","unstructured":"Huang J, Rathod V, Sun C, et al 2017 Speed\/Accuracy Trade-Offs for Modern Convolutional Object Detectors. In: 2017 IEEE Conference on Computer Vision and Pattern Recognition (CVPR). IEEE, pp. 3296\u20133297","DOI":"10.1109\/CVPR.2017.351"},{"key":"15981_CR113","doi-asserted-by":"publisher","unstructured":"Huang H, Zhou H, Yang X, et al 2019 Faster R-CNN for marine organisms detection and recognition using data augmentation. Neurocomputing 337372\u2013384. https:\/\/doi.org\/10.1016\/j.neucom.2019.01.084","DOI":"10.1016\/j.neucom.2019.01.084"},{"issue":"10","key":"15981_CR114","doi-asserted-by":"publisher","first-page":"2338","DOI":"10.1109\/TMI.2019.2906677","volume":"38","author":"W Huang","year":"2019","unstructured":"Huang W, Luo M, Liu X et al (2019) Arterial Spin Labeling Images Synthesis from sMRI Using Unbalanced Deep Discriminant Learning. IEEE Trans Med Imaging 38(10):2338\u20132351. https:\/\/doi.org\/10.1109\/TMI.2019.2906677","journal-title":"IEEE Trans Med Imaging"},{"key":"15981_CR115","doi-asserted-by":"publisher","unstructured":"Huang Z, Chen K, He J, et al 2019 ICDAR2019 competition on scanned receipt OCR and information extraction. Proc Int Conf Doc Anal Recognition, ICDAR 1516\u20131520. https:\/\/doi.org\/10.1109\/ICDAR.2019.00244","DOI":"10.1109\/ICDAR.2019.00244"},{"key":"15981_CR116","doi-asserted-by":"crossref","unstructured":"Huang Q, Wang D, Dong Z, et al 2021 CoDeNet: Efficient Deployment of Input-Adaptive Object Detection on Embedded FPGAs. In: The 2021 ACM\/SIGDA International Symposium on Field-Programmable Gate Arrays. ACM, New York, NY, USA, pp. 206\u2013216","DOI":"10.1145\/3431920.3439295"},{"key":"15981_CR117","doi-asserted-by":"publisher","unstructured":"Huang Q, Cai Z and Lan T 2021 A Single Neural Network for Mixed Style License Plate Detection and Recognition. IEEE Access 921777\u201321785. https:\/\/doi.org\/10.1109\/ACCESS.2021.3055243","DOI":"10.1109\/ACCESS.2021.3055243"},{"key":"15981_CR118","doi-asserted-by":"crossref","unstructured":"Hung BT 2021 Face Recognition Using Hybrid HOG-CNN Approach. In: International Journal of Image and Graphics. Springer, pp. 715\u2013723","DOI":"10.1007\/978-981-15-7527-3_67"},{"issue":"2","key":"15981_CR119","doi-asserted-by":"publisher","first-page":"116","DOI":"10.1007\/s42979-020-00125-y","volume":"1","author":"GL Hung","year":"2020","unstructured":"Hung GL, Bin SMS, Samma H et al (2020) Faster R-CNN Deep Learning Model for Pedestrian Detection from Drone Images. SN Comput Sci 1(2):116. https:\/\/doi.org\/10.1007\/s42979-020-00125-y","journal-title":"SN Comput Sci"},{"key":"15981_CR120","doi-asserted-by":"crossref","unstructured":"Irbaz MS, Al Nasim MA and Ferdous RE 2022 Real-time Face Recognition System for Remote Employee Tracking. In: Lecture Notes on Data Engineering and Communications Technologies. Springer, 153\u2013163","DOI":"10.1007\/978-981-16-6636-0_13"},{"key":"15981_CR121","doi-asserted-by":"crossref","unstructured":"Iva\u0161i\u0107-Kos M, Kri\u0161to M and Pobar M 2019 Human Detection in Thermal Imaging Using YOLO. In: Proceedings of the 2019 5th International Conference on Computer and Technology Applications. ACM, New York, NY, USA, pp. 20\u201324","DOI":"10.1145\/3323933.3324076"},{"key":"15981_CR122","unstructured":"Jaderberg M, Simonyan K, Vedaldi A and Zisserman A 2014 Synthetic Data and Artificial Neural Networks for Natural Scene Text Recognition, pp. 1\u201310"},{"issue":"5","key":"15981_CR123","doi-asserted-by":"publisher","first-page":"1301","DOI":"10.1007\/s11554-019-00888-5","volume":"17","author":"D Jaiswal","year":"2020","unstructured":"Jaiswal D, Kumar P (2020) Real-time implementation of moving object detection in UAV videos using GPUs. J Real-Time Image Proc 17(5):1301\u20131317. https:\/\/doi.org\/10.1007\/s11554-019-00888-5","journal-title":"J Real-Time Image Proc"},{"issue":"1","key":"15981_CR124","doi-asserted-by":"publisher","first-page":"104","DOI":"10.1016\/j.icte.2020.07.008","volume":"7","author":"Y Jamtsho","year":"2021","unstructured":"Jamtsho Y, Riyamongkol P, Waranusast R (2021) Real-time license plate detection for non-helmeted motorcyclist using YOLO. ICT Express 7(1):104\u2013109. https:\/\/doi.org\/10.1016\/j.icte.2020.07.008","journal-title":"ICT Express"},{"key":"15981_CR125","doi-asserted-by":"crossref","unstructured":"Jani D and Mankodia A 2021 Comprehensive Analysis of Object Detection And Tracking Methodologies From Surveillance Videos. In: 2021 5th International Conference on Computing Methodologies and Communication (ICCMC). IEEE, pp. 963\u2013970","DOI":"10.1109\/ICCMC51019.2021.9418373"},{"issue":"1","key":"15981_CR126","doi-asserted-by":"publisher","first-page":"243","DOI":"10.1080\/21642583.2019.1647576","volume":"7","author":"M Jiafa","year":"2019","unstructured":"Jiafa M, Weifeng W, Yahong H, Weiguo S (2019) A scene recognition algorithm based on deep residual network. Syst Sci Control Eng 7(1):243\u2013251. https:\/\/doi.org\/10.1080\/21642583.2019.1647576","journal-title":"Syst Sci Control Eng"},{"issue":"November","key":"15981_CR127","doi-asserted-by":"publisher","DOI":"10.1016\/j.eswa.2020.114219","volume":"168","author":"M Jian","year":"2021","unstructured":"Jian M, Wang J, Yu H et al (2021) Visual saliency detection by integrating spatial position prior of object with background cues. Expert Syst Appl 168(November):114219. https:\/\/doi.org\/10.1016\/j.eswa.2020.114219","journal-title":"Expert Syst Appl"},{"issue":"3","key":"15981_CR128","doi-asserted-by":"publisher","first-page":"1361","DOI":"10.1109\/TIP.2017.2779856","volume":"27","author":"Z Jiang","year":"2018","unstructured":"Jiang Z, Huynh DQ (2018) Multiple Pedestrian Tracking From Monocular Videos in an Interacting Multiple Model Framework. IEEE Trans Image Process 27(3):1361\u20131375. https:\/\/doi.org\/10.1109\/TIP.2017.2779856","journal-title":"IEEE Trans Image Process"},{"key":"15981_CR129","doi-asserted-by":"crossref","unstructured":"Jiang S, Jin H and Wei F 2013 LS-SVM application for ship course model predictive control. In: 2013 IEEE International Conference on Mechatronics and Automation. IEEE, pp. 1615\u20131619","DOI":"10.1109\/ICMA.2013.6618156"},{"key":"15981_CR130","doi-asserted-by":"publisher","unstructured":"Jiao L, Zhang F, Liu F, et al 2019 A Survey of Deep Learning-Based Object Detection. IEEE Access, pp. 71\u201333. https:\/\/doi.org\/10.1109\/ACCESS.2019.2939201","DOI":"10.1109\/ACCESS.2019.2939201"},{"issue":"April","key":"15981_CR131","doi-asserted-by":"publisher","DOI":"10.1016\/j.compag.2020.105522","volume":"174","author":"L Jiao","year":"2020","unstructured":"Jiao L, Dong S, Zhang S et al (2020) AF-RCNN: An anchor-free convolutional neural network for multi-categories agricultural pest detection. Comput Electron Agric 174(April):105522. https:\/\/doi.org\/10.1016\/j.compag.2020.105522","journal-title":"Comput Electron Agric"},{"issue":"13","key":"15981_CR132","doi-asserted-by":"publisher","first-page":"19377","DOI":"10.1007\/s11042-021-10702-9","volume":"80","author":"J Jin","year":"2021","unstructured":"Jin J, Zhu A, Wang Y, Wright J (2021) A feature binding model in computer vision for object detection. Multimed Tools Appl 80(13):19377\u201319397. https:\/\/doi.org\/10.1007\/s11042-021-10702-9","journal-title":"Multimed Tools Appl"},{"key":"15981_CR133","doi-asserted-by":"publisher","unstructured":"Jin Y, Zhang Y, Cen Y, et al 2021 Pedestrian detection with super-resolution reconstruction for low-quality image. Pattern Recognit 115107846. https:\/\/doi.org\/10.1016\/j.patcog.2021.107846","DOI":"10.1016\/j.patcog.2021.107846"},{"key":"15981_CR134","unstructured":"Jose A, Thodupunoori H and Nair BB 2019 A Novel Traffi 17"},{"key":"15981_CR135","doi-asserted-by":"crossref","unstructured":"Joseph KJ, Khan S, Khan FS and Balasubramanian VN 2021 Towards Open World Object Detection. In: 2021 IEEE\/CVF Conference on Computer Vision and Pattern Recognition (CVPR). IEEE, pp. 5826\u20135836","DOI":"10.1109\/CVPR46437.2021.00577"},{"key":"15981_CR136","doi-asserted-by":"publisher","unstructured":"Kalyanam J, Katsuki T, R.G. Lanckriet G and Mackey TK 2017 Exploring trends of nonmedical use of prescription drugs and polydrug abuse in the Twittersphere using unsupervised machine learning. Addict Behav 65(509): 289\u2013295. https:\/\/doi.org\/10.1016\/j.addbeh.2016.08.019","DOI":"10.1016\/j.addbeh.2016.08.019"},{"key":"15981_CR137","doi-asserted-by":"publisher","unstructured":"Kaplan C, Bulbul A (2021) Goal driven network pruning for object recognition. Pattern Recogn 110(1):1\u201311. https:\/\/doi.org\/10.1016\/j.patcog.2020.107468","DOI":"10.1016\/j.patcog.2020.107468"},{"key":"15981_CR138","doi-asserted-by":"crossref","unstructured":"Karatzas D, Mestre SR, Mas J, et al 2011 ICDAR 2011 Robust Reading Competition - Challenge 1: Reading Text in Born-Digital Images (Web and Email). In: 2011 International Conference on Document Analysis and Recognition. IEEE, pp. 1485\u20131490","DOI":"10.1109\/ICDAR.2011.295"},{"key":"15981_CR139","first-page":"92","volume-title":"In: 3rd International Conference on Innovative Trends in Electronics Engineering","author":"J Kaur","year":"2021","unstructured":"Kaur J, Singh W (2021) An Approach Towards Indian Road Sign Detection System Using Deep Learning. In: In: 3rd International Conference on Innovative Trends in Electronics Engineering. Royal Book Publishing (Partner of Eleyon Publishers), pp 92\u2013101"},{"issue":"27","key":"15981_CR140","doi-asserted-by":"publisher","first-page":"38297","DOI":"10.1007\/s11042-022-13153-y","volume":"81","author":"J Kaur","year":"2022","unstructured":"Kaur J, Singh W (2022) Tools, techniques, datasets and application areas for object detection in an image: a review. Multimed Tools Appl 81(27):38297\u201338351. https:\/\/doi.org\/10.1007\/s11042-022-13153-y","journal-title":"Multimed Tools Appl"},{"key":"15981_CR141","doi-asserted-by":"publisher","unstructured":"Kaur RP, Kumar M and Jindal MK 2022 Performance evaluation of different features and classifiers for Gurumukhi newspaper text recognition. J Ambient Intell Humaniz Comput. https:\/\/doi.org\/10.1007\/s12652-021-03687-8","DOI":"10.1007\/s12652-021-03687-8"},{"issue":"1","key":"15981_CR142","doi-asserted-by":"publisher","first-page":"187","DOI":"10.1109\/TCYB.2016.2628161","volume":"48","author":"A Khan","year":"2018","unstructured":"Khan A, Rinner B, Cavallaro A (2018) Cooperative Robots to Observe Moving Targets: Review. IEEE Trans Cybern 48(1):187\u2013198. https:\/\/doi.org\/10.1109\/TCYB.2016.2628161","journal-title":"IEEE Trans Cybern"},{"issue":"11","key":"15981_CR143","doi-asserted-by":"publisher","first-page":"4193","DOI":"10.1080\/01431161.2018.1562260","volume":"40","author":"E Kilic","year":"2019","unstructured":"Kilic E, Ozturk S (2019) A subclass supported convolutional neural network for object detection and localization in remote-sensing images. Int J Remote Sens 40(11):4193\u20134212. https:\/\/doi.org\/10.1080\/01431161.2018.1562260","journal-title":"Int J Remote Sens"},{"issue":"4","key":"15981_CR144","doi-asserted-by":"publisher","first-page":"958","DOI":"10.1049\/ipr2.12159","volume":"16","author":"Y Kim","year":"2021","unstructured":"Kim Y, Hwang H, Shin J (2021) Robust object detection under harsh autonomous-driving environments. IET Image Process 16(4):958\u2013971. https:\/\/doi.org\/10.1049\/ipr2.12159","journal-title":"IET Image Process"},{"key":"15981_CR145","doi-asserted-by":"crossref","unstructured":"Klare BF, Klein B, Taborsky E, et al 2015 Pushing the frontiers of unconstrained face detection and recognition: IARPA Janus Benchmark A. In: 2015 IEEE Conference on Computer Vision and Pattern Recognition (CVPR). IEEE, pp. 1931\u20131939","DOI":"10.1109\/CVPR.2015.7298803"},{"key":"15981_CR146","doi-asserted-by":"crossref","unstructured":"Kostinger M, Wohlhart P, Roth PM and Bischof H 2011 Annotated Facial Landmarks in the Wild: A large-scale, real-world database for facial landmark localization. In: 2011 IEEE International Conference on Computer Vision Workshops (ICCV Workshops). IEEE, pp. 2144\u20132151","DOI":"10.1109\/ICCVW.2011.6130513"},{"key":"15981_CR147","doi-asserted-by":"publisher","unstructured":"Kousik N, Natarajan Y, Arshath Raja R, et al 2021 Improved salient object detection using hybrid Convolution Recurrent Neural Network. Expert Syst Appl, pp. 1661\u201333. https:\/\/doi.org\/10.1016\/j.eswa.2020.114064","DOI":"10.1016\/j.eswa.2020.114064"},{"issue":"6","key":"15981_CR148","doi-asserted-by":"publisher","first-page":"84","DOI":"10.1145\/3065386","volume":"60","author":"A Krizhevsky","year":"2017","unstructured":"Krizhevsky A, Sutskever I, Hinton GE (2017) ImageNet classification with deep convolutional neural networks. Commun ACM 60(6):84\u201390. https:\/\/doi.org\/10.1145\/3065386","journal-title":"Commun ACM"},{"issue":"2019","key":"15981_CR149","doi-asserted-by":"publisher","first-page":"164","DOI":"10.1016\/j.procs.2020.02.129","volume":"169","author":"S Kulik","year":"2020","unstructured":"Kulik S, Shtanko A (2020) Using convolutional neural networks for recognition of objects varied in appearance in computer vision for intellectual robots. Procedia Comput Sci 169(2019):164\u2013167. https:\/\/doi.org\/10.1016\/j.procs.2020.02.129","journal-title":"Procedia Comput Sci"},{"issue":"2019","key":"15981_CR150","doi-asserted-by":"publisher","first-page":"2610","DOI":"10.1016\/j.procs.2020.04.283","volume":"171","author":"A Kumar","year":"2020","unstructured":"Kumar A, Srivastava S (2020) Object Detection System Based on Convolution Neural Networks Using Single Shot Multi-Box Detector. Procedia Comput Sci 171(2019):2610\u20132617. https:\/\/doi.org\/10.1016\/j.procs.2020.04.283","journal-title":"Procedia Comput Sci"},{"issue":"10","key":"15981_CR151","doi-asserted-by":"publisher","first-page":"14565","DOI":"10.1007\/s11042-020-10457-9","volume":"80","author":"A Kumar","year":"2021","unstructured":"Kumar A, Kumar M, Kaur A (2021) Face detection in still images under occlusion and non-uniform illumination. Multimed Tools Appl 80(10):14565\u201314590. https:\/\/doi.org\/10.1007\/s11042-020-10457-9","journal-title":"Multimed Tools Appl"},{"issue":"7","key":"15981_CR152","doi-asserted-by":"publisher","first-page":"1956","DOI":"10.1007\/s11263-020-01316-z","volume":"128","author":"A Kuznetsova","year":"2020","unstructured":"Kuznetsova A, Rom H, Alldrin N et al (2020) The Open Images Dataset V4. Int J Comput Vis 128(7):1956\u20131981. https:\/\/doi.org\/10.1007\/s11263-020-01316-z","journal-title":"Int J Comput Vis"},{"key":"15981_CR153","doi-asserted-by":"crossref","unstructured":"Kuznetsova A, Maleva T and Soloviev V 2020 Detecting Apples in Orchards Using YOLOv3 and YOLOv5 in General and Close-Up Images. In: Neurocomputing. Springer, pp. 233\u2013243","DOI":"10.1007\/978-3-030-64221-1_20"},{"key":"15981_CR154","unstructured":"Lam D, Kuzma R, McGee K, et al 2018 xView: Objects in Context in Overhead Imagery. arxiv"},{"key":"15981_CR155","doi-asserted-by":"crossref","unstructured":"Lan W, Dang J, Wang Y and Wang S 2018 Pedestrian detection based on yolo network model. In: Proceedings of 2018 IEEE International Conference on Mechatronics and Automation, ICMA 2018. IEEE, pp. 1547\u20131551","DOI":"10.1109\/ICMA.2018.8484698"},{"issue":"4","key":"15981_CR156","doi-asserted-by":"publisher","first-page":"1","DOI":"10.1049\/itr2.12030","volume":"15","author":"R Laroca","year":"2021","unstructured":"Laroca R, Zanlorensi LA, Gon\u00e7alves GR et al (2021) An efficient and layout-independent automatic license plate recognition system based on the YOLO detector. IET Intell Transp Syst 15(4):1\u201321. https:\/\/doi.org\/10.1049\/itr2.12030","journal-title":"IET Intell Transp Syst"},{"issue":"3","key":"15981_CR157","doi-asserted-by":"publisher","first-page":"642","DOI":"10.1007\/s11263-019-01204-1","volume":"128","author":"H Law","year":"2020","unstructured":"Law H, Deng J (2020) CornerNet: Detecting Objects as Paired Keypoints. Int J Comput Vis 128(3):642\u2013656. https:\/\/doi.org\/10.1007\/s11263-019-01204-1","journal-title":"Int J Comput Vis"},{"key":"15981_CR158","doi-asserted-by":"crossref","unstructured":"Lazebnik S, Schmid C and Ponce J 2006 Beyond Bags of Features: Spatial Pyramid Matching for Recognizing Natural Scene Categories. In: 2006 IEEE Computer Society Conference on Computer Vision and Pattern Recognition - Volume 2 (CVPR\u201906). IEEE, 2169\u20132178","DOI":"10.1109\/CVPR.2006.68"},{"key":"15981_CR159","unstructured":"Learned-Miller E and Jain V 2010 FDDB: A Benchmark for Face Detection in Unconstrained Settings"},{"issue":"26\u201327","key":"15981_CR160","doi-asserted-by":"publisher","first-page":"34237","DOI":"10.1007\/s11042-020-09924-0","volume":"80","author":"D-H Lee","year":"2021","unstructured":"Lee D-H (2021) CNN-based single object detection and tracking in videos and its application to drone detection. Multimed Tools Appl 80(26\u201327):34237\u201334248. https:\/\/doi.org\/10.1007\/s11042-020-09924-0","journal-title":"Multimed Tools Appl"},{"issue":"2","key":"15981_CR161","doi-asserted-by":"publisher","first-page":"242","DOI":"10.1002\/rob.21985","volume":"38","author":"FS Leira","year":"2021","unstructured":"Leira FS, Helgesen HH, Johansen TA, Fossen TI (2021) Object detection, recognition, and tracking from UAVs using a thermal camera. J F Robot 38(2):242\u2013267. https:\/\/doi.org\/10.1002\/rob.21985","journal-title":"J F Robot"},{"key":"15981_CR162","doi-asserted-by":"publisher","unstructured":"Leksut JT, Zhao J, Itti L (2020) Learning visual variation for object recognition. Image Vis Comput 98103912. https:\/\/doi.org\/10.1016\/j.imavis.2020.103912","DOI":"10.1016\/j.imavis.2020.103912"},{"key":"15981_CR163","doi-asserted-by":"crossref","unstructured":"Li J, Liang X, Wei Y, et al 2017 Perceptual Generative Adversarial Networks for Small Object Detection. In: 2017 IEEE Conference on Computer Vision and Pattern Recognition (CVPR). IEEE, pp. 1951\u20131959","DOI":"10.1109\/CVPR.2017.211"},{"key":"15981_CR164","doi-asserted-by":"publisher","unstructured":"Li Y, Zhang Y, Huang X and Yuille AL 2018 Deep networks under scene-level supervision for multi-class geospatial object detection from remote sensing images. ISPRS J Photogramm Remote Sens, pp. 1461\u201330. https:\/\/doi.org\/10.1016\/j.isprsjprs.2018.09.014","DOI":"10.1016\/j.isprsjprs.2018.09.014"},{"key":"15981_CR165","doi-asserted-by":"crossref","unstructured":"Li Z, Peng C, Yu G, et al 2018 DetNet: A Backbone network for Object Detection. 1\u201317","DOI":"10.1007\/978-3-030-01240-3_21"},{"key":"15981_CR166","doi-asserted-by":"publisher","first-page":"296","DOI":"10.1016\/j.isprsjprs.2019.11.023","volume":"159","author":"K Li","year":"2019","unstructured":"Li K, Wan G, Cheng G et al (2019) 2020 Object detection in optical remote sensing images: A survey and a new benchmark. ISPRS J Photogramm Remote Sens 159:296\u2013307. https:\/\/doi.org\/10.1016\/j.isprsjprs.2019.11.023","journal-title":"ISPRS J Photogramm Remote Sens"},{"key":"15981_CR167","doi-asserted-by":"crossref","unstructured":"Li Y, Chen Y, Wang N and Zhang Z-X 2019 Scale-Aware Trident Networks for Object Detection. In: 2019 IEEE\/CVF International Conference on Computer Vision (ICCV). IEEE, pp. 6053\u20136062","DOI":"10.1109\/ICCV.2019.00615"},{"key":"15981_CR168","doi-asserted-by":"publisher","unstructured":"Li C, Cong R, Guo C, et al 2020 A parallel down-up fusion network for salient object detection in optical remote sensing images. Neurocomputing, pp. 415411\u2013420. https:\/\/doi.org\/10.1016\/j.neucom.2020.05.108","DOI":"10.1016\/j.neucom.2020.05.108"},{"key":"15981_CR169","doi-asserted-by":"crossref","unstructured":"Li F, Luo Z, Huang J, et al 2020 AlTwo: Vehicle Recognition in Foggy Weather Based on Two-Step Recognition Algorithm. In: Neurocomputing. Springer, pp. 130\u2013141","DOI":"10.1007\/978-3-030-64221-1_12"},{"key":"15981_CR170","doi-asserted-by":"crossref","unstructured":"Li X, Li Y and Li S 2020 Recent Advances of Generic Object Detection with Deep Learning: A Review. In: Need more specific jurnal, pp. 185\u2013193","DOI":"10.1007\/978-981-33-4601-7_19"},{"issue":"19","key":"15981_CR171","doi-asserted-by":"publisher","first-page":"7343","DOI":"10.1080\/01431161.2020.1757782","volume":"41","author":"X Li","year":"2020","unstructured":"Li X, Luo M, Ji S et al (2020) Evaluating generative adversarial networks based image-level domain transfer for multi-source remote sensing image segmentation and object detection. Int J Remote Sens 41(19):7343\u20137367. https:\/\/doi.org\/10.1080\/01431161.2020.1757782","journal-title":"Int J Remote Sens"},{"issue":"6","key":"15981_CR172","doi-asserted-by":"publisher","first-page":"1747","DOI":"10.1016\/j.cja.2020.02.024","volume":"33","author":"Y Li","year":"2020","unstructured":"Li Y, Dong H, Li H et al (2020) Multi-block SSD based on small object detection for UAV railway scene surveillance. Chin J Aeronaut 33(6):1747\u20131755. https:\/\/doi.org\/10.1016\/j.cja.2020.02.024","journal-title":"Chin J Aeronaut"},{"issue":"3","key":"15981_CR173","doi-asserted-by":"publisher","first-page":"145","DOI":"10.1016\/j.cja.2020.09.022","volume":"34","author":"B Li","year":"2021","unstructured":"Li B, Xie X, Wei X, Tang W (2021) Ship detection and classification from optical remote sensing images: A survey. Chin J Aeronaut 34(3):145\u2013163. https:\/\/doi.org\/10.1016\/j.cja.2020.09.022","journal-title":"Chin J Aeronaut"},{"issue":"9","key":"15981_CR174","doi-asserted-by":"publisher","first-page":"1998","DOI":"10.1049\/ipr2.12171","volume":"15","author":"G Li","year":"2021","unstructured":"Li G, Huang X, Ai J et al (2021) Lemon-YOLO: An efficient object detection method for lemons in the natural environment. IET Image Process 15(9):1998\u20132009. https:\/\/doi.org\/10.1049\/ipr2.12171","journal-title":"IET Image Process"},{"key":"15981_CR175","unstructured":"Li C, Li L, Jiang H, et al 2022 YOLOv6: A Single-Stage Object Detection Framework for Industrial Applications. arXiv"},{"issue":"12","key":"15981_CR176","doi-asserted-by":"publisher","first-page":"6999","DOI":"10.1109\/TNNLS.2021.3084827","volume":"33","author":"Z Li","year":"2022","unstructured":"Li Z, Liu F, Yang W et al (2022) A Survey of Convolutional Neural Networks: Analysis, Applications, and Prospects. IEEE Trans Neural Networks Learn Syst 33(12):6999\u20137019. https:\/\/doi.org\/10.1109\/TNNLS.2021.3084827","journal-title":"IEEE Trans Neural Networks Learn Syst"},{"issue":"11","key":"15981_CR177","doi-asserted-by":"publisher","first-page":"3484","DOI":"10.1109\/TNNLS.2019.2892409","volume":"30","author":"F Liao","year":"2019","unstructured":"Liao F, Liang M, Li Z et al (2019) Evaluate the Malignancy of Pulmonary Nodules Using the 3-D Deep Leaky Noisy-OR Network. IEEE Trans Neural Networks Learn Syst 30(11):3484\u20133495. https:\/\/doi.org\/10.1109\/TNNLS.2019.2892409","journal-title":"IEEE Trans Neural Networks Learn Syst"},{"issue":"1","key":"15981_CR178","doi-asserted-by":"publisher","first-page":"2","DOI":"10.1007\/s44196-021-00056-3","volume":"15","author":"J Liao","year":"2022","unstructured":"Liao J, Liu Y, Piao Y et al (2022) GLE-Net: A Global and Local Ensemble Network for Aerial Object Detection. Int J Comput Intell Syst 15(1):2. https:\/\/doi.org\/10.1007\/s44196-021-00056-3","journal-title":"Int J Comput Intell Syst"},{"key":"15981_CR179","doi-asserted-by":"publisher","unstructured":"Lin TY, Maire M, Belongie S et al (2014) Microsoft COCO: Common objects in context. Lect Notes Comput Sci (including Subser Lect Notes Artif Intell Lect Notes Bioinformatics) 8693 LNCS (PART 5): 740\u2013755. https:\/\/doi.org\/10.1007\/978-3-319-10602-1_48","DOI":"10.1007\/978-3-319-10602-1_48"},{"key":"15981_CR180","doi-asserted-by":"crossref","unstructured":"Lin T-Y, Dollar P, Girshick R, et al 2017 Feature Pyramid Networks for Object Detection. In: 2017 IEEE Conference on Computer Vision and Pattern Recognition (CVPR). IEEE, pp. 936\u2013944","DOI":"10.1109\/CVPR.2017.106"},{"key":"15981_CR181","doi-asserted-by":"crossref","unstructured":"Lin T-Y, Goyal P, Girshick R, et al 2017 Focal Loss for Dense Object Detection. In: 2017 IEEE International Conference on Computer Vision (ICCV). IEEE, pp. 2999\u20133007","DOI":"10.1109\/ICCV.2017.324"},{"key":"15981_CR182","doi-asserted-by":"publisher","first-page":"42","DOI":"10.1145\/3342999.3343013","volume":"22","author":"M Lin","year":"2019","unstructured":"Lin M, Chen C, Lai C (2019) Object detection algorithm based AdaBoost residual correction Fast R-CNN on network. ACM Int Conf Proc Ser 22:42\u201346. https:\/\/doi.org\/10.1145\/3342999.3343013","journal-title":"ACM Int Conf Proc Ser"},{"issue":"October","key":"15981_CR183","doi-asserted-by":"publisher","first-page":"60","DOI":"10.1016\/j.media.2017.07.005","volume":"42","author":"G Litjens","year":"2017","unstructured":"Litjens G, Kooi T, Bejnordi BE et al (2017) A survey on deep learning in medical image analysis. Med Image Anal 42(October):60\u201388. https:\/\/doi.org\/10.1016\/j.media.2017.07.005","journal-title":"Med Image Anal"},{"issue":"9","key":"15981_CR184","doi-asserted-by":"publisher","first-page":"1938","DOI":"10.1109\/LGRS.2015.2439517","volume":"12","author":"K Liu","year":"2015","unstructured":"Liu K, Mattyus G (2015) Fast Multiclass Vehicle Detection on Aerial Images. IEEE Geosci Remote Sens Lett 12(9):1938\u20131942. https:\/\/doi.org\/10.1109\/LGRS.2015.2439517","journal-title":"IEEE Geosci Remote Sens Lett"},{"key":"15981_CR185","first-page":"21","volume-title":"European conference on computer vision","author":"W Liu","year":"2016","unstructured":"Liu W, Anguelov D, Erhan D et al (2016) SSD: Single Shot MultiBox Detector. In: European conference on computer vision. Springer, pp 21\u201337"},{"issue":"8","key":"15981_CR186","doi-asserted-by":"publisher","first-page":"1074","DOI":"10.1109\/LGRS.2016.2565705","volume":"13","author":"Z Liu","year":"2016","unstructured":"Liu Z, Wang H, Weng L, Yang Y (2016) Ship Rotated Bounding Box Space for Ship Extraction From High-Resolution Optical Satellite Images With Complex Backgrounds. IEEE Geosci Remote Sens Lett 13(8):1074\u20131078. https:\/\/doi.org\/10.1109\/LGRS.2016.2565705","journal-title":"IEEE Geosci Remote Sens Lett"},{"key":"15981_CR187","doi-asserted-by":"publisher","first-page":"2448","DOI":"10.1109\/ICCV.2017.266","volume-title":"In: 2017 IEEE International Conference on Computer Vision (ICCV)","author":"Z Liu","year":"2017","unstructured":"Liu Z, Wang D, Lu H (2017) Stepwise Metric Promotion for Unsupervised Video Person Re-identification. In: In: 2017 IEEE International Conference on Computer Vision (ICCV). IEEE, pp 2448\u20132457"},{"key":"15981_CR188","doi-asserted-by":"publisher","unstructured":"Liu Y, Jin L, Zhang S et al (2019) Curved scene text detection via transverse and longitudinal sequence connection. Pattern Recogn 90337\u2013345. https:\/\/doi.org\/10.1016\/j.patcog.2019.02.002","DOI":"10.1016\/j.patcog.2019.02.002"},{"key":"15981_CR189","doi-asserted-by":"publisher","unstructured":"Liu D, Cui Y, Chen Y, et al 2020 Video object detection for autonomous driving: Motion-aid feature calibration. Neurocomputing 4091\u201311. https:\/\/doi.org\/10.1016\/j.neucom.2020.05.027","DOI":"10.1016\/j.neucom.2020.05.027"},{"issue":"2","key":"15981_CR190","doi-asserted-by":"publisher","first-page":"261","DOI":"10.1007\/s11263-019-01247-4","volume":"128","author":"L Liu","year":"2020","unstructured":"Liu L, Ouyang W, Wang X et al (2020) Deep Learning for Generic Object Detection: A Survey. Int J Comput Vis 128(2):261\u2013318. https:\/\/doi.org\/10.1007\/s11263-019-01247-4","journal-title":"Int J Comput Vis"},{"key":"15981_CR191","doi-asserted-by":"publisher","unstructured":"Liu Y, Duanmu M, Huo Z, et al 2021 Exploring multi-scale deformable context and channel-wise attention for salient object detection. Neurocomputing 42892\u2013103. https:\/\/doi.org\/10.1016\/j.neucom.2020.11.022","DOI":"10.1016\/j.neucom.2020.11.022"},{"key":"15981_CR192","doi-asserted-by":"publisher","unstructured":"Liu JJ, Hou Q, Liu ZA, Cheng MM (2022) PoolNet+: Exploring the Potential of Pooling for Salient Object Detection.\u00a0IEEE Trans Pattern Anal Mach Intell\u00a045(1):1\u201318. https:\/\/doi.org\/10.1109\/TPAMI.2021.3140168","DOI":"10.1109\/TPAMI.2021.3140168"},{"issue":"1","key":"15981_CR193","doi-asserted-by":"publisher","first-page":"270","DOI":"10.1080\/01431161.2021.2018146","volume":"43","author":"Y Liu","year":"2022","unstructured":"Liu Y, Liu J, Ning X, Li J (2022) MS-CNN: multiscale recognition of building rooftops from high spatial resolution remote sensing imagery. Int J Remote Sens 43(1):270\u2013298. https:\/\/doi.org\/10.1080\/01431161.2021.2018146","journal-title":"Int J Remote Sens"},{"key":"15981_CR194","doi-asserted-by":"publisher","unstructured":"Loey M, Manogaran G, Taha MHN and Khalifa NEM 2021 Fighting against COVID-19: A novel deep learning model based on YOLO-v2 with ResNet-50 for medical face mask detection. Sustain Cities Soc 65102600. https:\/\/doi.org\/10.1016\/j.scs.2020.102600","DOI":"10.1016\/j.scs.2020.102600"},{"issue":"3","key":"15981_CR195","doi-asserted-by":"publisher","first-page":"253","DOI":"10.1007\/s41095-018-0116-x","volume":"4","author":"Y Lu","year":"2018","unstructured":"Lu Y, Lu J, Zhang S, Hall P (2018) Traffic signal detection and classification in street views using an attention model. Comput Vis Media 4(3):253\u2013266. https:\/\/doi.org\/10.1007\/s41095-018-0116-x","journal-title":"Comput Vis Media"},{"key":"15981_CR196","doi-asserted-by":"publisher","unstructured":"Lu S, Wang B, Wang H, et al. 2019 A real-time object detection algorithm for video. Comput Electr Eng 77398\u2013408. https:\/\/doi.org\/10.1016\/j.compeleceng.2019.05.009","DOI":"10.1016\/j.compeleceng.2019.05.009"},{"key":"15981_CR197","doi-asserted-by":"crossref","unstructured":"Lu W, Zhou Y, Wan G, et al. 2019 L3-Net: Towards Learning Based LiDAR Localization for Autonomous Driving. In: 2019 IEEE\/CVF Conference on Computer Vision and Pattern Recognition (CVPR). IEEE, 6382\u20136391","DOI":"10.1109\/CVPR.2019.00655"},{"key":"15981_CR198","doi-asserted-by":"publisher","unstructured":"Lu X, Ji J, Xing Z, Miao Q (2021) Attention and feature fusion SSD for remote sensing object detection. IEEE Trans Instrum Meas 70. https:\/\/doi.org\/10.1109\/TIM.2021.3052575","DOI":"10.1109\/TIM.2021.3052575"},{"key":"15981_CR199","doi-asserted-by":"crossref","unstructured":"Lucas SM 2005 ICDAR 2005 text locating competition results. In: Eighth International Conference on Document Analysis and Recognition (ICDAR\u201905). IEEE, pp. 80\u201384 Vol. 1","DOI":"10.1109\/ICDAR.2005.231"},{"key":"15981_CR200","doi-asserted-by":"crossref","unstructured":"Lucas SM, Panaretos A, Sosa L, et al 2003 ICDAR 2003 robust reading competitions. In: Seventh International Conference on Document Analysis and Recognition, 2003. Proceedings. IEEE, pp. 682\u2013687","DOI":"10.1109\/ICDAR.2003.1227749"},{"issue":"6","key":"15981_CR201","doi-asserted-by":"publisher","first-page":"1011","DOI":"10.1049\/iet-its.2018.5489","volume":"13","author":"X Luo","year":"2019","unstructured":"Luo X, Zhu J, Yu Q (2019) Efficient convNets for fast traffic sign recognition. IET Intell Transp Syst 13(6):1011\u20131015. https:\/\/doi.org\/10.1049\/iet-its.2018.5489","journal-title":"IET Intell Transp Syst"},{"key":"15981_CR202","doi-asserted-by":"publisher","unstructured":"Lv X, Su M and Wang Z 2021 Application of Face Recognition Method Under Deep Learning Algorithm in Embedded Systems. Microprocess Microsyst 104034. https:\/\/doi.org\/10.1016\/j.micpro.2021.104034","DOI":"10.1016\/j.micpro.2021.104034"},{"key":"15981_CR203","doi-asserted-by":"publisher","unstructured":"Ma W, Wu Y, Cen F, Wang G (2020) MDFN: Multi-scale deep feature learning network for object detection. Pattern Recognit 100:107149.\u00a0https:\/\/doi.org\/10.1016\/j.patcog.2019.107149","DOI":"10.1016\/j.patcog.2019.107149"},{"key":"15981_CR204","doi-asserted-by":"publisher","unstructured":"Ma C, Sun L, Zhong Z and Huo Q 2021 ReLaText: Exploiting visual relationships for arbitrary-shaped scene text detection with graph convolutional networks. Pattern Recognit 111:107684. https:\/\/doi.org\/10.1016\/j.patcog.2020.107684","DOI":"10.1016\/j.patcog.2020.107684"},{"key":"15981_CR205","doi-asserted-by":"publisher","unstructured":"Ma J, Liang M, Chen S-L, et al 2022 Depth-Guided Progressive Network for Object Detection. IEEE Trans Intell Transp Syst 1\u201311. https:\/\/doi.org\/10.1109\/TITS.2022.3156365","DOI":"10.1109\/TITS.2022.3156365"},{"issue":"1","key":"15981_CR206","doi-asserted-by":"publisher","first-page":"1","DOI":"10.1111\/mice.12561","volume":"36","author":"H Maeda","year":"2021","unstructured":"Maeda H, Kashiyama T, Sekimoto Y et al (2021) Generative adversarial network for road damage detection. Comput Civ Infrastruct Eng 36(1):1\u201314. https:\/\/doi.org\/10.1111\/mice.12561","journal-title":"Comput Civ Infrastruct Eng"},{"key":"15981_CR207","doi-asserted-by":"crossref","unstructured":"Majumdar P, Agarwal A, Singh R and Vatsa M 2019 Evading Face Recognition via Partial Tampering of Faces. In: 2019 IEEE\/CVF Conference on Computer Vision and Pattern Recognition Workshops (CVPRW). IEEE, 11\u201320","DOI":"10.1109\/CVPRW.2019.00008"},{"key":"15981_CR208","first-page":"1","volume-title":"Lecture Notes in Networks and Systems","author":"KL Masita","year":"2022","unstructured":"Masita KL, Hasan AN, Shongwe T (2022) Refining the Efficiency of R-CNN in Pedestrian Detection. In: Lecture Notes in Networks and Systems. Springer, pp 1\u201314"},{"key":"15981_CR209","doi-asserted-by":"publisher","first-page":"158","DOI":"10.1109\/ICB2018.2018.00033","volume-title":"In: 2018 International Conference on Biometrics (ICB)","author":"B Maze","year":"2018","unstructured":"Maze B, Adams J, Duncan JA et al (2018) IARPA Janus Benchmark - C: Face Dataset and Protocol. In: In: 2018 International Conference on Biometrics (ICB). IEEE, pp 158\u2013165"},{"key":"15981_CR210","first-page":"760","volume-title":"In: 2021 5th International Conference on Trends in Electronics and Informatics (ICOEI)","author":"FMJ Mehedi Shamrat","year":"2021","unstructured":"Mehedi Shamrat FMJ, Al JM, Billah MM et al (2021) A Deep Learning Approach for Face Detection using Max Pooling. In: In: 2021 5th International Conference on Trends in Electronics and Informatics (ICOEI). IEEE, pp 760\u2013764"},{"key":"15981_CR211","first-page":"1","volume":"127","author":"A Mishra","year":"2012","unstructured":"Mishra A, Alahari K, Jawahar C (2012) Scene Text Recognition using Higher Order Language Priors. In: Procedings of the British Machine Vision Conference 2012. British Mach Vision Assoc 127:1\u2013127.11","journal-title":"British Mach Vision Assoc"},{"key":"15981_CR212","doi-asserted-by":"publisher","first-page":"2886","DOI":"10.1109\/ICCV48922.2021.00290","volume-title":"In: 2021 IEEE\/CVF International Conference on Computer Vision (ICCV)","author":"I Misra","year":"2021","unstructured":"Misra I, Girdhar R, Joulin A (2021) An End-to-End Transformer Model for 3D Object Detection. In: In: 2021 IEEE\/CVF International Conference on Computer Vision (ICCV). IEEE, pp 2886\u20132897"},{"key":"15981_CR213","doi-asserted-by":"crossref","unstructured":"Mittal U, Srivastava S and Chawla P 2019 Review of different techniques for object detection using deep learning. In: Proceedings of the Third International Conference on Advanced Informatics for Computing Research - ICAICR \u201819. ACM Press, New York, New York, USA, pp. 1\u20138","DOI":"10.1145\/3339311.3339357"},{"key":"15981_CR214","doi-asserted-by":"publisher","unstructured":"Mittal P, Singh R and Sharma A 2020 Deep learning-based object detection in low-altitude UAV datasets: A survey. Image Vis Comput 104:104046. https:\/\/doi.org\/10.1016\/j.imavis.2020.104046","DOI":"10.1016\/j.imavis.2020.104046"},{"issue":"4","key":"15981_CR215","doi-asserted-by":"publisher","first-page":"1484","DOI":"10.1109\/TITS.2012.2209421","volume":"13","author":"A Mogelmose","year":"2012","unstructured":"Mogelmose A, Trivedi MM, Moeslund TB (2012) Vision-Based Traffic Sign Detection and Analysis for Intelligent Driver Assistance Systems: Perspectives and Survey. IEEE Trans Intell Transp Syst 13(4):1484\u20131497. https:\/\/doi.org\/10.1109\/TITS.2012.2209421","journal-title":"IEEE Trans Intell Transp Syst"},{"key":"15981_CR216","doi-asserted-by":"crossref","unstructured":"Murdock M, Reid S, Hamilton B and Reese J 2015 ICDAR 2015 competition on text line detection in historical documents. In: 2015 13th International Conference on Document Analysis and Recognition (ICDAR). IEEE, pp. 1171\u20131175","DOI":"10.1109\/ICDAR.2015.7333945"},{"key":"15981_CR217","doi-asserted-by":"crossref","unstructured":"Nada H, Sindagi VA, Zhang H and Patel VM 2018 Pushing the Limits of Unconstrained Face Detection: a Challenge Dataset and Baseline Results. In: 2018 IEEE 9th International Conference on Biometrics Theory, Applications and Systems (BTAS). IEEE, pp. 1\u201310","DOI":"10.1109\/BTAS.2018.8698561"},{"key":"15981_CR218","doi-asserted-by":"publisher","DOI":"10.1016\/j.eswa.2020.114549","volume":"170","author":"F Naiemi","year":"2020","unstructured":"Naiemi F (2020) Ghods V and Khalesi H 2021 A novel pipeline framework for multi oriented scene text image detection and recognition. Expert Syst Appl 170:114549. https:\/\/doi.org\/10.1016\/j.eswa.2020.114549","journal-title":"Expert Syst Appl"},{"key":"15981_CR219","doi-asserted-by":"crossref","unstructured":"Najibi M, Samangouei P, Chellappa R and Davis LS 2017 SSH: Single Stage Headless Face Detector. In: Proceedings of the IEEE International Conference on Computer Vision. IEEE, 4885\u20134894","DOI":"10.1109\/ICCV.2017.522"},{"issue":"10","key":"15981_CR220","doi-asserted-by":"publisher","first-page":"1396","DOI":"10.1049\/iet-its.2018.5171","volume":"12","author":"S Natarajan","year":"2018","unstructured":"Natarajan S, Annamraju AK, Baradkar CS (2018) Traffic sign recognition using weighted multi-convolutional neural network. IET Intell Transp Syst 12(10):1396\u20131405. https:\/\/doi.org\/10.1049\/iet-its.2018.5171","journal-title":"IET Intell Transp Syst"},{"key":"15981_CR221","doi-asserted-by":"publisher","first-page":"691","DOI":"10.1007\/978-3-030-20887-5_43","volume-title":"Computer Vision \u2013 ACCV 2018","author":"L Neumann","year":"2019","unstructured":"Neumann L, Karg M, Zhang S et al (2019) NightOwls: A Pedestrians at Night Dataset. In: Li H, Mori G, Schindler K (eds) Computer Vision \u2013 ACCV 2018. Springer International Publishing, pp 691\u2013705"},{"key":"15981_CR222","doi-asserted-by":"publisher","unstructured":"Nguyen DT, Li W and Ogunbona PO 2016 Human detection from images and videos: A survey. Pattern Recognit 51148\u2013175. https:\/\/doi.org\/10.1016\/j.patcog.2015.08.027","DOI":"10.1016\/j.patcog.2015.08.027"},{"issue":"1","key":"15981_CR223","doi-asserted-by":"publisher","first-page":"11","DOI":"10.1109\/jpets.2018.2881429","volume":"6","author":"VN Nguyen","year":"2019","unstructured":"Nguyen VN, Jenssen R, Roverso D (2019) Intelligent Monitoring and Inspection of Power Line Components Powered by UAVs and Deep Learning. IEEE Power Energy Technol Syst J 6(1):11\u201321. https:\/\/doi.org\/10.1109\/jpets.2018.2881429","journal-title":"IEEE Power Energy Technol Syst J"},{"key":"15981_CR224","doi-asserted-by":"crossref","unstructured":"Nie GY, Cheng MM, Liu Y, et al 2019 Multi-level context ultra-aggregation for stereo matching. In: Proceedings of the IEEE Computer Society Conference on Computer Vision and Pattern Recognition. IEEE, 3278\u20133286","DOI":"10.1109\/CVPR.2019.00340"},{"issue":"10","key":"15981_CR225","doi-asserted-by":"publisher","first-page":"35","DOI":"10.1002\/ecj.12268","volume":"103","author":"R Ogura","year":"2020","unstructured":"Ogura R, Nagasaki T, Matsubara H (2020) Improving the visibility of nighttime images for pedestrian recognition using in-vehicle camera. Electron Commun Japan 103(10):35\u201343. https:\/\/doi.org\/10.1002\/ecj.12268","journal-title":"Electron Commun Japan"},{"key":"15981_CR226","doi-asserted-by":"publisher","unstructured":"Oksuz K, Cam BC, Kalkan S and Akbas E 2019 Imbalance problems in object detection: A review. arXiv 8828(c):. https:\/\/doi.org\/10.1109\/tpami.2020.2981890","DOI":"10.1109\/tpami.2020.2981890"},{"issue":"3s","key":"15981_CR227","doi-asserted-by":"publisher","first-page":"1","DOI":"10.1145\/3092831","volume":"13","author":"K Ota","year":"2017","unstructured":"Ota K, Dao MS, Mezaris V, De Natale FGB (2017) Deep learning for mobile multimedia: A survey. ACM Trans Multimed Comput Commun Appl 13(3s):1\u201322. https:\/\/doi.org\/10.1145\/3092831","journal-title":"ACM Trans Multimed Comput Commun Appl"},{"key":"15981_CR228","doi-asserted-by":"crossref","unstructured":"Ouyang W, Wang X, Zeng X, et al 2015 DeepID-Net: Deformable deep convolutional neural networks for object detection. In: 2015 IEEE Conference on Computer Vision and Pattern Recognition (CVPR). IEEE, 2403\u20132412","DOI":"10.1109\/CVPR.2015.7298854"},{"key":"15981_CR229","doi-asserted-by":"crossref","unstructured":"Padilla R, Netto SL and da Silva EABB 2020 A Survey on Performance Metrics for Object-Detection Algorithms. In: 2020 International Conference on Systems, Signals and Image Processing (IWSSIP). IEEE, 237\u2013242","DOI":"10.1109\/IWSSIP48289.2020.9145130"},{"key":"15981_CR230","doi-asserted-by":"publisher","unstructured":"Pang Y, Cao J, Li Y, et al 2021 TJU-DHD: A Diverse High-Resolution Dataset for Object Detection. IEEE Trans Image Process 30207\u2013219. https:\/\/doi.org\/10.1109\/TIP.2020.3034487","DOI":"10.1109\/TIP.2020.3034487"},{"issue":"1","key":"15981_CR231","doi-asserted-by":"publisher","first-page":"15","DOI":"10.1023\/A:1008162616689","volume":"38","author":"C Papageorgiou","year":"2000","unstructured":"Papageorgiou C, Poggio T (2000) Trainable system for object detection. Int J Comput Vis 38(1):15\u201333. https:\/\/doi.org\/10.1023\/A:1008162616689","journal-title":"Int J Comput Vis"},{"issue":"June","key":"15981_CR232","doi-asserted-by":"publisher","first-page":"1706","DOI":"10.1016\/j.procs.2018.05.144","volume":"132","author":"AR Pathak","year":"2018","unstructured":"Pathak AR, Pandey M, Rautaray S (2018) Application of Deep Learning for Object Detection. Procedia Comput Sci 132(June):1706\u20131717. https:\/\/doi.org\/10.1016\/j.procs.2018.05.144","journal-title":"Procedia Comput Sci"},{"issue":"2","key":"15981_CR233","first-page":"194","volume":"4","author":"S Paul","year":"1986","unstructured":"Paul S (1986) Information processing in dynamical systems: foundations of harmony theory. J Japan Soc Fuzzy Theory Syst 4(2):194\u2013281","journal-title":"J Japan Soc Fuzzy Theory Syst"},{"key":"15981_CR234","doi-asserted-by":"publisher","unstructured":"P\u00e9rez-Hern\u00e1ndez F, Tabik S, Lamas A, et al 2020 Object Detection Binary Classifiers methodology based on deep learning to identify small objects handled similarly: Application in video surveillance. Knowledge-Based Syst 1941\u201310. https:\/\/doi.org\/10.1016\/j.knosys.2020.105590","DOI":"10.1016\/j.knosys.2020.105590"},{"key":"15981_CR235","doi-asserted-by":"crossref","unstructured":"Perronnin F, S\u00e1nchez J and Mensink T 2010 Improving the Fisher Kernel for Large-Scale Image Classification. In: Journal of AOAC INTERNATIONAL. Springer, pp. 143\u2013156","DOI":"10.1007\/978-3-642-15561-1_11"},{"issue":"21","key":"15981_CR236","doi-asserted-by":"publisher","first-page":"4500","DOI":"10.3390\/app9214500","volume":"9","author":"Phung and Rhee","year":"2019","unstructured":"Phung and Rhee (2019) A High-Accuracy Model Average Ensemble of Convolutional Neural Networks for Classification of Cloud Image Patches on Small Datasets. Appl Sci 9(21):4500. https:\/\/doi.org\/10.3390\/app9214500","journal-title":"Appl Sci"},{"issue":"5","key":"15981_CR237","doi-asserted-by":"publisher","first-page":"1","DOI":"10.1145\/3234150","volume":"51","author":"S Pouyanfar","year":"2019","unstructured":"Pouyanfar S, Sadiq S, Yan Y et al (2019) A Survey on Deep learning: Algorithmm Techniques and Applications. ACM Comput Surv 51(5):1\u201336. https:\/\/doi.org\/10.1145\/3234150","journal-title":"ACM Comput Surv"},{"key":"15981_CR238","first-page":"193","volume-title":"ACM International Conference Proceeding Series","author":"Q Qi","year":"2018","unstructured":"Qi Q, Tan W, Zhang K, Huang M (2018) Object detection with multi-RCNN detectors. In: ACM International Conference Proceeding Series. ACM, New York, NY, USA, pp 193\u2013197"},{"key":"15981_CR239","doi-asserted-by":"publisher","unstructured":"Qin S and Liu S 2021 Towards end-to-end car license plate location and recognition in unconstrained scenarios. Neural Comput Appl 1\u201311. https:\/\/doi.org\/10.1007\/s00521-021-06147-8","DOI":"10.1007\/s00521-021-06147-8"},{"issue":"5","key":"15981_CR240","doi-asserted-by":"publisher","first-page":"869","DOI":"10.1049\/gtd2.12333","volume":"16","author":"Z Qiu","year":"2021","unstructured":"Qiu Z, Zhu X, Liao C et al (2021) Detection of bird species related to transmission line faults based on lightweight convolutional neural network. IET Gener Transm Distrib 16(5):869\u2013881. https:\/\/doi.org\/10.1049\/gtd2.12333","journal-title":"IET Gener Transm Distrib"},{"issue":"8","key":"15981_CR241","doi-asserted-by":"publisher","first-page":"2947","DOI":"10.1109\/TIP.2019.2955239","volume":"29","author":"MM Rahman","year":"2020","unstructured":"Rahman MM, Tan Y, Xue J, Lu K (2020) Recent Advances in 3D Object Detection in the Era of Deep Neural Networks: A Survey. IEEE Trans Image Process 29(8):2947\u20132962. https:\/\/doi.org\/10.1109\/TIP.2019.2955239","journal-title":"IEEE Trans Image Process"},{"key":"15981_CR242","first-page":"581","volume-title":"Advances in Intelligent Systems and Computing","author":"MM Rahman","year":"2021","unstructured":"Rahman MM, Al MS, Kaiser MS et al (2021) Cascade Classification of Face Liveliness Detection Using Heart Beat Measurement. In: Advances in Intelligent Systems and Computing. Springer, pp 581\u2013590"},{"issue":"6","key":"15981_CR243","doi-asserted-by":"publisher","first-page":"462","DOI":"10.18196\/jrc.26123","volume":"2","author":"W Rahmaniar","year":"2021","unstructured":"Rahmaniar W, Hernawan A (2021) Real-Time Human Detection Using Deep Learning on Embedded Platforms: A Review | Rahmaniar |. J Robot Control (JRC) J Robot Cont 2(6):462\u2013468. https:\/\/doi.org\/10.18196\/jrc.26123","journal-title":"J Robot Control (JRC) J Robot Cont"},{"key":"15981_CR244","doi-asserted-by":"publisher","unstructured":"Ramzi M, Larbi G and Lyamine G 2019 Road obstacle detection. ACM Int Conf Proceeding Ser. https:\/\/doi.org\/10.1145\/3341325.3341999","DOI":"10.1145\/3341325.3341999"},{"key":"15981_CR245","doi-asserted-by":"crossref","unstructured":"Ravishankar V, Vinod V, Kumar T and Bhalla K 2022 Sensor Integration and Facial Recognition Deployment in a Smart Home System. Springer, 759\u2013771","DOI":"10.1007\/978-981-16-6407-6_65"},{"key":"15981_CR246","doi-asserted-by":"publisher","unstructured":"Razakarivony S and Jurie F 2016 Vehicle detection in aerial imagery: A small target detection benchmark. J Vis Commun Image Represent 34187\u2013203. https:\/\/doi.org\/10.1016\/j.jvcir.2015.11.002","DOI":"10.1016\/j.jvcir.2015.11.002"},{"key":"15981_CR247","doi-asserted-by":"crossref","unstructured":"Redmon J and Farhadi A 2017 YOLO9000: Better, Faster, Stronger. In: 2017 IEEE Conference on Computer Vision and Pattern Recognition (CVPR). IEEE, pp. 6517\u20136525","DOI":"10.1109\/CVPR.2017.690"},{"key":"15981_CR248","unstructured":"Redmon J and Farhadi A 2018 YOLOv3: An Incremental Improvement. Comput Vis Pattern Recognit 1\u20136"},{"key":"15981_CR249","doi-asserted-by":"crossref","unstructured":"Redmon J, Divvala S, Girshick R and Farhadi A 2016 You Only Look Once: Unified, Real-Time Object Detection. In: 2016 IEEE Conference on Computer Vision and Pattern Recognition (CVPR). IEEE, 779\u2013788","DOI":"10.1109\/CVPR.2016.91"},{"issue":"March","key":"15981_CR250","doi-asserted-by":"publisher","DOI":"10.1016\/j.mehy.2020.109705","volume":"141","author":"ZU Rehman","year":"2020","unstructured":"Rehman ZU, Zia MS, Bojja GR et al (2020) Texture based localization of a brain tumor from MR-images by using a machine learning approach. Med Hypotheses 141(March):109705. https:\/\/doi.org\/10.1016\/j.mehy.2020.109705","journal-title":"Med Hypotheses"},{"issue":"6","key":"15981_CR251","doi-asserted-by":"publisher","first-page":"1137","DOI":"10.1109\/TPAMI.2016.2577031","volume":"39","author":"S Ren","year":"2017","unstructured":"Ren S, He K, Girshick R, Sun J (2017) Faster R-CNN: Towards Real-Time Object Detection with Region Proposal Networks. IEEE Trans Pattern Anal Mach Intell 39(6):1137\u20131149. https:\/\/doi.org\/10.1109\/TPAMI.2016.2577031","journal-title":"IEEE Trans Pattern Anal Mach Intell"},{"key":"15981_CR252","doi-asserted-by":"publisher","first-page":"20","DOI":"10.1145\/3447587.3447591","volume-title":"2021 The 4th International Conference on Image and Graphics Processing","author":"J Ren","year":"2021","unstructured":"Ren J, Ren M, Liu R et al (2021) An Effective Imaging System for 3D Detection of Occluded Objects. In: 2021 The 4th International Conference on Image and Graphics Processing. ACM, New York, NY, USA, pp 20\u201330"},{"key":"15981_CR253","doi-asserted-by":"crossref","unstructured":"Renu Chebrolu KN and Kumar PN 2019 Deep Learning based Pedestrian Detection at all Light Conditions. In: 2019 International Conference on Communication and Signal Processing (ICCSP). IEEE, pp. 1\u20135","DOI":"10.1109\/ICCSP.2019.8698101"},{"issue":"18","key":"15981_CR254","doi-asserted-by":"publisher","first-page":"8027","DOI":"10.1016\/j.eswa.2014.07.008","volume":"41","author":"A Risnumawan","year":"2014","unstructured":"Risnumawan A, Shivakumara P, Chan CS, Tan CL (2014) A robust arbitrary text detection system for natural scene images. Expert Syst Appl 41(18):8027\u20138048. https:\/\/doi.org\/10.1016\/j.eswa.2014.07.008","journal-title":"Expert Syst Appl"},{"key":"15981_CR255","doi-asserted-by":"crossref","unstructured":"Rukhovich D, Vorontsova A and Konushin A 2022 ImVoxelNet: Image to Voxels Projection for Monocular and Multi-View General-Purpose 3D Object Detection. In: 2022 IEEE\/CVF Winter Conference on Applications of Computer Vision (WACV). IEEE, pp. 1265\u20131274","DOI":"10.1109\/WACV51458.2022.00133"},{"key":"15981_CR256","doi-asserted-by":"publisher","unstructured":"Sabu K and Rao P 2021 Prosodic event detection in children\u2019s read speech. Comput Speech Lang 68101200. https:\/\/doi.org\/10.1016\/j.csl.2021.101200","DOI":"10.1016\/j.csl.2021.101200"},{"issue":"1","key":"15981_CR257","doi-asserted-by":"publisher","first-page":"e1","DOI":"10.1002\/mp.13264","volume":"46","author":"B Sahiner","year":"2019","unstructured":"Sahiner B, Pezeshk A, Hadjiiski LM et al (2019) Deep learning in medical imaging and radiation therapy. Med Phys 46(1):e1\u2013e36. https:\/\/doi.org\/10.1002\/mp.13264","journal-title":"Med Phys"},{"issue":"2019","key":"15981_CR258","doi-asserted-by":"publisher","first-page":"207","DOI":"10.1016\/j.procs.2020.04.022","volume":"171","author":"NGS Sai Srinath","year":"2020","unstructured":"Sai Srinath NGS, Joseph AZ, Umamaheswaran S et al (2020) NITCAD - Developing an object detection, classification and stereo vision dataset for autonomous navigation in Indian roads. Procedia Comput Sci 171(2019):207\u2013216. https:\/\/doi.org\/10.1016\/j.procs.2020.04.022","journal-title":"Procedia Comput Sci"},{"key":"15981_CR259","doi-asserted-by":"crossref","unstructured":"Saleh K, Szenasi S and Vamossy Z 2021 Occlusion Handling in Generic Object Detection: A Review. In: 2021 IEEE 19th World Symposium on Applied Machine Intelligence and Informatics (SAMI). IEEE, 000477\u2013000484","DOI":"10.1109\/SAMI50585.2021.9378657"},{"key":"15981_CR260","doi-asserted-by":"crossref","unstructured":"Sanchez JA, Toselli AH, Romero V and Vidal E 2015 ICDAR 2015 competition HTRtS: Handwritten Text Recognition on the tranScriptorium dataset. In: 2015 13th International Conference on Document Analysis and Recognition (ICDAR). IEEE, pp. 1166\u20131170","DOI":"10.1109\/ICDAR.2015.7333944"},{"key":"15981_CR261","doi-asserted-by":"crossref","unstructured":"Sanchez JA, Romero V, Toselli AH, et al 2017 ICDAR2017 Competition on Handwritten Text Recognition on the READ Dataset. In: 2017 14th IAPR International Conference on Document Analysis and Recognition (ICDAR). IEEE, pp. 1383\u20131388","DOI":"10.1109\/ICDAR.2017.226"},{"key":"15981_CR262","doi-asserted-by":"crossref","unstructured":"Sch\u00f6ller FET, Plenge-Feidenhans\u2019L MK, Stets JD and Blanke M 2019 Assessing Deep-learning Methods for Object Detection at Sea from LWIR Images. In: IFAC-PapersOnLine. Elsevier Ltd, pp. 64\u201371","DOI":"10.1016\/j.ifacol.2019.12.284"},{"key":"15981_CR263","unstructured":"Sermanet P, Eigen D, Zhang X, et al 2014 Overfeat: Integrated recognition, localization and detection using convolutional networks. 2nd Int Conf Learn Represent ICLR 2014 - Conf Track Proc"},{"key":"15981_CR264","doi-asserted-by":"crossref","unstructured":"Setta S, Sinha S, Mishra M and Choudhury P 2022 Real-Time Facial Recognition Using SURF-FAST. In: Lecture Notes on Data Engineering and Communications Technologies, pp. 505\u2013522","DOI":"10.1007\/978-981-16-2937-2_32"},{"key":"15981_CR265","doi-asserted-by":"crossref","unstructured":"Shahab A, Shafait F and Dengel A 2011 ICDAR 2011 Robust Reading Competition Challenge 2: Reading Text in Scene Images. In: 2011 International Conference on Document Analysis and Recognition. IEEE, pp. 1491\u20131496","DOI":"10.1109\/ICDAR.2011.296"},{"key":"15981_CR266","doi-asserted-by":"publisher","unstructured":"Shao Z, Cheng G, Ma J, et al 2021 Real-time and Accurate UAV Pedestrian Detection for Social Distancing Monitoring in COVID-19 Pandemic. IEEE Trans Multimed 1\u20131. https:\/\/doi.org\/10.1109\/TMM.2021.3075566","DOI":"10.1109\/TMM.2021.3075566"},{"key":"15981_CR267","doi-asserted-by":"publisher","unstructured":"Sharma V, Mir RN (2019) Saliency guided faster-RCNN (SGFr-RCNN) model for object detection and recognition.\u00a0J King Saud Univ - Comput Inf Sci\u00a034(5):0\u201312. https:\/\/doi.org\/10.1016\/j.jksuci.2019.09.012","DOI":"10.1016\/j.jksuci.2019.09.012"},{"key":"15981_CR268","doi-asserted-by":"publisher","unstructured":"Sharma V and Mir RN 2020 A comprehensive and systematic look up into deep learning based object detection techniques: A review. Comput Sci Rev 38:100301. https:\/\/doi.org\/10.1016\/j.cosrev.2020.100301","DOI":"10.1016\/j.cosrev.2020.100301"},{"key":"15981_CR269","doi-asserted-by":"crossref","unstructured":"Sharma N, Mandal R, Sharma R, et al 2015 ICDAR2015 Competition on Video Script Identification (CVSI 2015). In: 2015 13th International Conference on Document Analysis and Recognition (ICDAR). IEEE, pp. 1196\u20131200","DOI":"10.1109\/ICDAR.2015.7333950"},{"key":"15981_CR270","doi-asserted-by":"publisher","unstructured":"Shashirangana J, Padmasiri H, Meedeniya D, et al 2021 License plate recognition using neural architecture search for edge devices. Int J Intell Syst 1\u201338. https:\/\/doi.org\/10.1002\/int.22471","DOI":"10.1002\/int.22471"},{"key":"15981_CR271","doi-asserted-by":"publisher","unstructured":"Shen ZY, Han SY, Fu LC, et al 2019 Deep convolution neural network with scene-centric and object-centric information for object detection. Image Vis Comput 85:14\u201325. https:\/\/doi.org\/10.1016\/j.imavis.2019.03.004","DOI":"10.1016\/j.imavis.2019.03.004"},{"key":"15981_CR272","doi-asserted-by":"publisher","unstructured":"Shepley AJ, Falzon G, Kwan P and Brankovic L 2023 Confluence: A Robust Non-IoU Alternative to Non-Maxima Suppression in Object Detection. IEEE Trans Pattern Anal Mach Intell 1\u201316. https:\/\/doi.org\/10.1109\/TPAMI.2023.3273210","DOI":"10.1109\/TPAMI.2023.3273210"},{"key":"15981_CR273","doi-asserted-by":"crossref","unstructured":"Shi X, Shan S, Kan M, et al 2018 Real-Time Rotation-Invariant Face Detection with Progressive Calibration Networks. In: 2018 IEEE\/CVF Conference on Computer Vision and Pattern Recognition. IEEE, pp. 2295\u20132303","DOI":"10.1109\/CVPR.2018.00244"},{"key":"15981_CR274","doi-asserted-by":"publisher","unstructured":"Shi Y, Zhang Z, Huang K, et al 2020 Human-computer interaction based on face feature localization. J Vis Commun Image Represent 70:1\u20136. https:\/\/doi.org\/10.1016\/j.jvcir.2019.102740","DOI":"10.1016\/j.jvcir.2019.102740"},{"key":"15981_CR275","unstructured":"Shrivastava A, Sukthankar R, Malik J and Gupta A 2016 Beyond Skip Connections: Top-Down Modulation for Object Detection"},{"key":"15981_CR276","doi-asserted-by":"publisher","unstructured":"Shyu M, Chen S, Iyengar SS (2020) A survey on deep learning algorithms, techniques, and applications. Strad Res 7(8). https:\/\/doi.org\/10.37896\/sr7.8\/037","DOI":"10.37896\/sr7.8\/037"},{"issue":"May 2019","key":"15981_CR277","doi-asserted-by":"publisher","DOI":"10.1016\/j.aap.2019.105319","volume":"134","author":"FW Siebert","year":"2020","unstructured":"Siebert FW, Lin H (2020) Detecting motorcycle helmet use with deep learning. Accid Anal Prev 134(May 2019):105319. https:\/\/doi.org\/10.1016\/j.aap.2019.105319","journal-title":"Accid Anal Prev"},{"key":"15981_CR278","unstructured":"Simonyan K and Zisserman A 2015 Very deep convolutional networks for large-scale image recognition. In: 3rd International Conference on Learning Representations, ICLR 2015 - Conference Track Proceedings. arXiv, 1\u201314"},{"key":"15981_CR279","doi-asserted-by":"publisher","unstructured":"Singh S and Prasad SVAV 2018 Techniques and challenges of face recognition: A critical review. Procedia Comput Sci 143:536\u2013543. https:\/\/doi.org\/10.1016\/j.procs.2018.10.427","DOI":"10.1016\/j.procs.2018.10.427"},{"key":"15981_CR280","doi-asserted-by":"crossref","unstructured":"Song H, Wang W, Zhao S, et al. 2018 Pyramid Dilated Deeper ConvLSTM for Video Salient Object Detection. In: Computer Vision \u2013 ECCV 2018. ECCV 2018. Lecture Notes in Computer Science, pp. 744\u2013760","DOI":"10.1007\/978-3-030-01252-6_44"},{"key":"15981_CR281","doi-asserted-by":"publisher","unstructured":"Song X, Wang P, Zhou D, et al 2019 APOLLOCAR3D: A large 3D car instance understanding benchmark for autonomous driving. Proc IEEE Comput Soc Conf Comput Vis Pattern Recognit 2019-June, pp. 5447\u20135457. https:\/\/doi.org\/10.1109\/CVPR.2019.00560","DOI":"10.1109\/CVPR.2019.00560"},{"key":"15981_CR282","doi-asserted-by":"publisher","unstructured":"Sri Jamiya S and Rani PE 2021 LittleYOLO-SPP: A delicate real-time vehicle detection algorithm. Optik (Stuttg) 225:165818. https:\/\/doi.org\/10.1016\/j.ijleo.2020.165818","DOI":"10.1016\/j.ijleo.2020.165818"},{"key":"15981_CR283","doi-asserted-by":"crossref","unstructured":"Su H, Wei S, Yan M, et al 2019 Object Detection and Instance Segmentation in Remote Sensing Imagery Based on Precise Mask R-CNN. In: IGARSS 2019\u20132019 IEEE International Geoscience and Remote Sensing Symposium. IEEE, 1454\u20131457","DOI":"10.1109\/IGARSS.2019.8898573"},{"issue":"4","key":"15981_CR284","doi-asserted-by":"publisher","first-page":"198","DOI":"10.1049\/trit.2018.1026","volume":"3","author":"S Sun","year":"2018","unstructured":"Sun S, Yin Y, Wang X et al (2018) Fast object detection based on binary deep convolution neural networks. CAAI Trans Intell Technol 3(4):198\u2013207. https:\/\/doi.org\/10.1049\/trit.2018.1026","journal-title":"CAAI Trans Intell Technol"},{"key":"15981_CR285","first-page":"5686","volume-title":"In: 2019 IEEE\/CVF Conference on Computer Vision and Pattern Recognition (CVPR)","author":"K Sun","year":"2019","unstructured":"Sun K, Xiao B, Liu D, Wang J (2019) Deep High-Resolution Representation Learning for Human Pose Estimation. In: In: 2019 IEEE\/CVF Conference on Computer Vision and Pattern Recognition (CVPR). IEEE, pp 5686\u20135696"},{"key":"15981_CR286","unstructured":"Sun K, Zhao Y, Jiang B, et al. 2019 High-Resolution Representations for Labeling Pixels and Regions"},{"key":"15981_CR287","doi-asserted-by":"crossref","unstructured":"Sun Y, Karatzas D, Chan CS, et al 2019 ICDAR 2019 Competition on Large-Scale Street View Text with Partial Labeling - RRC-LSVT. In: 2019 International Conference on Document Analysis and Recognition (ICDAR). IEEE, pp. 1557\u20131562","DOI":"10.1109\/ICDAR.2019.00250"},{"key":"15981_CR288","doi-asserted-by":"publisher","unstructured":"Sun P, Zheng Y, Zhou Z, et al. 2020 R4 Det: Refined single-stage detector with feature recursion and refinement for rotating object detection in aerial images. Image Vis Comput 1031\u201326. https:\/\/doi.org\/10.1016\/j.imavis.2020.104036","DOI":"10.1016\/j.imavis.2020.104036"},{"issue":"1","key":"15981_CR289","doi-asserted-by":"publisher","first-page":"102","DOI":"10.1080\/22797254.2021.1880975","volume":"54","author":"F Sun","year":"2021","unstructured":"Sun F, Li H, Liu Z et al (2021) Arbitrary-angle bounding box based location for object detection in remote sensing image. Eur J Remote Sens 54(1):102\u2013116. https:\/\/doi.org\/10.1080\/22797254.2021.1880975","journal-title":"Eur J Remote Sens"},{"key":"15981_CR290","doi-asserted-by":"publisher","unstructured":"Sun X, Wang P, Wang C, et al 2021 PBNet: Part-based convolutional neural network for complex composite object detection in remote sensing imagery. ISPRS J Photogramm Remote Sens 173:50\u201365. https:\/\/doi.org\/10.1016\/j.isprsjprs.2020.12.015","DOI":"10.1016\/j.isprsjprs.2020.12.015"},{"issue":"10","key":"15981_CR291","doi-asserted-by":"publisher","first-page":"1","DOI":"10.1002\/tee.23215","volume":"15","author":"T Suzuki","year":"2020","unstructured":"Suzuki T, Kageyama Y, Ishizawa C (2020) Recognition Method for Speed Limit Signs and its Applicability in Recognition of Vehicle Entry Prohibition Signs at Night. IEEJ Trans Electr Electron Eng 15(10):1\u20139. https:\/\/doi.org\/10.1002\/tee.23215","journal-title":"IEEJ Trans Electr Electron Eng"},{"issue":"6","key":"15981_CR292","doi-asserted-by":"publisher","first-page":"4307","DOI":"10.1016\/j.aej.2021.09.043","volume":"61","author":"M Tamilselvi","year":"2022","unstructured":"Tamilselvi M, Karthikeyan S (2022) An ingenious face recognition system based on HRPSM_CNN under unrestrained environmental condition. Alexandria Eng J 61(6):4307\u20134321. https:\/\/doi.org\/10.1016\/j.aej.2021.09.043","journal-title":"Alexandria Eng J"},{"key":"15981_CR293","doi-asserted-by":"crossref","unstructured":"Tan M, Pang R and Le Q V. 2019 EfficientDet: Scalable and efficient object detection. arXiv 10781\u201310790","DOI":"10.1109\/CVPR42600.2020.01079"},{"issue":"July","key":"15981_CR294","doi-asserted-by":"publisher","first-page":"1","DOI":"10.1016\/j.autcon.2020.103356","volume":"120","author":"S Tang","year":"2020","unstructured":"Tang S, Roberts D, Golparvar-Fard M (2020) Human-object interaction recognition for automatic construction site safety inspection. Autom Constr 120(July):1\u201316. https:\/\/doi.org\/10.1016\/j.autcon.2020.103356","journal-title":"Autom Constr"},{"key":"15981_CR295","doi-asserted-by":"crossref","unstructured":"Tanner F, Colder B, Pullen C, et al 2009 Overhead imagery research data set \u2014 an annotated data library & tools to aid in the development of computer vision algorithms. In: 2009 IEEE Applied Imagery Pattern Recognition Workshop (AIPR 2009). IEEE, pp. 1\u20138","DOI":"10.1109\/AIPR.2009.5466304"},{"key":"15981_CR296","doi-asserted-by":"crossref","unstructured":"Tarchoun B, Jegham I, Khalifa AB, et al 2020 Deep CNN-based Pedestrian Detection for Intelligent Infrastructure. In: 2020 5th International Conference on Advanced Technologies for Signal and Image Processing (ATSIP). IEEE, 1\u20136","DOI":"10.1109\/ATSIP49331.2020.9231712"},{"key":"15981_CR297","doi-asserted-by":"publisher","unstructured":"Taskiran M, Kahraman N and Erdem CE 2020 Face recognition: Past, present and future (a review). Digit Signal Process 1061\u201328. https:\/\/doi.org\/10.1016\/j.dsp.2020.102809","DOI":"10.1016\/j.dsp.2020.102809"},{"key":"15981_CR298","unstructured":"Terven J and Cordova-Esparza D 2023 A Comprehensive Review of YOLO: From YOLOv1 to YOLOv8 and Beyond. 1\u201327"},{"issue":"5","key":"15981_CR299","doi-asserted-by":"publisher","first-page":"416","DOI":"10.1080\/2150704X.2020.1722330","volume":"11","author":"Z Tian","year":"2020","unstructured":"Tian Z, Zhan R, Wang W et al (2020) Object detection in optical remote sensing images by integrating object-to-object relationships. Remote Sens Lett 11(5):416\u2013425. https:\/\/doi.org\/10.1080\/2150704X.2020.1722330","journal-title":"Remote Sens Lett"},{"key":"15981_CR300","first-page":"633","volume-title":"Machine Vision and Applications","author":"R Timofte","year":"2014","unstructured":"Timofte R, Zimmermann K, Van Gool L (2014) Multi-view traffic sign detection, recognition, and 3D localisation. In: Machine Vision and Applications. Springer, pp 633\u2013647"},{"key":"15981_CR301","doi-asserted-by":"publisher","unstructured":"Tong K, Wu Y and Zhou F 2020 Recent advances in small object detection based on deep learning: A review. Image Vis Comput 97:103910. https:\/\/doi.org\/10.1016\/j.imavis.2020.103910","DOI":"10.1016\/j.imavis.2020.103910"},{"key":"15981_CR302","first-page":"252","volume-title":"Lecture Notes in Computer Science (including subseries Lecture Notes in Artificial Intelligence and Lecture Notes in Bioinformatics)","author":"P Tran","year":"2021","unstructured":"Tran P, Pattichis M, Celed\u00f3n-Pattichis S, L\u00f3pezLeiva C (2021) Facial Recognition in Collaborative Learning Videos. In: Lecture Notes in Computer Science (including subseries Lecture Notes in Artificial Intelligence and Lecture Notes in Bioinformatics). Springer, pp 252\u2013261"},{"key":"15981_CR303","doi-asserted-by":"publisher","first-page":"262","DOI":"10.1109\/ICCE48956.2021.9352140","volume-title":"In: 2020 IEEE Eighth International Conference on Communications and Electronics (ICCE)","author":"T-H Tran","year":"2021","unstructured":"Tran T-H, Nguyen DT, Phuong Nguyen T (2021) Human Posture Classification from Multiple Viewpoints and Application for Fall Detection. In: In: 2020 IEEE Eighth International Conference on Communications and Electronics (ICCE). IEEE, pp 262\u2013267"},{"issue":"June","key":"15981_CR304","doi-asserted-by":"publisher","first-page":"65","DOI":"10.1016\/j.bdr.2017.06.002","volume":"11","author":"D Triantafyllidou","year":"2018","unstructured":"Triantafyllidou D, Nousi P, Tefas A (2018) Fast Deep Convolutional Face Detection in the Wild Exploiting Hard Sample Mining. Big Data Res 11(June):65\u201376. https:\/\/doi.org\/10.1016\/j.bdr.2017.06.002","journal-title":"Big Data Res"},{"issue":"2","key":"15981_CR305","doi-asserted-by":"publisher","first-page":"154","DOI":"10.1007\/s11263-013-0620-5","volume":"104","author":"JRR Uijlings","year":"2013","unstructured":"Uijlings JRR, van de Sande KEA, Gevers T, Smeulders AWM (2013) Selective Search for Object Recognition. Int J Comput Vis 104(2):154\u2013171. https:\/\/doi.org\/10.1007\/s11263-013-0620-5","journal-title":"Int J Comput Vis"},{"issue":"2","key":"15981_CR306","doi-asserted-by":"publisher","first-page":"721","DOI":"10.1007\/s12652-020-02845-8","volume":"13","author":"S Umer","year":"2022","unstructured":"Umer S, Rout RK, Pero C, Nappi M (2022) Facial expression recognition with trade-offs between data augmentation and deep learning features. J Ambient Intell Humaniz Comput 13(2):721\u2013735. https:\/\/doi.org\/10.1007\/s12652-020-02845-8","journal-title":"J Ambient Intell Humaniz Comput"},{"key":"15981_CR307","first-page":"419","volume-title":"Lecture Notes in Computer Science (including subseries Lecture Notes in Artificial Intelligence and Lecture Notes in Bioinformatics)","author":"M Vandersteegen","year":"2018","unstructured":"Vandersteegen M, Van Beeck K, Goedem\u00e9 T (2018) Real-Time Multispectral Pedestrian Detection with a Single-Pass Deep Neural Network. In: Lecture Notes in Computer Science (including subseries Lecture Notes in Artificial Intelligence and Lecture Notes in Bioinformatics). Springer, pp 419\u2013426"},{"key":"15981_CR308","doi-asserted-by":"publisher","unstructured":"Vashisht M, Kumar B 2020 A Survey Paper on Object Detection Methods in Image Processing. 2020 Int Conf Comput Sci Eng Appl ICCSEA 2020. https:\/\/doi.org\/10.1109\/ICCSEA49143.2020.9132871","DOI":"10.1109\/ICCSEA49143.2020.9132871"},{"key":"15981_CR309","unstructured":"Veit A, Matera T, Neumann L, et al 2016 COCO-Text: Dataset and Benchmark for Text Detection and Recognition in Natural Images"},{"key":"15981_CR310","first-page":"1","volume-title":"In: 2019 IEEE International Conference on Consumer Electronics (ICCE)","author":"A Vennelakanti","year":"2019","unstructured":"Vennelakanti A, Shreya S, Rajendran R et al (2019) Traffic Sign Detection and Recognition using a CNN Ensemble. In: In: 2019 IEEE International Conference on Consumer Electronics (ICCE). IEEE, pp 1\u20134"},{"key":"15981_CR311","doi-asserted-by":"publisher","unstructured":"Voulodimos A, Doulamis N, Doulamis A, Protopapadakis E (2018) Deep Learning for Computer Vision: A Brief Review. Comput Intell Neurosci 20181\u201313. https:\/\/doi.org\/10.1155\/2018\/7068349","DOI":"10.1155\/2018\/7068349"},{"key":"15981_CR312","doi-asserted-by":"publisher","unstructured":"Vuola AO, Akram SU and Kannala J 2019 Mask-RCNN and u-net ensembled for nuclei segmentation. Proc - Int Symp Biomed Imaging 2019-April (Isbi): 208\u2013212. https:\/\/doi.org\/10.1109\/ISBI.2019.8759574","DOI":"10.1109\/ISBI.2019.8759574"},{"issue":"4","key":"15981_CR313","doi-asserted-by":"publisher","first-page":"359","DOI":"10.1049\/rsn2.12042","volume":"15","author":"AM Wallace","year":"2021","unstructured":"Wallace AM, Mukherjee S, Toh B, Ahrabian A (2021) Combining automotive radar and LiDAR for surface detection in adverse conditions. IET Radar, Sonar Navig 15(4):359\u2013369. https:\/\/doi.org\/10.1049\/rsn2.12042","journal-title":"IET Radar, Sonar Navig"},{"issue":"7","key":"15981_CR314","doi-asserted-by":"publisher","first-page":"4487","DOI":"10.1109\/TITS.2020.3017505","volume":"22","author":"S Wan","year":"2021","unstructured":"Wan S, Xu X, Wang T, Gu Z (2021) An Intelligent Video Analysis Method for Abnormal Event Detection in Intelligent Transportation Systems. IEEE Trans Intell Transp Syst 22(7):4487\u20134495. https:\/\/doi.org\/10.1109\/TITS.2020.3017505","journal-title":"IEEE Trans Intell Transp Syst"},{"key":"15981_CR315","doi-asserted-by":"publisher","unstructured":"Wang W 2020 Detection of panoramic vision pedestrian based on deep learning. Image Vis Comput 103:103986. https:\/\/doi.org\/10.1016\/j.imavis.2020.103986","DOI":"10.1016\/j.imavis.2020.103986"},{"key":"15981_CR316","doi-asserted-by":"crossref","unstructured":"Wang K and Belongie S 2010 Word Spotting in the Wild. In: 11th European Conference on Computer Vision. Springer, 591\u2013604","DOI":"10.1007\/978-3-642-15549-9_43"},{"issue":"22","key":"15981_CR317","doi-asserted-by":"publisher","first-page":"1","DOI":"10.1002\/cpe.4675","volume":"30","author":"Q Wang","year":"2018","unstructured":"Wang Q, Fu W (2018) Research on traffic sign detection algorithm based on deep learning. Concurr Comput Pract Exp 30(22):1\u20138. https:\/\/doi.org\/10.1002\/cpe.4675","journal-title":"Concurr Comput Pract Exp"},{"issue":"1","key":"15981_CR318","doi-asserted-by":"publisher","first-page":"71","DOI":"10.1080\/22797254.2021.2018944","volume":"55","author":"H Wang","year":"2022","unstructured":"Wang H, Miao F (2022) Building extraction from remote sensing images using deep residual U-Net. Eur J Remote Sens 55(1):71\u201385. https:\/\/doi.org\/10.1080\/22797254.2021.2018944","journal-title":"Eur J Remote Sens"},{"key":"15981_CR319","unstructured":"Wang J, Yuan Y and Yu G 2017 Face Attention Network: An Effective Face Detector for the Occluded Faces. 1\u201310"},{"key":"15981_CR320","doi-asserted-by":"publisher","unstructured":"Wang S, Du Y and Huang Z 2017 Ear detection using fully convolutional networks. ACM Int Conf Proceeding Ser Part F 1319:50\u201355. https:\/\/doi.org\/10.1145\/3141166.3141168","DOI":"10.1145\/3141166.3141168"},{"issue":"1","key":"15981_CR321","doi-asserted-by":"publisher","first-page":"38","DOI":"10.1109\/TIP.2017.2754941","volume":"27","author":"W Wang","year":"2018","unstructured":"Wang W, Shen J, Shao L (2018) Video Salient Object Detection via Fully Convolutional Networks. IEEE Trans Image Process 27(1):38\u201349. https:\/\/doi.org\/10.1109\/TIP.2017.2754941","journal-title":"IEEE Trans Image Process"},{"issue":"1","key":"15981_CR322","doi-asserted-by":"publisher","first-page":"20","DOI":"10.1109\/TPAMI.2017.2662005","volume":"40","author":"W Wang","year":"2018","unstructured":"Wang W, Shen J, Yang R, Porikli F (2018) A Unified Spatiotemporal Prior based on Geodesic Distance for Video Object Segmentation. IEEE Trans Pattern Anal Mach Intell 40(1):20\u201333. https:\/\/doi.org\/10.1109\/TPAMI.2017.2662005","journal-title":"IEEE Trans Pattern Anal Mach Intell"},{"issue":"1","key":"15981_CR323","doi-asserted-by":"publisher","first-page":"20","DOI":"10.1109\/TPAMI.2017.2662005","volume":"40","author":"W Wang","year":"2018","unstructured":"Wang W, Shen J, Yang R, Porikli F (2018) Saliency-Aware Video Object Segmentation. IEEE Trans Pattern Anal Mach Intell 40(1):20\u201333. https:\/\/doi.org\/10.1109\/TPAMI.2017.2662005","journal-title":"IEEE Trans Pattern Anal Mach Intell"},{"key":"15981_CR324","doi-asserted-by":"crossref","unstructured":"Wang H, Li J, Zhou Y, et al 2019 Research on the Technology of Indoor and Outdoor Integration Robot Inspection in Substation. In: 2019 IEEE 3rd Information Technology, Networking, Electronic and Automation Control Conference (ITNEC). IEEE, 2366\u20132369","DOI":"10.1109\/ITNEC.2019.8729355"},{"issue":"March 2018","key":"15981_CR325","doi-asserted-by":"publisher","first-page":"145","DOI":"10.1016\/j.image.2018.09.013","volume":"70","author":"R Wang","year":"2019","unstructured":"Wang R, Xu J, Han TX (2019) Object instance detection with pruned Alexnet and extended training data. Signal Process Image Commun 70(March 2018):145\u2013156. https:\/\/doi.org\/10.1016\/j.image.2018.09.013","journal-title":"Signal Process Image Commun"},{"key":"15981_CR326","doi-asserted-by":"crossref","unstructured":"Wang W, Xie E, Li X, et al 2019 Shape Robust Text Detection With Progressive Scale Expansion Network. In: 2019 IEEE\/CVF Conference on Computer Vision and Pattern Recognition (CVPR). IEEE, pp. 9336\u20139345","DOI":"10.1109\/CVPR.2019.00956"},{"key":"15981_CR327","doi-asserted-by":"crossref","unstructured":"Wang A, Sun Y, Kortylewski A and Yuille A 2020 Robust Object Detection Under Occlusion With Context-Aware CompositionalNets. In: 2020 IEEE\/CVF Conference on Computer Vision and Pattern Recognition (CVPR). IEEE, 12642\u201312651","DOI":"10.1109\/CVPR42600.2020.01266"},{"key":"15981_CR328","doi-asserted-by":"crossref","unstructured":"Wang C-Y, Bochkovskiy A and Liao H-YM 2020 Scaled-YOLOv4: Scaling Cross Stage Partial Network. arXiv","DOI":"10.1109\/CVPR46437.2021.01283"},{"key":"15981_CR329","doi-asserted-by":"publisher","unstructured":"Wang N, Wang Y and Er MJ 2020 Review on deep learning techniques for marine object recognition: Architectures and algorithms. Control Eng Pract (April): 104458. https:\/\/doi.org\/10.1016\/j.conengprac.2020.104458","DOI":"10.1016\/j.conengprac.2020.104458"},{"key":"15981_CR330","doi-asserted-by":"publisher","unstructured":"Wang Q, Zhang L, Li Y and Kpalma K 2020 Overview of deep-learning based methods for salient object detection in videos. Pattern Recognit 104:107340. https:\/\/doi.org\/10.1016\/j.patcog.2020.107340","DOI":"10.1016\/j.patcog.2020.107340"},{"key":"15981_CR331","doi-asserted-by":"crossref","unstructured":"Wang Y, Xie H, Zha Z, et al 2020 ContourNet: Taking a Further Step Toward Accurate Arbitrary-Shaped Scene Text Detection. In: 2020 IEEE\/CVF Conference on Computer Vision and Pattern Recognition (CVPR). IEEE, 11753\u201311762","DOI":"10.1109\/CVPR42600.2020.01177"},{"key":"15981_CR332","doi-asserted-by":"crossref","unstructured":"Wang J, Song L, Li Z, et al 2021 End-to-End Object Detection with Fully Convolutional Network. In: 2021 IEEE\/CVF Conference on Computer Vision and Pattern Recognition (CVPR). IEEE, 15844\u201315853","DOI":"10.1109\/CVPR46437.2021.01559"},{"key":"15981_CR333","doi-asserted-by":"crossref","unstructured":"Wang C-Y, Bochkovskiy A and Liao H-YM 2022 YOLOv7: Trainable bag-of-freebies sets new state-of-the-art for real-time object detectors. 1\u201315","DOI":"10.1109\/CVPR52729.2023.00721"},{"issue":"1","key":"15981_CR334","doi-asserted-by":"publisher","first-page":"145","DOI":"10.1049\/ipr2.12340","volume":"16","author":"G Wang","year":"2022","unstructured":"Wang G, Ding H, Li B et al (2022) Trident-YOLO: Improving the precision and speed of mobile device object detection. IET Image Process 16(1):145\u2013157. https:\/\/doi.org\/10.1049\/ipr2.12340","journal-title":"IET Image Process"},{"issue":"1","key":"15981_CR335","doi-asserted-by":"publisher","first-page":"1","DOI":"10.1145\/3466780","volume":"18","author":"J Wang","year":"2022","unstructured":"Wang J, Min W, Hou S et al (2022) LogoDet-3K: A Large-scale Image Dataset for Logo Detection. ACM Trans Multimed Comput Commun Appl 18(1):1\u201319. https:\/\/doi.org\/10.1145\/3466780","journal-title":"ACM Trans Multimed Comput Commun Appl"},{"issue":"December 2019","key":"15981_CR336","doi-asserted-by":"publisher","DOI":"10.1016\/j.cviu.2020.102907","volume":"193","author":"L Wen","year":"2020","unstructured":"Wen L, Du D, Cai Z et al (2020) UA-DETRAC: A new benchmark and protocol for multi-object detection and tracking. Comput Vis Image Underst 193(December 2019):102907. https:\/\/doi.org\/10.1016\/j.cviu.2020.102907","journal-title":"Comput Vis Image Underst"},{"issue":"8","key":"15981_CR337","doi-asserted-by":"publisher","first-page":"742","DOI":"10.1049\/iet-cvi.2018.5654","volume":"13","author":"F Wong","year":"2019","unstructured":"Wong F, Hu H (2019) Adaptive learning feature pyramid for object detection. IET Comput Vis 13(8):742\u2013748. https:\/\/doi.org\/10.1049\/iet-cvi.2018.5654","journal-title":"IET Comput Vis"},{"key":"15981_CR338","doi-asserted-by":"publisher","unstructured":"Wo\u017aniak M, Po\u0142ap D (2018) Object detection and recognition via clustered features. Neurocomputing 3201\u20139. https:\/\/doi.org\/10.1016\/j.neucom.2018.09.003","DOI":"10.1016\/j.neucom.2018.09.003"},{"key":"15981_CR339","doi-asserted-by":"crossref","unstructured":"Wu C-W and Ding J-J 2021 Multi-Viewpoint Patterns and Occlusions Handling Using Hybrid Features for Vehicle Tracking. In: 2021 IEEE International Symposium on Circuits and Systems (ISCAS). IEEE, 1\u20135","DOI":"10.1109\/ISCAS51556.2021.9401298"},{"key":"15981_CR340","first-page":"280","volume-title":"In: 2018 11th International Symposium on Computational Intelligence and Design (ISCID)","author":"S Wu","year":"2018","unstructured":"Wu S, Zhang L (2018) Using Popular Object Detection Methods for Real Time Forest Fire Detection. In: In: 2018 11th International Symposium on Computational Intelligence and Design (ISCID). IEEE, pp 280\u2013284"},{"key":"15981_CR341","doi-asserted-by":"crossref","unstructured":"Wu J, Zhou C, Zhang Q, et al 2020 Self-Mimic Learning for Small-scale Pedestrian Detection. In: Proceedings of the 28th ACM International Conference on Multimedia. ACM, New York, NY, USA, pp. 1\u20139","DOI":"10.1145\/3394171.3413634"},{"key":"15981_CR342","doi-asserted-by":"publisher","unstructured":"Wu K, Bai C, Wang D, et al 2021 Improved Object Detection Algorithm of YOLOv3 Remote Sensing Image. IEEE Access 9113889\u2013113900. https:\/\/doi.org\/10.1109\/ACCESS.2021.3103522","DOI":"10.1109\/ACCESS.2021.3103522"},{"key":"15981_CR343","doi-asserted-by":"publisher","unstructured":"Wu S, Xu Y, Zhang B, et al 2021 Deformable Template Network (DTN) for Object Detection. IEEE Trans Multimed 1\u201311. https:\/\/doi.org\/10.1109\/TMM.2021.3075323","DOI":"10.1109\/TMM.2021.3075323"},{"issue":"1","key":"15981_CR344","doi-asserted-by":"publisher","first-page":"36","DOI":"10.1049\/cvi2.12015","volume":"15","author":"Y Wu","year":"2021","unstructured":"Wu Y, Feng S, Huang X, Wu Z (2021) L4Net: An anchor-free generic object detector with attention mechanism for autonomous driving. IET Comput Vis 15(1):36\u201346. https:\/\/doi.org\/10.1049\/cvi2.12015","journal-title":"IET Comput Vis"},{"issue":"Xx","key":"15981_CR345","doi-asserted-by":"publisher","first-page":"3113","DOI":"10.1109\/TIP.2021.3058783","volume":"30","author":"YH Wu","year":"2021","unstructured":"Wu YH, Gao SH, Mei J et al (2021) JCS: An Explainable COVID-19 Diagnosis System by Joint Classification and Segmentation. IEEE Trans Image Process 30(Xx):3113\u20133126. https:\/\/doi.org\/10.1109\/TIP.2021.3058783","journal-title":"IEEE Trans Image Process"},{"issue":"108214","key":"15981_CR346","doi-asserted-by":"publisher","first-page":"1","DOI":"10.1016\/j.patcog.2021.108214","volume":"122","author":"J Wu","year":"2022","unstructured":"Wu J, Du J, Wang F et al (2022) A multimodal attention fusion network with a dynamic vocabulary for TextVQA. Pattern Recogn 122(108214):1\u201310. https:\/\/doi.org\/10.1016\/j.patcog.2021.108214","journal-title":"Pattern Recogn"},{"key":"15981_CR347","doi-asserted-by":"publisher","unstructured":"Xia GS, Bai X, Ding J, et al 2018 DOTA: A Large-Scale Dataset for Object Detection in Aerial Images. Proc IEEE Comput Soc Conf Comput Vis Pattern Recognit 3974\u20133983. https:\/\/doi.org\/10.1109\/CVPR.2018.00418","DOI":"10.1109\/CVPR.2018.00418"},{"issue":"33\u201334","key":"15981_CR348","doi-asserted-by":"publisher","first-page":"23729","DOI":"10.1007\/s11042-020-08976-6","volume":"79","author":"Y Xiao","year":"2020","unstructured":"Xiao Y, Tian Z, Yu J et al (2020) A review of object detection based on deep learning. Multimed Tools Appl 79(33\u201334):23729\u201323791. https:\/\/doi.org\/10.1007\/s11042-020-08976-6","journal-title":"Multimed Tools Appl"},{"key":"15981_CR349","doi-asserted-by":"publisher","unstructured":"Xiao Y, Jiang A, Ye J, Wang M-W (2020) Making of Night Vision: Object Detection Under Low-Illumination. IEEE Access 8123075\u2013123086. https:\/\/doi.org\/10.1109\/ACCESS.2020.3007610","DOI":"10.1109\/ACCESS.2020.3007610"},{"issue":"March","key":"15981_CR350","doi-asserted-by":"publisher","DOI":"10.1016\/j.autcon.2021.103721","volume":"127","author":"B Xiao","year":"2021","unstructured":"Xiao B, Lin Q, Chen Y (2021) A vision-based method for automatic tracking of construction machines at nighttime based on deep learning illumination enhancement. Autom Constr 127(March):103721. https:\/\/doi.org\/10.1016\/j.autcon.2021.103721","journal-title":"Autom Constr"},{"key":"15981_CR351","doi-asserted-by":"crossref","unstructured":"Xing J, Fang G, Zhong J and Li J 2019 Application of Face Recognition Based on CNN in Fatigue Driving Detection. In: Proceedings of the 2019 International Conference on Artificial Intelligence and Advanced Manufacturing - AIAM 2019. ACM Press, New York, New York, USA, 1\u20135","DOI":"10.1145\/3358331.3358387"},{"issue":"10","key":"15981_CR352","doi-asserted-by":"publisher","first-page":"1578","DOI":"10.1049\/gtd2.12088","volume":"15","author":"S Xiong","year":"2021","unstructured":"Xiong S, Liu Y, Yan Y et al (2021) Object recognition for power equipment via human-level concept learning. IET Gener Transm Distrib 15(10):1578\u20131587. https:\/\/doi.org\/10.1049\/gtd2.12088","journal-title":"IET Gener Transm Distrib"},{"key":"15981_CR353","doi-asserted-by":"crossref","unstructured":"Xu D, Ouyang W, Ricci E, et al 2017 Learning Cross-Modal Deep Representations for Robust Pedestrian Detection. In: 2017 IEEE Conference on Computer Vision and Pattern Recognition (CVPR). IEEE, 5363\u20135371","DOI":"10.1109\/CVPR.2017.451"},{"key":"15981_CR354","doi-asserted-by":"crossref","unstructured":"Xu S, Cheng Y, Gu K, et al 2017 Jointly Attentive Spatial-Temporal Pooling Networks for Video-Based Person Re-identification. In: 2017 IEEE International Conference on Computer Vision (ICCV). IEEE, 4743\u20134752","DOI":"10.1109\/ICCV.2017.507"},{"issue":"1s","key":"15981_CR355","doi-asserted-by":"publisher","first-page":"1","DOI":"10.1145\/3414839","volume":"17","author":"X Xu","year":"2021","unstructured":"Xu X, Wang S, Wang Z et al (2021) Exploring Image Enhancement for Salient Object Detection in Low Light Images. ACM Trans Multimed Comput Commun Appl 17(1s):1\u201319. https:\/\/doi.org\/10.1145\/3414839","journal-title":"ACM Trans Multimed Comput Commun Appl"},{"key":"15981_CR356","doi-asserted-by":"publisher","unstructured":"Xu B, Wang W, Guo L, et al 2022 CattleFaceNet: A cattle face identification approach based on RetinaFace and ArcFace loss. Comput Electron Agric 193:106675. https:\/\/doi.org\/10.1016\/j.compag.2021.106675","DOI":"10.1016\/j.compag.2021.106675"},{"key":"15981_CR357","doi-asserted-by":"publisher","unstructured":"Xu H, Guo M, Nedjah N, et al 2022 Vehicle and Pedestrian Detection Algorithm Based on Lightweight YOLOv3-Promote and Semi-Precision Acceleration. IEEE Trans Intell Transp Syst 1\u201312. https:\/\/doi.org\/10.1109\/TITS.2021.3137253","DOI":"10.1109\/TITS.2021.3137253"},{"key":"15981_CR358","doi-asserted-by":"publisher","unstructured":"Xue C, Lu S and Hoi S 2022 Detection and rectification of arbitrary shaped scene texts by using text keypoints and links. Pattern Recognit 1241\u201331. https:\/\/doi.org\/10.1016\/j.patcog.2021.108494","DOI":"10.1016\/j.patcog.2021.108494"},{"issue":"4","key":"15981_CR359","doi-asserted-by":"publisher","first-page":"611","DOI":"10.1007\/s13244-018-0639-9","volume":"9","author":"R Yamashita","year":"2018","unstructured":"Yamashita R, Nishio M, Do RKG, Togashi K (2018) Convolutional neural networks: an overview and application in radiology. Insights Imaging 9(4):611\u2013629. https:\/\/doi.org\/10.1007\/s13244-018-0639-9","journal-title":"Insights Imaging"},{"key":"15981_CR360","unstructured":"Yang B, Yan J, Lei Z, Li SZ 2015 Fine-grained evaluation on face detection in the wild. In: 2015 11th IEEE International Conference and Workshops on Automatic Face and Gesture Recognition (FG). IEEE, 1\u20137"},{"key":"15981_CR361","doi-asserted-by":"crossref","unstructured":"Yang S, Luo P, Loy CC and Tang X 2016 WIDER FACE: A Face Detection Benchmark. In: 2016 IEEE Conference on Computer Vision and Pattern Recognition (CVPR). IEEE, 5525\u20135533","DOI":"10.1109\/CVPR.2016.596"},{"key":"15981_CR362","unstructured":"Yang S, Xiong Y, Loy CC and Tang X 2017 Face Detection through Scale-Friendly Deep Convolutional Networks"},{"issue":"8","key":"15981_CR363","doi-asserted-by":"publisher","first-page":"1845","DOI":"10.1109\/TPAMI.2017.2738644","volume":"40","author":"S Yang","year":"2018","unstructured":"Yang S, Luo P, Loy CC, Tang X (2018) Faceness-Net: Face Detection through Deep Facial Part Responses. IEEE Trans Pattern Anal Mach Intell 40(8):1845\u20131859. https:\/\/doi.org\/10.1109\/TPAMI.2017.2738644","journal-title":"IEEE Trans Pattern Anal Mach Intell"},{"key":"15981_CR364","doi-asserted-by":"crossref","unstructured":"Yang T, Wu J, Liu L, et al 2020 VTD-Net: Depth Face Forgery Oriented Video Tampering Detection based on Convolutional Neural Network. In: 2020 39th Chinese Control Conference (CCC). IEEE, 7247\u20137251","DOI":"10.23919\/CCC50068.2020.9188580"},{"issue":"4","key":"15981_CR365","doi-asserted-by":"publisher","first-page":"1837","DOI":"10.1007\/s00542-019-04694-8","volume":"27","author":"H Yang","year":"2021","unstructured":"Yang H, Liu P, Hu Y, Fu J (2021) Research on underwater object recognition based on YOLOv3. Microsyst Technol 27(4):1837\u20131844. https:\/\/doi.org\/10.1007\/s00542-019-04694-8","journal-title":"Microsyst Technol"},{"issue":"1","key":"15981_CR366","doi-asserted-by":"publisher","first-page":"57","DOI":"10.1049\/ipr2.12005","volume":"15","author":"W Yang","year":"2021","unstructured":"Yang W, Zhang J, Chen Z, Xu Z (2021) An efficient semantic segmentation method based on transfer learning from object detection. IET Image Process 15(1):57\u201364. https:\/\/doi.org\/10.1049\/ipr2.12005","journal-title":"IET Image Process"},{"key":"15981_CR367","unstructured":"Yao C, Bai X, Liu W, et al. 2012 Detecting texts of arbitrary orientations in natural images. In: 2012 IEEE Conference on Computer Vision and Pattern Recognition. IEEE, 1083\u20131090"},{"key":"15981_CR368","doi-asserted-by":"publisher","unstructured":"Yao L, Liu H, Hu Z, et al 2019 Cow face detection and recognition based on automatic feature extraction algorithm. ACM Int Conf Proceeding Ser. https:\/\/doi.org\/10.1145\/3321408.3322628","DOI":"10.1145\/3321408.3322628"},{"issue":"November 2018","key":"15981_CR369","doi-asserted-by":"publisher","DOI":"10.1016\/j.cviu.2019.102827","volume":"189","author":"J Yi","year":"2019","unstructured":"Yi J, Wu P, Metaxas DN (2019) ASSD: Attentive single shot multibox detector. Comput Vis Image Underst 189(November 2018):102827. https:\/\/doi.org\/10.1016\/j.cviu.2019.102827","journal-title":"Comput Vis Image Underst"},{"key":"15981_CR370","doi-asserted-by":"crossref","unstructured":"Yu H, Zhang C, Li X, et al 2019 An End-to-End Video Text Detector with Online Tracking. In: 2019 International Conference on Document Analysis and Recognition (ICDAR). IEEE, 601\u2013606","DOI":"10.1109\/ICDAR.2019.00102"},{"key":"15981_CR371","doi-asserted-by":"crossref","unstructured":"Yu Z, Zhuge Y, Lu H and Zhang L 2019 Joint learning of saliency detection and weakly supervised semantic segmentation. In: Proceedings of the IEEE International Conference on Computer Vision. IEEE, 7222\u20137232","DOI":"10.1109\/ICCV.2019.00732"},{"key":"15981_CR372","doi-asserted-by":"crossref","unstructured":"Yuan L and Lu F 2018 Real-Time Ear Detection Based On Embedded Systems. In: 2018 International Conference on Machine Learning and Cybernetics (ICMLC). IEEE, 115\u2013120","DOI":"10.1109\/ICMLC.2018.8526987"},{"key":"15981_CR373","doi-asserted-by":"publisher","unstructured":"Yuan J, Xiong HC, Xiao Y, et al (2020) Gated CNN: Integrating multi-scale feature layers for object detection. Pattern Recognit 105:107131. https:\/\/doi.org\/10.1016\/j.patcog.2019.107131","DOI":"10.1016\/j.patcog.2019.107131"},{"key":"15981_CR374","doi-asserted-by":"publisher","unstructured":"Yuan Y, Chen L, Wu H, Li L (2021) Advanced agricultural disease image recognition technologies: A review.\u00a0Inf Process Agric\u00a09(1):1\u201312. https:\/\/doi.org\/10.1016\/j.inpa.2021.01.003","DOI":"10.1016\/j.inpa.2021.01.003"},{"issue":"5","key":"15981_CR375","doi-asserted-by":"publisher","first-page":"931","DOI":"10.1049\/cje.2021.07.004","volume":"30","author":"Y Yuanchen","year":"2021","unstructured":"Yuanchen Y, Yunfei C, Dongsheng W (2021) GridNet-3D: A Novel Real-Time 3D Object Detection Algorithm Based on Point Cloud. Chin J Electron 30(5):931\u2013939. https:\/\/doi.org\/10.1049\/cje.2021.07.004","journal-title":"Chin J Electron"},{"key":"15981_CR376","unstructured":"Yucel MK, Bilge YC, Oguz O, et al. 2018 Wildest Faces: Face Detection and Recognition in Violent Settings"},{"key":"15981_CR377","unstructured":"Yuliang L, Lianwen J, Shuaitao Z and Sheng Z 2017 Detecting Curve Text in the Wild: New Dataset and New Solution"},{"key":"15981_CR378","doi-asserted-by":"publisher","unstructured":"Zakria Z, Deng J, Kumar R, et al 2022 Multiscale and Direction Target Detecting in Remote Sensing Images via Modified YOLO-v4. IEEE J Sel Top Appl Earth Obs Remote Sens 151039\u20131048. https:\/\/doi.org\/10.1109\/JSTARS.2022.3140776","DOI":"10.1109\/JSTARS.2022.3140776"},{"key":"15981_CR379","doi-asserted-by":"crossref","unstructured":"Zhang H and Hong X 2019 Recent progresses on object detection: a brief review. In: Multimedia Tools and Applications. Multimedia Tools and Applications, pp. 27809\u201327847","DOI":"10.1007\/s11042-019-07898-2"},{"issue":"11","key":"15981_CR380","doi-asserted-by":"publisher","first-page":"9682","DOI":"10.1109\/TGRS.2020.3045708","volume":"59","author":"L Zhang","year":"2021","unstructured":"Zhang L, Ma J (2021) Salient Object Detection Based on Progressively Supervised Learning for Remote Sensing Images. IEEE Trans Geosci Remote Sens 59(11):9682\u20139696. https:\/\/doi.org\/10.1109\/TGRS.2020.3045708","journal-title":"IEEE Trans Geosci Remote Sens"},{"key":"15981_CR381","doi-asserted-by":"publisher","unstructured":"Zhang Q, Wan C and Jiang M 2017 Multiple objects detection based on improved faster RCNN. ACM Int Conf Proceeding Ser, pp. 99\u2013103. https:\/\/doi.org\/10.1145\/3163080.3163101","DOI":"10.1145\/3163080.3163101"},{"key":"15981_CR382","doi-asserted-by":"crossref","unstructured":"Zhang S, Benenson R and Schiele B 2017 CityPersons: A Diverse Dataset for Pedestrian Detection. In: 2017 IEEE Conference on Computer Vision and Pattern Recognition (CVPR). IEEE, pp. 4457\u20134465","DOI":"10.1109\/CVPR.2017.474"},{"key":"15981_CR383","doi-asserted-by":"crossref","unstructured":"Zhang S, Zhu X, Lei Z, et al 2017 S^3FD: Single Shot Scale-Invariant Face Detector. In: 2017 IEEE International Conference on Computer Vision (ICCV). IEEE, pp. 192\u2013201","DOI":"10.1109\/ICCV.2017.30"},{"issue":"6\u20137","key":"15981_CR384","doi-asserted-by":"publisher","first-page":"537","DOI":"10.1007\/s11263-019-01159-3","volume":"127","author":"S Zhang","year":"2019","unstructured":"Zhang S, Wen L, Shi H et al (2019) Single-Shot Scale-Aware Network for Real-Time Face Detection. Int J Comput Vis 127(6\u20137):537\u2013559. https:\/\/doi.org\/10.1007\/s11263-019-01159-3","journal-title":"Int J Comput Vis"},{"key":"15981_CR385","doi-asserted-by":"publisher","unstructured":"Zhang W, Liu X, Yuan J, et al 2019 RCNN-based foreign object detection for securing power transmission lines (RCNN4SPTL). Procedia Comput Sci 147:331\u2013337. https:\/\/doi.org\/10.1016\/j.procs.2019.01.232","DOI":"10.1016\/j.procs.2019.01.232"},{"key":"15981_CR386","doi-asserted-by":"publisher","unstructured":"Zhang J, Wu X, Hoi SCH and Zhu J 2020 Feature agglomeration networks for single stage face detection. Neurocomputing 380:180\u2013189. https:\/\/doi.org\/10.1016\/j.neucom.2019.10.087","DOI":"10.1016\/j.neucom.2019.10.087"},{"key":"15981_CR387","doi-asserted-by":"publisher","unstructured":"Zhang J, Xie Z, Sun J et al (2020) A Cascaded R-CNN With Multiscale Attention and Imbalanced Samples for Traffic Sign Detection. IEEE Access 8:29742\u201329754. https:\/\/doi.org\/10.1109\/ACCESS.2020.2972338","DOI":"10.1109\/ACCESS.2020.2972338"},{"key":"15981_CR388","doi-asserted-by":"crossref","unstructured":"Zhang M, Liu T, Piao Y, et al 2021 Auto-MSFNet: Search Multi-scale Fusion Network for Salient Object Detection. In: Proceedings of the 29th ACM International Conference on Multimedia. ACM, New York, NY, USA, 667\u2013676","DOI":"10.1145\/3474085.3475231"},{"issue":"8","key":"15981_CR389","doi-asserted-by":"publisher","first-page":"5633","DOI":"10.1007\/s10462-021-09967-1","volume":"54","author":"W Zhang","year":"2021","unstructured":"Zhang W, Li H, Li Y et al (2021) Application of deep learning algorithms in geotechnical engineering: a short critical review. Artif Intell Rev 54(8):5633\u20135673. https:\/\/doi.org\/10.1007\/s10462-021-09967-1","journal-title":"Artif Intell Rev"},{"issue":"S1","key":"15981_CR390","doi-asserted-by":"publisher","first-page":"142","DOI":"10.1080\/21642583.2020.1824132","volume":"9","author":"X Zhang","year":"2021","unstructured":"Zhang X, Wang W, Zhao Y, Xie H (2021) An improved YOLOv3 model based on skipping connections and spatial pyramid pooling. Syst Sci Control Eng 9(S1):142\u2013149. https:\/\/doi.org\/10.1080\/21642583.2020.1824132","journal-title":"Syst Sci Control Eng"},{"key":"15981_CR391","doi-asserted-by":"publisher","unstructured":"Zhang X, Liu Y, Huo C, et al 2022 PSNet: Perspective-sensitive convolutional network for object detection. Neurocomputing 468:384\u2013395. https:\/\/doi.org\/10.1016\/j.neucom.2021.10.068","DOI":"10.1016\/j.neucom.2021.10.068"},{"issue":"c","key":"15981_CR392","doi-asserted-by":"publisher","first-page":"43607","DOI":"10.1109\/ACCESS.2019.2908016","volume":"7","author":"W Zhao","year":"2019","unstructured":"Zhao W, Ma W, Jiao L et al (2019) Multi-Scale Image Block-Level F-CNN for Remote Sensing Images Object Detection. IEEE. Access 7(c):43607\u201343621. https:\/\/doi.org\/10.1109\/ACCESS.2019.2908016","journal-title":"Access"},{"issue":"11","key":"15981_CR393","doi-asserted-by":"publisher","first-page":"3212","DOI":"10.1109\/TNNLS.2018.2876865","volume":"30","author":"Z-QQ Zhao","year":"2019","unstructured":"Zhao Z-QQ, Zheng P, Xu S-TT, Wu X (2019) Object Detection With Deep Learning: A Review. IEEE Trans Neural Networks Learn Syst 30(11):3212\u20133232. https:\/\/doi.org\/10.1109\/TNNLS.2018.2876865","journal-title":"IEEE Trans Neural Networks Learn Syst"},{"issue":"15","key":"15981_CR394","doi-asserted-by":"publisher","first-page":"5764","DOI":"10.1080\/01431161.2021.1931537","volume":"42","author":"X Zhao","year":"2021","unstructured":"Zhao X, Zhang J, Tian J et al (2021) Multiscale object detection in high-resolution remote sensing images via rotation invariant deep features driven by channel attention. Int J Remote Sens 42(15):5764\u20135783. https:\/\/doi.org\/10.1080\/01431161.2021.1931537","journal-title":"Int J Remote Sens"},{"key":"15981_CR395","doi-asserted-by":"crossref","unstructured":"Zhiqiang W and Jun L 2017 A review of object detection based on convolutional neural network. In: 2017 36th Chinese Control Conference (CCC). IEEE, 11104\u201311109","DOI":"10.23919\/ChiCC.2017.8029130"},{"key":"15981_CR396","doi-asserted-by":"publisher","unstructured":"Zhong Z, Sun L and Huo Q 2019 Improved localization accuracy by LocNet for Faster R-CNN based text detection in natural scene images. Pattern Recognit 96:106986. https:\/\/doi.org\/10.1016\/j.patcog.2019.106986","DOI":"10.1016\/j.patcog.2019.106986"},{"issue":"3","key":"15981_CR397","doi-asserted-by":"publisher","first-page":"315","DOI":"10.1007\/s10032-019-00335-y","volume":"22","author":"Z Zhong","year":"2019","unstructured":"Zhong Z, Sun L, Huo Q (2019) An anchor-free region proposal network for Faster R-CNN-based text detection approaches. Int J Doc Anal Recognit 22(3):315\u2013327. https:\/\/doi.org\/10.1007\/s10032-019-00335-y","journal-title":"Int J Doc Anal Recognit"},{"key":"15981_CR398","doi-asserted-by":"crossref","unstructured":"Zhou P, Han X, Morariu VI and Davis LS 2017 Two-Stream Neural Networks for Tampered Face Detection. In: 2017 IEEE Conference on Computer Vision and Pattern Recognition Workshops (CVPRW). IEEE, 1831\u20131839","DOI":"10.1109\/CVPRW.2017.229"},{"issue":"1","key":"15981_CR399","doi-asserted-by":"publisher","first-page":"37","DOI":"10.1007\/s41095-020-0199-z","volume":"7","author":"T Zhou","year":"2021","unstructured":"Zhou T, Fan DP, Cheng MM et al (2021) RGB-D salient object detection: A survey. Comput Vis Media 7(1):37\u201369. https:\/\/doi.org\/10.1007\/s41095-020-0199-z","journal-title":"Comput Vis Media"},{"key":"15981_CR400","doi-asserted-by":"publisher","unstructured":"Zhu Y and Du J 2021 TextMountain: Accurate scene text detection via instance segmentation. Pattern Recognit 110:107336. https:\/\/doi.org\/10.1016\/j.patcog.2020.107336","DOI":"10.1016\/j.patcog.2020.107336"},{"key":"15981_CR401","doi-asserted-by":"publisher","unstructured":"Zhu Y and Jiang Y 2020 Optimization of face recognition algorithm based on deep learning multi feature fusion driven by big data. Image Vis Comput 104:104023. https:\/\/doi.org\/10.1016\/j.imavis.2020.104023","DOI":"10.1016\/j.imavis.2020.104023"},{"key":"15981_CR402","doi-asserted-by":"crossref","unstructured":"Zhu H, Chen X, Dai W, et al 2015 Orientation robust object detection in aerial images using deep convolutional neural network. In: 2015 IEEE International Conference on Image Processing (ICIP). IEEE, pp. 3735\u20133739","DOI":"10.1109\/ICIP.2015.7351502"},{"key":"15981_CR403","doi-asserted-by":"crossref","unstructured":"Zhu Z, Liang D, Zhang S, et al 2016 Traffic-Sign Detection and Classification in the Wild. In: 2016 IEEE Conference on Computer Vision and Pattern Recognition (CVPR). IEEE, pp. 2110\u20132118","DOI":"10.1109\/CVPR.2016.232"},{"issue":"10","key":"15981_CR404","doi-asserted-by":"publisher","first-page":"959","DOI":"10.1080\/2150704X.2019.1633486","volume":"10","author":"H Zhu","year":"2019","unstructured":"Zhu H, Zhang P, Wang L et al (2019) A multiscale object detection approach for remote sensing images based on MSE-DenseNet and the dynamic anchor assignment. Remote Sens Lett 10(10):959\u2013967. https:\/\/doi.org\/10.1080\/2150704X.2019.1633486","journal-title":"Remote Sens Lett"},{"key":"15981_CR405","first-page":"391","volume-title":"Lecture Notes in Computer Science (including subseries Lecture Notes in Artificial Intelligence and Lecture Notes in Bioinformatics)","author":"CL Zitnick","year":"2014","unstructured":"Zitnick CL, Doll\u00e1r P (2014) Edge Boxes: Locating Object Proposals from Edges. In: Lecture Notes in Computer Science (including subseries Lecture Notes in Artificial Intelligence and Lecture Notes in Bioinformatics). Springer, pp 391\u2013405"},{"issue":"3","key":"15981_CR406","doi-asserted-by":"publisher","first-page":"1100","DOI":"10.1109\/TIP.2017.2773199","volume":"27","author":"Z Zou","year":"2018","unstructured":"Zou Z, Shi Z (2018) Random access memories: A new paradigm for target detection in high resolution aerial remote sensing images. IEEE Trans Image Process 27(3):1100\u20131111. https:\/\/doi.org\/10.1109\/TIP.2017.2773199","journal-title":"IEEE Trans Image Process"},{"key":"15981_CR407","unstructured":"Zou Z, Shi Z, Guo Y and Ye J 2019 Object Detection in 20 Years: A Survey. 1\u201339"}],"container-title":["Multimedia Tools and Applications"],"original-title":[],"language":"en","link":[{"URL":"https:\/\/link.springer.com\/content\/pdf\/10.1007\/s11042-023-15981-y.pdf","content-type":"application\/pdf","content-version":"vor","intended-application":"text-mining"},{"URL":"https:\/\/link.springer.com\/article\/10.1007\/s11042-023-15981-y\/fulltext.html","content-type":"text\/html","content-version":"vor","intended-application":"text-mining"},{"URL":"https:\/\/link.springer.com\/content\/pdf\/10.1007\/s11042-023-15981-y.pdf","content-type":"application\/pdf","content-version":"vor","intended-application":"similarity-checking"}],"deposited":{"date-parts":[[2024,10,22]],"date-time":"2024-10-22T22:06:27Z","timestamp":1729634787000},"score":1,"resource":{"primary":{"URL":"https:\/\/link.springer.com\/10.1007\/s11042-023-15981-y"}},"subtitle":[],"short-title":[],"issued":{"date-parts":[[2023,6,24]]},"references-count":407,"journal-issue":{"issue":"4","published-print":{"date-parts":[[2024,1]]}},"alternative-id":["15981"],"URL":"https:\/\/doi.org\/10.1007\/s11042-023-15981-y","relation":{},"ISSN":["1380-7501","1573-7721"],"issn-type":[{"value":"1380-7501","type":"print"},{"value":"1573-7721","type":"electronic"}],"subject":[],"published":{"date-parts":[[2023,6,24]]},"assertion":[{"value":"30 December 2022","order":1,"name":"received","label":"Received","group":{"name":"ArticleHistory","label":"Article History"}},{"value":"27 May 2023","order":2,"name":"revised","label":"Revised","group":{"name":"ArticleHistory","label":"Article History"}},{"value":"2 June 2023","order":3,"name":"accepted","label":"Accepted","group":{"name":"ArticleHistory","label":"Article History"}},{"value":"24 June 2023","order":4,"name":"first_online","label":"First Online","group":{"name":"ArticleHistory","label":"Article History"}},{"order":1,"name":"Ethics","group":{"name":"EthicsHeading","label":"Declarations"}},{"value":"The authors have no conflicts of interest to declare relevant to this article\u2019s content.","order":2,"name":"Ethics","group":{"name":"EthicsHeading","label":"Conflict of Interest"}},{"value":"This article does not contain any studies with human participants or animals performed by the authors.","order":3,"name":"Ethics","group":{"name":"EthicsHeading","label":"Ethical Approval"}}]}}