{"status":"ok","message-type":"work","message-version":"1.0.0","message":{"indexed":{"date-parts":[[2026,6,18]],"date-time":"2026-06-18T21:09:58Z","timestamp":1781816998292,"version":"3.54.5"},"reference-count":221,"publisher":"Springer Science and Business Media LLC","issue":"27","license":[{"start":{"date-parts":[[2022,4,23]],"date-time":"2022-04-23T00:00:00Z","timestamp":1650672000000},"content-version":"tdm","delay-in-days":0,"URL":"https:\/\/www.springernature.com\/gp\/researchers\/text-and-data-mining"},{"start":{"date-parts":[[2022,4,23]],"date-time":"2022-04-23T00:00:00Z","timestamp":1650672000000},"content-version":"vor","delay-in-days":0,"URL":"https:\/\/www.springernature.com\/gp\/researchers\/text-and-data-mining"}],"content-domain":{"domain":["link.springer.com"],"crossmark-restriction":false},"short-container-title":["Multimed Tools Appl"],"published-print":{"date-parts":[[2022,11]]},"DOI":"10.1007\/s11042-022-13153-y","type":"journal-article","created":{"date-parts":[[2022,4,23]],"date-time":"2022-04-23T00:02:20Z","timestamp":1650672140000},"page":"38297-38351","update-policy":"https:\/\/doi.org\/10.1007\/springer_crossmark_policy","source":"Crossref","is-referenced-by-count":174,"title":["Tools, techniques, datasets and application areas for object detection in an image: a review"],"prefix":"10.1007","volume":"81","author":[{"ORCID":"https:\/\/orcid.org\/0000-0001-8819-7327","authenticated-orcid":false,"given":"Jaskirat","family":"Kaur","sequence":"first","affiliation":[],"role":[{"vocabulary":"crossref","role":"author"}]},{"given":"Williamjeet","family":"Singh","sequence":"additional","affiliation":[],"role":[{"vocabulary":"crossref","role":"author"}]}],"member":"297","published-online":{"date-parts":[[2022,4,23]]},"reference":[{"issue":"41\u201342","key":"13153_CR1","doi-asserted-by":"publisher","first-page":"31645","DOI":"10.1007\/s11042-020-09662-3","volume":"79","author":"M Afif","year":"2020","unstructured":"Afif M, Ayachi R, Pissaloux E, Said Y, Atri M (2020) Indoor objects detection and recognition for an ICT mobility assistance of visually impaired people. Multimed Tools Appl 79(41\u201342):31645\u201331662. https:\/\/doi.org\/10.1007\/s11042-020-09662-3","journal-title":"Multimed Tools Appl"},{"issue":"1","key":"13153_CR2","doi-asserted-by":"publisher","first-page":"98","DOI":"10.1007\/s13177-019-00178-1","volume":"18","author":"A Alam","year":"2020","unstructured":"Alam A, Jaffery ZA (2020) Indian Traffic Sign Detection and Recognition. Int J Intell Transp Syst Res 18(1):98\u2013112. https:\/\/doi.org\/10.1007\/s13177-019-00178-1","journal-title":"Int J Intell Transp Syst Res"},{"key":"13153_CR3","doi-asserted-by":"publisher","unstructured":"Bach M, Stumper D, Dietmayer K (2018) Deep Convolutional Traffic Light Recognition for Automated Driving, in 2018 21st International Conference on Intelligent Transportation Systems (ITSC), IEEE, vol. 2018-Novem, 851\u2013858, https:\/\/doi.org\/10.1109\/ITSC.2018.8569522","DOI":"10.1109\/ITSC.2018.8569522"},{"key":"13153_CR4","doi-asserted-by":"publisher","unstructured":"Banerjee K, Notz D, Windelen J, Gavarraju S, He M (2018) Online Camera LiDAR Fusion and Object Detection on Hybrid Data for Autonomous Driving, in 2018 IEEE Intelligent Vehicles Symposium (IV), IEEE, vol. 2018-June, no. Iv, 1632\u20131638, https:\/\/doi.org\/10.1109\/IVS.2018.8500699","DOI":"10.1109\/IVS.2018.8500699"},{"key":"13153_CR5","doi-asserted-by":"publisher","unstructured":"Becker BC, Ortiz EG (2008) Evaluation of face recognition techniques for application to facebook, in 2008 8th IEEE International Conference on Automatic Face & Gesture Recognition, IEEE, pp. 1\u20136, https:\/\/doi.org\/10.1109\/AFGR.2008.4813471","DOI":"10.1109\/AFGR.2008.4813471"},{"key":"13153_CR6","doi-asserted-by":"publisher","unstructured":"Behrendt K, Novak L, Botros R (2017) A deep learning approach to traffic lights: Detection, tracking, and classification, in 2017 IEEE International Conference on Robotics and Automation (ICRA), IEEE, 1370\u20131377, https:\/\/doi.org\/10.1109\/ICRA.2017.7989163","DOI":"10.1109\/ICRA.2017.7989163"},{"key":"13153_CR7","doi-asserted-by":"publisher","unstructured":"Bhandari A, Prasad PWC, Alsadoon A, Maag A (2021) Object detection and recognition: using deep learning to assist the visually impaired, Disabil Rehabil Assist Technol, 1\u20139, 2019, Taylor & Francis, https:\/\/doi.org\/10.1080\/17483107.2019.1673834","DOI":"10.1080\/17483107.2019.1673834"},{"issue":"2019","key":"13153_CR8","doi-asserted-by":"publisher","first-page":"770","DOI":"10.1016\/j.procs.2020.04.084","volume":"171","author":"U Bhangale","year":"2020","unstructured":"Bhangale U, Patil S, Vishwanath V, Thakker P, Bansode A, Navandhar D (2020, Elsevier B.V.) Near real-time crowd counting using deep learning approach. Procedia Comput Sci 171(2019):770\u2013779. https:\/\/doi.org\/10.1016\/j.procs.2020.04.084","journal-title":"Procedia Comput Sci"},{"key":"13153_CR9","unstructured":"Bochkovskiy A, Wang C, Liao HM (2020) YOLOv4: Optimal Speed and Accuracy of Object Detection, [Online]. Available: http:\/\/arxiv.org\/abs\/2004.10934"},{"key":"13153_CR10","doi-asserted-by":"publisher","unstructured":"Bouras C, Michos E (2022) An online real-time face recognition system for police purposes, in 2022 International Conference on Information Networking (ICOIN), IEEE, pp. 62\u201367, https:\/\/doi.org\/10.1109\/ICOIN53446.2022.9687212","DOI":"10.1109\/ICOIN53446.2022.9687212"},{"issue":"9","key":"13153_CR11","doi-asserted-by":"publisher","first-page":"6721","DOI":"10.1007\/s00500-019-04307-6","volume":"24","author":"A Bouti","year":"2020","unstructured":"Bouti A, Mahraz MA, Riffi J, Tairi H (2020, Springer Berlin Heidelberg) A robust system for road sign detection and classification using LeNet architecture based on convolutional neural network. Soft Comput 24(9):6721\u20136733. https:\/\/doi.org\/10.1007\/s00500-019-04307-6","journal-title":"Soft Comput"},{"issue":"8","key":"13153_CR12","doi-asserted-by":"publisher","first-page":"1844","DOI":"10.1109\/TPAMI.2019.2897684","volume":"41","author":"M Braun","year":"2019","unstructured":"Braun M, Krebs S, Flohr F, Gavrila DM (2019, IEEE) EuroCity Persons: A Novel Benchmark for Person Detection in Traffic Scenes. IEEE Trans Pattern Anal Mach Intell 41(8):1844\u20131861. https:\/\/doi.org\/10.1109\/TPAMI.2019.2897684","journal-title":"IEEE Trans Pattern Anal Mach Intell"},{"key":"13153_CR13","doi-asserted-by":"publisher","unstructured":"Caesar H et al. (2020) nuScenes: A multimodal dataset for autonomous driving, in 2020 IEEE\/CVF Conference on Computer Vision and Pattern Recognition (CVPR), IEEE, no. March, pp 11618\u201311628, https:\/\/doi.org\/10.1109\/CVPR42600.2020.01164","DOI":"10.1109\/CVPR42600.2020.01164"},{"key":"13153_CR14","doi-asserted-by":"publisher","unstructured":"Ch\u2019ng CK, Chan CS (2017) Total-Text: a comprehensive dataset for scene text detection and recognition, in 2017 14th IAPR International Conference on Document Analysis and Recognition (ICDAR), IEEE, pp. 935\u2013942, https:\/\/doi.org\/10.1109\/ICDAR.2017.157","DOI":"10.1109\/ICDAR.2017.157"},{"key":"13153_CR15","doi-asserted-by":"publisher","unstructured":"Chatterjee S, Zunjani FH, Nandi GC (2020) Real-time object detection and recognition on low-compute humanoid robots using deep learning, in 2020 6th International Conference on Control, Automation and Robotics (ICCAR), IEEE, pp. 202\u2013208, https:\/\/doi.org\/10.1109\/ICCAR49639.2020.9108054.","DOI":"10.1109\/ICCAR49639.2020.9108054"},{"key":"13153_CR16","doi-asserted-by":"publisher","unstructured":"Chen IK, Chi CY, Hsu SL, Chen LG (2014) A real-time system for object detection and location reminding with RGB-D camera, 2014 IEEE Int.Conf Consum. Electron., 412\u2013413, https:\/\/doi.org\/10.1109\/ICCE.2014.6776063","DOI":"10.1109\/ICCE.2014.6776063"},{"issue":"1","key":"13153_CR17","doi-asserted-by":"publisher","first-page":"83","DOI":"10.1080\/07038992.2021.1894915","volume":"47","author":"Z Chen","year":"2021","unstructured":"Chen Z, Luo R, Li J, Du J, Wang C (2021, Taylor & Francis) U-Net based road area guidance for crosswalks detection from remote sensing images. Can J Remote Sens 47(1):83\u201399. https:\/\/doi.org\/10.1080\/07038992.2021.1894915","journal-title":"Can J Remote Sens"},{"key":"13153_CR18","doi-asserted-by":"publisher","unstructured":"Chen Y, Wang W, Zhou Y, Yang F, Yang D, Wang W (2021) Self-training for domain adaptive scene text detection, in 2020 25th International Conference on Pattern Recognition (ICPR), IEEE, pp. 850\u2013857, https:\/\/doi.org\/10.1109\/ICPR48806.2021.9412558","DOI":"10.1109\/ICPR48806.2021.9412558"},{"issue":"4","key":"13153_CR19","doi-asserted-by":"publisher","first-page":"1121","DOI":"10.1007\/s11263-020-01412-0","volume":"129","author":"Z Chen","year":"2021","unstructured":"Chen Z, Ouyang W, Liu T, Tao D (2021, Springer US) A shape transformation-based dataset augmentation framework for pedestrian detection. Int J Comput Vis 129(4):1121\u20131138. https:\/\/doi.org\/10.1007\/s11263-020-01412-0","journal-title":"Int J Comput Vis"},{"key":"13153_CR20","doi-asserted-by":"publisher","unstructured":"Cheng G, Han J (2016) A survey on object detection in optical remote sensing images, ISPRS J Photogramm Remote Sens, 117, 11\u201328, Elsevier, https:\/\/doi.org\/10.1016\/j.isprsjprs.2016.03.014.","DOI":"10.1016\/j.isprsjprs.2016.03.014"},{"key":"13153_CR21","doi-asserted-by":"publisher","unstructured":"Cordts M et al. (2016) The Cityscapes Dataset for Semantic Urban Scene Understanding, in 2016 IEEE conference on computer vision and pattern recognition (CVPR), IEEE, 29(5), 3213\u20133223, https:\/\/doi.org\/10.1109\/CVPR.2016.350.","DOI":"10.1109\/CVPR.2016.350"},{"key":"13153_CR22","doi-asserted-by":"publisher","unstructured":"Dalal N, Triggs B (2005) Histograms of oriented gradients for human detection, in 2005 IEEE computer society conference on computer vision and pattern recognition (CVPR\u201905), IEEE, pp. 886\u2013893, https:\/\/doi.org\/10.1109\/CVPR.2005.177","DOI":"10.1109\/CVPR.2005.177"},{"key":"13153_CR23","unstructured":"Dam GC, Management A (2019) U. S. Geological survey grand canyon monitoring fiscal year 2019 Annual Project Report to the Glen Canyon Dam Adaptive Management"},{"key":"13153_CR24","doi-asserted-by":"crossref","unstructured":"Dasiopoulou S, Giannakidou E, Litos G, Malasioti P, Kompatsiaris Y (2011) A survey of semantic image and video annotation tools, in Lecture Notes in Computer Science (including subseries Lecture Notes in Artificial Intelligence and Lecture Notes in Bioinformatics), vol. LNAI 6050, Springer, Springer, pp. 196\u2013239","DOI":"10.1007\/978-3-642-20795-2_8"},{"key":"13153_CR25","doi-asserted-by":"publisher","unstructured":"de Charette R, Nashashibi F (2009) Traffic light recognition using image processing compared to learning processes, in 2009 IEEE\/RSJ International Conference on Intelligent Robots and Systems, IEEE, pp. 333\u2013338, https:\/\/doi.org\/10.1109\/IROS.2009.5353941","DOI":"10.1109\/IROS.2009.5353941"},{"key":"13153_CR26","doi-asserted-by":"publisher","unstructured":"Deng J, Dong W, Socher R, Li L-J, Li K, Fei-Fei L (2009) ImageNet: A large-scale hierarchical image database, in 2009 IEEE conference on computer vision and pattern recognition, IEEE, 248\u2013255, https:\/\/doi.org\/10.1109\/CVPR.2009.5206848","DOI":"10.1109\/CVPR.2009.5206848"},{"issue":"19","key":"13153_CR27","doi-asserted-by":"publisher","first-page":"14429","DOI":"10.1007\/s00500-020-04795-x","volume":"24","author":"S Dhivya","year":"2020","unstructured":"Dhivya S, Sangeetha J, Sudhakar B (2020, Springer Berlin Heidelberg) Copy-move forgery detection using SURF feature extraction and SVM supervised learning technique. Soft Comput 24(19):14429\u201314440. https:\/\/doi.org\/10.1007\/s00500-020-04795-x","journal-title":"Soft Comput"},{"key":"13153_CR28","doi-asserted-by":"publisher","unstructured":"Dollar P, Wojek C, Schiele B, Perona P (2009) Pedestrian detection: A benchmark, in 2009 IEEE Conference on Computer Vision and Pattern Recognition, IEEE, 304\u2013311, https:\/\/doi.org\/10.1109\/CVPR.2009.5206631","DOI":"10.1109\/CVPR.2009.5206631"},{"key":"13153_CR29","doi-asserted-by":"publisher","unstructured":"Dollar P, Wojek C, Schiele B, Perona P (2012) Pedestrian detection: an evaluation of the state of the art, in IEEE transactions on pattern analysis and machine intelligence 34(4), 743\u2013761, https:\/\/doi.org\/10.1109\/TPAMI.2011.155","DOI":"10.1109\/TPAMI.2011.155"},{"key":"13153_CR30","doi-asserted-by":"publisher","unstructured":"Dominguez-Sanchez A, Orts-Escolano S, Garcia-Rodriguez J, Cazorla M (2018) A New Dataset and Performance Evaluation of a Region-based CNN for Urban Object Detection, in 2018 International Joint Conference on Neural Networks (IJCNN), IEEE, pp. 1\u20138, https:\/\/doi.org\/10.1109\/IJCNN.2018.8489478.","DOI":"10.1109\/IJCNN.2018.8489478"},{"key":"13153_CR31","doi-asserted-by":"publisher","unstructured":"Du F, Wang WL, Zhang Z (2020) Pedestrian detection based on a hybrid Gaussian model and support vector machine, Enterp Inf Syst, 1\u201312, Taylor & Francis, https:\/\/doi.org\/10.1080\/17517575.2020.1791363.","DOI":"10.1080\/17517575.2020.1791363"},{"key":"13153_CR32","doi-asserted-by":"publisher","unstructured":"Dutta A, Zisserman A (2019) The VIA Annotation Software for Images, Audio and Video, in Proceedings of the 27th ACM International Conference on Multimedia, ACM, pp. 2276\u20132279, https:\/\/doi.org\/10.1145\/3343031.3350535.","DOI":"10.1145\/3343031.3350535"},{"key":"13153_CR33","unstructured":"Ertler C, Mislej J, Ollmann T, Porzi L, Neuhold G, Kuang Y (2019) The Mapillary Traffic Sign Dataset for Detection and Classification on a Global Scale, Comput Vis Pattern Recognit, 1\u201317, [Online]. Available: http:\/\/arxiv.org\/abs\/1909.04422"},{"key":"13153_CR34","doi-asserted-by":"publisher","unstructured":"Everingham M et al. (2006) The 2005 PASCAL Visual Object Classes Challenge, in Machine Learning Challenges. Evaluating Predictive Uncertainty, Visual Object Classification, and Recognising Tectual Entailment. MLCW 2005. Lecture Notes in Computer Science, Springer Berlin Heidelberg, vol. 3944 LNAI, pp. 117\u2013176, https:\/\/doi.org\/10.1007\/11736790_8.","DOI":"10.1007\/11736790_8"},{"issue":"2","key":"13153_CR35","doi-asserted-by":"publisher","first-page":"303","DOI":"10.1007\/s11263-009-0275-4","volume":"88","author":"M Everingham","year":"2010","unstructured":"Everingham M, Van Gool L, Williams CKI, Winn J, Zisserman A (2010) The Pascal visual object classes (VOC) challenge. Int J Comput Vis 88(2):303\u2013338. https:\/\/doi.org\/10.1007\/s11263-009-0275-4","journal-title":"Int J Comput Vis"},{"issue":"1","key":"13153_CR36","doi-asserted-by":"publisher","first-page":"98","DOI":"10.1007\/s11263-014-0733-5","volume":"111","author":"M Everingham","year":"2015","unstructured":"Everingham M, Eslami SMA, Van Gool L, Williams CKI, Winn J, Zisserman A (2015, Springer) The pascal visual object classes challenge: A Retrospective. Int J Comput Vis 111(1):98\u2013136. https:\/\/doi.org\/10.1007\/s11263-014-0733-5","journal-title":"Int J Comput Vis"},{"key":"13153_CR37","doi-asserted-by":"publisher","unstructured":"Felzenszwalb P, McAllester D, Ramanan D (2008) A discriminatively trained, multiscale, deformable part model, in 2008 IEEE conference on computer vision and pattern recognition, IEEE, 1\u20138, https:\/\/doi.org\/10.1109\/CVPR.2008.4587597","DOI":"10.1109\/CVPR.2008.4587597"},{"key":"13153_CR38","doi-asserted-by":"publisher","unstructured":"Fregin A, Muller J, Krebel U, Dietmayer K (2018) The DriveU Traffic Light Dataset: Introduction and Comparison with Existing Datasets, in 2018 IEEE International Conference on Robotics and Automation (ICRA), IEEE, 3376\u20133383, https:\/\/doi.org\/10.1109\/ICRA.2018.8460737","DOI":"10.1109\/ICRA.2018.8460737"},{"key":"13153_CR39","doi-asserted-by":"publisher","unstructured":"Fu M, Huang Y (2010) A survey of traffic sign recognition, in 2010 International Conference on Wavelet Analysis and Pattern Recognition, IEEE, pp. 119\u2013124, https:\/\/doi.org\/10.1109\/ICWAPR.2010.5576425","DOI":"10.1109\/ICWAPR.2010.5576425"},{"issue":"January","key":"13153_CR40","doi-asserted-by":"publisher","first-page":"294","DOI":"10.1016\/j.isprsjprs.2020.01.025","volume":"161","author":"K Fu","year":"2020","unstructured":"Fu K, Chang Z, Zhang Y, Xu G, Zhang K, Sun X (2020, Elsevier) Rotation-aware and multi-scale convolutional neural network for object detection in remote sensing images. ISPRS J Photogramm Remote Sens 161(January):294\u2013308. https:\/\/doi.org\/10.1016\/j.isprsjprs.2020.01.025","journal-title":"ISPRS J Photogramm Remote Sens"},{"issue":"17\u201318","key":"13153_CR41","doi-asserted-by":"publisher","first-page":"12615","DOI":"10.1007\/s11042-019-08523-y","volume":"79","author":"J Fu","year":"2020","unstructured":"Fu J, Zhao C, Xia Y, Liu W (2020) Vehicle and wheel detection: a novel SSD-based approach and associated large-scale benchmark dataset. Multimed Tools Appl 79(17\u201318):12615\u201312634. https:\/\/doi.org\/10.1007\/s11042-019-08523-y","journal-title":"Multimed Tools Appl"},{"key":"13153_CR42","unstructured":"Fu C, Liu W, Ranga A, Tyagi A, Berg AC (n.d.) DSSD : Deconvolutional Single Shot Detector"},{"key":"13153_CR43","doi-asserted-by":"publisher","unstructured":"Gawande U, Hajari K, Golhar Y (2022) SIRA: scale illumination rotation affine invariant mask R-CNN for pedestrian detection. Appl Intell, no. 0123456789, Springer US, https:\/\/doi.org\/10.1007\/s10489-021-03073-z.","DOI":"10.1007\/s10489-021-03073-z"},{"key":"13153_CR44","doi-asserted-by":"publisher","first-page":"272","DOI":"10.1016\/j.neucom.2021.07.094","volume":"462","author":"Z Ge","year":"2021","unstructured":"Ge Z, Wang J, Huang X, Liu S, Yoshie O (2021, Elsevier) LLA: loss-aware label assignment for dense pedestrian detection. Neurocomputing 462:272\u2013281. https:\/\/doi.org\/10.1016\/j.neucom.2021.07.094","journal-title":"Neurocomputing"},{"key":"13153_CR45","doi-asserted-by":"publisher","unstructured":"Geiger A, Lenz P, Urtasun R (2012) Are we ready for autonomous driving? The KITTI vision benchmark suite\u201d, in 2012 IEEE conference on computer vision and pattern recognition, IEEE, pp. 3354\u20133361, https:\/\/doi.org\/10.1109\/CVPR.2012.6248074","DOI":"10.1109\/CVPR.2012.6248074"},{"key":"13153_CR46","doi-asserted-by":"publisher","unstructured":"Girshick R (2015) Fast R-CNN, in 2015 IEEE International Conference on Computer Vision (ICCV), IEEE, pp. 1440\u20131448, https:\/\/doi.org\/10.1109\/ICCV.2015.169","DOI":"10.1109\/ICCV.2015.169"},{"issue":"1","key":"13153_CR47","doi-asserted-by":"publisher","first-page":"142","DOI":"10.1109\/TPAMI.2015.2437384","volume":"38","author":"R Girshick","year":"2015","unstructured":"Girshick R, Donahue J, Darrell T, Malik J (2015) Region-based convolutional networks for accurate object detection and segmentation. IEEE Trans Pattern Anal Mach Intell 38(1):142\u2013158. https:\/\/doi.org\/10.1109\/TPAMI.2015.2437384","journal-title":"IEEE Trans Pattern Anal Mach Intell"},{"issue":"1","key":"13153_CR48","doi-asserted-by":"publisher","first-page":"8714","DOI":"10.1109\/ACCESS.2018.2801813","volume":"101","author":"BA Godinho De Oliveira","year":"2018","unstructured":"Godinho De Oliveira BA, Ferreira FMF, Martins CAPDS (2018) Fast and lightweight object detection network: detection and recognition on resource constrained devices. IEEE Access 101(1):8714\u20138724. https:\/\/doi.org\/10.1109\/ACCESS.2018.2801813","journal-title":"IEEE Access"},{"key":"13153_CR49","doi-asserted-by":"publisher","unstructured":"Grosicki E, El-Abed H (2011) ICDAR 2011 - French Handwriting Recognition Competition, in 2011 International Conference on Document Analysis and Recognition, IEEE, pp. 1459\u20131463, https:\/\/doi.org\/10.1109\/ICDAR.2011.290","DOI":"10.1109\/ICDAR.2011.290"},{"key":"13153_CR50","doi-asserted-by":"publisher","first-page":"108063","DOI":"10.1016\/j.patcog.2021.108063","volume":"119","author":"Z Guo","year":"2021","unstructured":"Guo Z, Liao W, Xiao Y, Veelaert P, Philips W (2021, Elsevier) Weak segmentation supervised deep neural networks for pedestrian detection. Pattern Recognit 119:108063. https:\/\/doi.org\/10.1016\/j.patcog.2021.108063","journal-title":"Pattern Recognit"},{"issue":"3","key":"13153_CR51","doi-asserted-by":"publisher","first-page":"447","DOI":"10.1007\/s00371-020-01814-8","volume":"37","author":"S Gupta","year":"2021","unstructured":"Gupta S, Thakur K, Kumar M (2021, Springer) 2D-human face recognition using SIFT and SURF descriptors of face\u2019s feature regions. Vis Comput 37(3):447\u2013456. https:\/\/doi.org\/10.1007\/s00371-020-01814-8","journal-title":"Vis Comput"},{"key":"13153_CR52","doi-asserted-by":"publisher","unstructured":"Hadid A, Heikkila JY, Silven O, Pietikainen M (2007) Face and Eye Detection for Person Authentication in Mobile Phones, in 2007 First ACM\/IEEE International Conference on Distributed Smart Cameras, IEEE, pp. 101\u2013108, https:\/\/doi.org\/10.1109\/ICDSC.2007.4357512","DOI":"10.1109\/ICDSC.2007.4357512"},{"key":"13153_CR53","unstructured":"Halaschek-Wiener C, Golbeck J, Schain A, Grove M, Parsia B, Hendler J (2005) Photostuff - an image annotation tool for the semantic web, 4th Int. Semant. Web Conf. Poster Pap., pp. 2\u20134"},{"issue":"1","key":"13153_CR54","doi-asserted-by":"publisher","first-page":"84","DOI":"10.1109\/MSP.2017.2749125","volume":"35","author":"J Han","year":"2018","unstructured":"Han J, Zhang D, Cheng G, Liu N, Xu D (2018) Advanced deep-learning techniques for salient and category-specific object detection: a survey. IEEE Signal Process Mag 35(1):84\u2013100. https:\/\/doi.org\/10.1109\/MSP.2017.2749125","journal-title":"IEEE Signal Process Mag"},{"issue":"10","key":"13153_CR55","doi-asserted-by":"publisher","first-page":"13263","DOI":"10.1007\/s11042-018-6428-0","volume":"78","author":"C Han","year":"2019","unstructured":"Han C, Gao G, Zhang Y (2019) Real-time small traffic sign detection with revised faster-RCNN. Multimed Tools Appl 78(10):13263\u201313278. https:\/\/doi.org\/10.1007\/s11042-018-6428-0","journal-title":"Multimed Tools Appl"},{"key":"13153_CR56","doi-asserted-by":"publisher","unstructured":"Harzallah H, Jurie F, Schmid C (2009) Combining efficient object localization and image classification, in 2009 IEEE 12th International Conference on Computer Vision, IEEE, pp. 237\u2013244, https:\/\/doi.org\/10.1109\/ICCV.2009.5459257","DOI":"10.1109\/ICCV.2009.5459257"},{"issue":"9","key":"13153_CR57","doi-asserted-by":"publisher","first-page":"1904","DOI":"10.1109\/TPAMI.2015.2389824","volume":"37","author":"K He","year":"2015","unstructured":"He K, Zhang X, Ren S, Sun J (Sep. 2015) Spatial pyramid pooling in deep convolutional networks for visual recognition. IEEE Trans Pattern Anal Mach Intell 37(9):1904\u20131916. https:\/\/doi.org\/10.1109\/TPAMI.2015.2389824","journal-title":"IEEE Trans Pattern Anal Mach Intell"},{"key":"13153_CR58","doi-asserted-by":"publisher","first-page":"1","DOI":"10.1016\/j.patcog.2019.107026","volume":"98","author":"W He","year":"2020","unstructured":"He W, Zhang X-Y, Yin F, Luo Z, Ogier J-M, Liu C-L (2020, Elsevier Ltd) Realtime multi-scale scene text detection with scale-based region proposal network. Pattern Recognit 98:1\u201314. https:\/\/doi.org\/10.1016\/j.patcog.2019.107026","journal-title":"Pattern Recognit"},{"issue":"2","key":"13153_CR59","doi-asserted-by":"publisher","first-page":"386","DOI":"10.1109\/TPAMI.2018.284","volume":"42","author":"K He","year":"2020","unstructured":"He K, Gkioxari G, Dollar P, Girshick R (2020) Mask R-CNN. IEEE Trans Pattern Anal Mach Intell 42(2):386\u2013397, IEEE. https:\/\/doi.org\/10.1109\/TPAMI.2018.284","journal-title":"IEEE Trans Pattern Anal Mach Intell"},{"key":"13153_CR60","doi-asserted-by":"publisher","unstructured":"Heitz G, Koller D (2008) Learning spatial context: using stuff to find things, in European conference on computer vision, Springer, Berlin, Heidelberg, 30\u201343, https:\/\/doi.org\/10.1007\/978-3-540-88682-2_4.","DOI":"10.1007\/978-3-540-88682-2_4"},{"issue":"1","key":"13153_CR61","doi-asserted-by":"publisher","first-page":"129","DOI":"10.1007\/s00779-020-01419-x","volume":"25","author":"HA Hosni Mahmoud","year":"2021","unstructured":"Hosni Mahmoud HA, Mengash HA (2021, springer) A novel technique for automated concealed face detection in surveillance videos. Pers Ubiquitous Comput 25(1):129\u2013140. https:\/\/doi.org\/10.1007\/s00779-020-01419-x","journal-title":"Pers Ubiquitous Comput"},{"key":"13153_CR62","doi-asserted-by":"publisher","unstructured":"Houben S, Stallkamp J, Salmen J, Schlipsing M, Igel C (2013) Detection of traffic signs in real-world images: The German traffic sign detection benchmark, in The 2013 International Joint Conference on Neural Networks (IJCNN), IEEE, pp. 1\u20138, https:\/\/doi.org\/10.1109\/IJCNN.2013.6706807","DOI":"10.1109\/IJCNN.2013.6706807"},{"key":"13153_CR63","doi-asserted-by":"publisher","unstructured":"Hu J, Zhao Y, Zhang X (2020) Application of transfer learning in infrared pedestrian detection, in 2020 IEEE 5th International Conference on Image, Vision and Computing (ICIVC), IEEE, pp. 1\u20134, https:\/\/doi.org\/10.1109\/ICIVC50857.2020.9177438","DOI":"10.1109\/ICIVC50857.2020.9177438"},{"key":"13153_CR64","doi-asserted-by":"publisher","first-page":"106495","DOI":"10.1016\/j.asoc.2020.106495","volume":"94","author":"X Hua","year":"2020","unstructured":"Hua X, Wang X, Rui T, Zhang H, Wang D (2020, Elsevier B.V.) A fast self-attention cascaded network for object detection in large scene remote sensing images. Appl Soft Comput 94:106495. https:\/\/doi.org\/10.1016\/j.asoc.2020.106495","journal-title":"Appl Soft Comput"},{"key":"13153_CR65","doi-asserted-by":"publisher","unstructured":"Huang Z et al. (2019) ICDAR2019 competition on scanned receipt OCR and information extraction, Proc Int Conf Doc Anal. Recognition, ICDAR, pp. 1516\u20131520, https:\/\/doi.org\/10.1109\/ICDAR.2019.00244.","DOI":"10.1109\/ICDAR.2019.00244"},{"key":"13153_CR66","doi-asserted-by":"publisher","first-page":"21777","DOI":"10.1109\/ACCESS.2021.3055243","volume":"9","author":"Q Huang","year":"2021","unstructured":"Huang Q, Cai Z, Lan T (2021, IEEE) A single neural network for mixed style license plate detection and recognition. IEEE Access 9:21777\u201321785. https:\/\/doi.org\/10.1109\/ACCESS.2021.3055243","journal-title":"IEEE Access"},{"key":"13153_CR67","doi-asserted-by":"crossref","unstructured":"Hung BT (2021) Face recognition using hybrid HOG-CNN approach, in International Journal of Image and Graphics, 1254, 715\u2013723","DOI":"10.1007\/978-981-15-7527-3_67"},{"issue":"2","key":"13153_CR68","doi-asserted-by":"publisher","first-page":"116","DOI":"10.1007\/s42979-020-00125-y","volume":"1","author":"GL Hung","year":"2020","unstructured":"Hung GL, Bin Sahimi MS, Samma H, Almohamad TA, Lahasan B (2020, Springer) Faster R-CNN deep learning model for pedestrian detection from drone images. SN Comput Sci 1(2):116. https:\/\/doi.org\/10.1007\/s42979-020-00125-y","journal-title":"SN Comput Sci"},{"key":"13153_CR69","doi-asserted-by":"publisher","first-page":"153","DOI":"10.1007\/978-981-16-6636-0_13","volume":"95","author":"MS Irbaz","year":"2022","unstructured":"Irbaz MS, Al Nasim MA, Ferdous RE (2022) Real-time face recognition system for remote employee tracking. Lecture Notes on Data Engineering and Communications Technologies 95:153\u2013163","journal-title":"Lecture Notes on Data Engineering and Communications Technologies"},{"key":"13153_CR70","unstructured":"Jaderberg M, Simonyan K, Vedaldi A, Zisserman A (2014) Synthetic Data and Artificial Neural Networks for Natural Scene Text Recognition, pp. 1\u201310, [Online]. Available: http:\/\/arxiv.org\/abs\/1406.2227"},{"issue":"3","key":"13153_CR71","doi-asserted-by":"publisher","first-page":"125","DOI":"10.12700\/APH.17.3.2020.3.7","volume":"17","author":"J Jakob","year":"2020","unstructured":"Jakob J, Tick J (2020) Camera-based on-road detections for the visually impaired. Acta Polytech Hungarica 17(3):125\u2013146. https:\/\/doi.org\/10.12700\/APH.17.3.2020.3.7","journal-title":"Acta Polytech Hungarica"},{"issue":"1","key":"13153_CR72","doi-asserted-by":"publisher","first-page":"104","DOI":"10.1016\/j.icte.2020.07.008","volume":"7","author":"Y Jamtsho","year":"2021","unstructured":"Jamtsho Y, Riyamongkol P, Waranusast R (2021, Elsevier B.V.) Real-time license plate detection for non-helmeted motorcyclist using YOLO. ICT Express 7(1):104\u2013109. https:\/\/doi.org\/10.1016\/j.icte.2020.07.008","journal-title":"ICT Express"},{"key":"13153_CR73","doi-asserted-by":"publisher","first-page":"107846","DOI":"10.1016\/j.patcog.2021.107846","volume":"115","author":"Y Jin","year":"2021","unstructured":"Jin Y, Zhang Y, Cen Y, Li Y, Mladenovic V, Voronin V (2021, Elsevier Ltd) Pedestrian detection with super-resolution reconstruction for low-quality image. Pattern Recognit 115:107846. https:\/\/doi.org\/10.1016\/j.patcog.2021.107846","journal-title":"Pattern Recognit"},{"key":"13153_CR74","doi-asserted-by":"publisher","unstructured":"Karatzas D, Mestre SR, Mas J, Nourbakhsh F, Roy PP (2011) ICDAR 2011 Robust Reading Competition - Challenge 1: Reading Text in Born-Digital Images (Web and Email), in 2011 International Conference on Document Analysis and Recognition, IEEE, pp. 1485\u20131490, https:\/\/doi.org\/10.1109\/ICDAR.2011.295.","DOI":"10.1109\/ICDAR.2011.295"},{"key":"13153_CR75","doi-asserted-by":"publisher","unstructured":"Kaur RP, Kumar M, Jindal MK (2022) Performance evaluation of different features and classifiers for Gurumukhi newspaper text recognition. J Ambient Intell Humaniz Comput no. 0123456789, Springer, https:\/\/doi.org\/10.1007\/s12652-021-03687-8","DOI":"10.1007\/s12652-021-03687-8"},{"issue":"4","key":"13153_CR76","first-page":"1383","volume":"2","author":"K Khurana","year":"2013","unstructured":"Khurana K, Awasthi R (2013) Techniques for object recognition in images and multi-object detection. Int J Adv Res Comput Eng Technol 2(4):1383\u20131388","journal-title":"Int J Adv Res Comput Eng Technol"},{"key":"13153_CR77","doi-asserted-by":"publisher","unstructured":"Klare BF et al. (2015) Pushing the frontiers of unconstrained face detection and recognition: IARPA Janus Benchmark A, in 2015 IEEE conference on computer vision and pattern recognition (CVPR), IEEE, pp. 1931\u20131939, https:\/\/doi.org\/10.1109\/CVPR.2015.7298803.","DOI":"10.1109\/CVPR.2015.7298803"},{"key":"13153_CR78","doi-asserted-by":"publisher","unstructured":"Kostinger M, Wohlhart P, Roth PM, Bischof H (2011) Annotated Facial Landmarks in the Wild: A large-scale, real-world database for facial landmark localization, in 2011 IEEE International Conference on Computer Vision Workshops (ICCV Workshops), IEEE, pp. 2144\u20132151, https:\/\/doi.org\/10.1109\/ICCVW.2011.6130513","DOI":"10.1109\/ICCVW.2011.6130513"},{"key":"13153_CR79","doi-asserted-by":"publisher","unstructured":"Kumar R, Kumar S, Chand P, Lal S (2014) Object detection and recognition for a pick and place robot, in IEEE Asia-Pacific world congress on computer science and Engineering, 2014, 2\u20139, https:\/\/doi.org\/10.13140\/2.1.4379.2165","DOI":"10.13140\/2.1.4379.2165"},{"issue":"10","key":"13153_CR80","doi-asserted-by":"publisher","first-page":"14565","DOI":"10.1007\/s11042-020-10457-9","volume":"80","author":"A Kumar","year":"2021","unstructured":"Kumar A, Kumar M, Kaur A (2021, Springer) Face detection in still images under occlusion and non-uniform illumination. Multimed Tools Appl 80(10):14565\u201314590. https:\/\/doi.org\/10.1007\/s11042-020-10457-9","journal-title":"Multimed Tools Appl"},{"key":"13153_CR81","doi-asserted-by":"crossref","unstructured":"Kuznetsova A, Maleva T, Soloviev V (2020) Detecting Apples in Orchards Using YOLOv3 and YOLOv5 in General and Close-Up Images, in Neurocomputing, 149, no. Part A, 233\u2013243","DOI":"10.1007\/978-3-030-64221-1_20"},{"issue":"7","key":"13153_CR82","doi-asserted-by":"publisher","first-page":"1956","DOI":"10.1007\/s11263-020-01316-z","volume":"128","author":"A Kuznetsova","year":"2020","unstructured":"Kuznetsova A et al (2020, Springer) The open images dataset V4. Int J Comput Vis 128(7):1956\u20131981. https:\/\/doi.org\/10.1007\/s11263-020-01316-z","journal-title":"Int J Comput Vis"},{"key":"13153_CR83","unstructured":"LabelBox (2018) https:\/\/github.com\/Labelbox\/Labelbox\/blob\/master\/README.md."},{"key":"13153_CR84","unstructured":"Lam D et al. (2018) xView: Objects in Context in Overhead Imagery, [Online]. Available: http:\/\/arxiv.org\/abs\/1802.07856"},{"issue":"22","key":"13153_CR85","doi-asserted-by":"publisher","first-page":"16829","DOI":"10.1007\/s00500-020-04979-5","volume":"24","author":"PS Lamba","year":"2020","unstructured":"Lamba PS, Virmani D, Castillo O (2020, Springer Berlin Heidelberg) Multimodal human eye blink recognition method using feature level fusion for exigency detection. Soft Comput 24(22):16829\u201316845. https:\/\/doi.org\/10.1007\/s00500-020-04979-5","journal-title":"Soft Comput"},{"issue":"4","key":"13153_CR86","doi-asserted-by":"publisher","first-page":"1","DOI":"10.1049\/itr2.12030","volume":"15","author":"R Laroca","year":"2021","unstructured":"Laroca R, Zanlorensi LA, Gon\u00e7alves GR, Todt E, Schwartz WR, Menotti D (2021, wiley) An efficient and layout-independent automatic license plate recognition system based on the YOLO detector. IET Intell Transp Syst 15(4):1\u201321. https:\/\/doi.org\/10.1049\/itr2.12030","journal-title":"IET Intell Transp Syst"},{"key":"13153_CR87","unstructured":"Learned-Miller E, Jain V (2010) FDDB : a benchmark for face detection in unconstrained settings"},{"key":"13153_CR88","doi-asserted-by":"publisher","unstructured":"Li J, Liang X, Wei Y, Xu T, Feng J, Yan S (2017) Perceptual generative adversarial networks for small object detection, in 2017 IEEE Conference on Computer Vision and Pattern Recognition (CVPR), IEEE, 2017, 1951\u20131959, https:\/\/doi.org\/10.1109\/CVPR.2017.211","DOI":"10.1109\/CVPR.2017.211"},{"issue":"2019","key":"13153_CR89","doi-asserted-by":"publisher","first-page":"296","DOI":"10.1016\/j.isprsjprs.2019.11.023","volume":"159","author":"K Li","year":"2020","unstructured":"Li K, Wan G, Cheng G, Meng L, Han J (2020, Elsevier) Object detection in optical remote sensing images: a survey and a new benchmark. ISPRS J Photogramm Remote Sens 159(2019):296\u2013307. https:\/\/doi.org\/10.1016\/j.isprsjprs.2019.11.023","journal-title":"ISPRS J Photogramm Remote Sens"},{"key":"13153_CR90","doi-asserted-by":"crossref","unstructured":"Li F, Luo Z, Huang J, Wang L, Cai J, Huang Y (2020) AlTwo: Vehicle Recognition in foggy weather based on two-step recognition algorithm, in Neurocomputing 149, no. Part A, Springer, Springer, pp. 130\u2013141.","DOI":"10.1007\/978-3-030-64221-1_12"},{"key":"13153_CR91","doi-asserted-by":"publisher","first-page":"411","DOI":"10.1016\/j.neucom.2020.05.108","volume":"415","author":"C Li","year":"2020","unstructured":"Li C et al (2020, Elsevier B.V.) A parallel down-up fusion network for salient object detection in optical remote sensing images. Neurocomputing 415:411\u2013420. https:\/\/doi.org\/10.1016\/j.neucom.2020.05.108","journal-title":"Neurocomputing"},{"issue":"1","key":"13153_CR92","doi-asserted-by":"publisher","first-page":"2","DOI":"10.1007\/s44196-021-00056-3","volume":"15","author":"J Liao","year":"2022","unstructured":"Liao J, Liu Y, Piao Y, Su J, Cai G, Wu Y (2022, Springer) GLE-Net: A global and local ensemble network for aerial object detection. Int J Comput Intell Syst 15(1):2. https:\/\/doi.org\/10.1007\/s44196-021-00056-3","journal-title":"Int J Comput Intell Syst"},{"key":"13153_CR93","doi-asserted-by":"publisher","unstructured":"Lin T-Y, Goyal P, Girshick R, He K, Dollar P (2017) Focal loss for dense object detection, in 2017 IEEE International Conference on Computer Vision (ICCV), IEEE, 2999\u20133007, https:\/\/doi.org\/10.1109\/ICCV.2017.324.","DOI":"10.1109\/ICCV.2017.324"},{"issue":"9","key":"13153_CR94","doi-asserted-by":"publisher","first-page":"1938","DOI":"10.1109\/LGRS.2015.2439517","volume":"12","author":"K Liu","year":"2015","unstructured":"Liu K, Mattyus G (2015) Fast multiclass vehicle detection on aerial images. IEEE Geosci Remote Sens Lett 12(9):1938\u20131942. https:\/\/doi.org\/10.1109\/LGRS.2015.2439517","journal-title":"IEEE Geosci Remote Sens Lett"},{"key":"13153_CR95","doi-asserted-by":"crossref","unstructured":"Liu W et al. (2016) SSD: Single Shot MultiBox Detector, in European conference on computer vision, Springer, Springer, 21\u201337","DOI":"10.1007\/978-3-319-46448-0_2"},{"key":"13153_CR96","doi-asserted-by":"publisher","unstructured":"Liu Z, Wang H, Weng L, Yang Y (2016) Ship rotated bounding box space for ship extraction from high-resolution optical satellite images with complex backgrounds, IEEE Geosci Remote Sens Lett vol. 13, no. 8, pp. 1074\u20131078, IEEE, https:\/\/doi.org\/10.1109\/LGRS.2016.2565705","DOI":"10.1109\/LGRS.2016.2565705"},{"key":"13153_CR97","doi-asserted-by":"publisher","first-page":"1","DOI":"10.1016\/j.neucom.2020.05.027","volume":"409","author":"D Liu","year":"2020","unstructured":"Liu D, Cui Y, Chen Y, Zhang J, Fan B (2020, Elsevier B.V.) Video object detection for autonomous driving: motion-aid feature calibration. Neurocomputing 409:1\u201311. https:\/\/doi.org\/10.1016\/j.neucom.2020.05.027","journal-title":"Neurocomputing"},{"issue":"2","key":"13153_CR98","doi-asserted-by":"publisher","first-page":"261","DOI":"10.1007\/s11263-019-01247-4","volume":"128","author":"L Liu","year":"2020","unstructured":"Liu L et al (2020, Springer US) Deep Learning for Generic Object Detection: A Survey. Int J Comput Vis 128(2):261\u2013318. https:\/\/doi.org\/10.1007\/s11263-019-01247-4","journal-title":"Int J Comput Vis"},{"issue":"1","key":"13153_CR99","doi-asserted-by":"publisher","first-page":"270","DOI":"10.1080\/01431161.2021.2018146","volume":"43","author":"Y Liu","year":"2022","unstructured":"Liu Y, Liu J, Ning X, Li J (2022, Taylor & Francis) MS-CNN: multiscale recognition of building rooftops from high spatial resolution remote sensing imagery. Int J Remote Sens 43(1):270\u2013298. https:\/\/doi.org\/10.1080\/01431161.2021.2018146","journal-title":"Int J Remote Sens"},{"issue":"3","key":"13153_CR100","doi-asserted-by":"publisher","first-page":"253","DOI":"10.1007\/s41095-018-0116-x","volume":"4","author":"Y Lu","year":"2018","unstructured":"Lu Y, Lu J, Zhang S, Hall P (2018, Springer) Traffic signal detection and classification in street views using an attention model. Comput Vis Media 4(3):253\u2013266. https:\/\/doi.org\/10.1007\/s41095-018-0116-x","journal-title":"Comput Vis Media"},{"key":"13153_CR101","doi-asserted-by":"publisher","unstructured":"Lu W, Zhou Y, Wan G, Hou S, Song S (2019) L3-Net: Towards Learning Based LiDAR Localization for Autonomous Driving, in 2019 IEEE\/CVF Conference on Computer Vision and Pattern Recognition (CVPR), IEEE, vol. 2019-June, 6382\u20136391, https:\/\/doi.org\/10.1109\/CVPR.2019.00655","DOI":"10.1109\/CVPR.2019.00655"},{"key":"13153_CR102","doi-asserted-by":"publisher","unstructured":"Lu X, Ji J, Xing Z, Miao Q (2021) Attention and feature fusion SSD for remote sensing object detection. IEEE Trans Instrum Meas 70, https:\/\/doi.org\/10.1109\/TIM.2021.3052575","DOI":"10.1109\/TIM.2021.3052575"},{"key":"13153_CR103","doi-asserted-by":"publisher","unstructured":"Lucas SM (2005) ICDAR 2005 text locating competition results, in Eighth International Conference on Document Analysis and Recognition (ICDAR\u201905), IEEE, vol. 2005, pp. 80\u201384 Vol. 1, https:\/\/doi.org\/10.1109\/ICDAR.2005.231.","DOI":"10.1109\/ICDAR.2005.231"},{"key":"13153_CR104","doi-asserted-by":"publisher","unstructured":"Lucas SM, Panaretos A, Sosa L, Tang A, Wong S, Young R (2003) ICDAR 2003 robust reading competitions, in Seventh International Conference on Document Analysis and Recognition, 2003. Proceedings., IEEE, vol. 1, 682\u2013687, https:\/\/doi.org\/10.1109\/ICDAR.2003.1227749","DOI":"10.1109\/ICDAR.2003.1227749"},{"key":"13153_CR105","doi-asserted-by":"publisher","unstructured":"Lux M (2009) Caliph & Emir: MPEG-7 photo annotation and retrieval, MM\u201909 - Proc. 2009 ACM Multimed. Conf. with Co-located Work. Symp 925\u2013926, https:\/\/doi.org\/10.1145\/1631272.1631456","DOI":"10.1145\/1631272.1631456"},{"key":"13153_CR106","doi-asserted-by":"publisher","unstructured":"Lv X, Su M, Wang Z (2021) Application of face recognition method under deep learning algorithm in embedded systems. Microprocess. Microsyst, 104034, Elsevier B.V., https:\/\/doi.org\/10.1016\/j.micpro.2021.104034","DOI":"10.1016\/j.micpro.2021.104034"},{"key":"13153_CR107","doi-asserted-by":"publisher","first-page":"107684","DOI":"10.1016\/j.patcog.2020.107684","volume":"111","author":"C Ma","year":"2021","unstructured":"Ma C, Sun L, Zhong Z, Huo Q (2021) ReLaText: exploiting visual relationships for arbitrary-shaped scene text detection with graph convolutional networks. Pattern Recogn 111:107684. https:\/\/doi.org\/10.1016\/j.patcog.2020.107684","journal-title":"Pattern Recogn"},{"key":"13153_CR108","doi-asserted-by":"publisher","unstructured":"Madani M, Bagheri M, Sahba R, Sahba A (2011) Real time object detection using a novel adaptive color thresholding method, MM\u201911 - Proc. 2011 ACM Multimed. Conf. Co-Located Work. - Ubi-MUI 2011 Work. Ubi-MUI\u201911, pp. 13\u201316, https:\/\/doi.org\/10.1145\/2072652.2072656","DOI":"10.1145\/2072652.2072656"},{"issue":"1","key":"13153_CR109","doi-asserted-by":"publisher","first-page":"1","DOI":"10.1111\/mice.12561","volume":"36","author":"H Maeda","year":"2021","unstructured":"Maeda H, Kashiyama T, Sekimoto Y, Seto T, Omata H (2021, wiley) Generative adversarial network for road damage detection. Comput Civ Infrastruct Eng 36(1):1\u201314. https:\/\/doi.org\/10.1111\/mice.12561","journal-title":"Comput Civ Infrastruct Eng"},{"key":"13153_CR110","unstructured":"Manikandan NS, Ganesan K (2019) Deep learning based automatic video annotation tool for self-driving car, [Online]. Available: http:\/\/arxiv.org\/abs\/1904.12618"},{"key":"13153_CR111","doi-asserted-by":"publisher","first-page":"1","DOI":"10.1007\/978-981-16-1781-2_1","volume":"216","author":"KL Masita","year":"2022","unstructured":"Masita KL, Hasan AN, Shongwe T (2022) Refining the efficiency of R-CNN in Pedestrian Detection. Lecture Notes in Networks and Systems 216:1\u201314","journal-title":"Lecture Notes in Networks and Systems"},{"key":"13153_CR112","doi-asserted-by":"publisher","unstructured":"Mathias M, Timofte R, Benenson R, Van Gool L (2013) Traffic sign recognition - how far are we from the solution?, Proc Int Jt Conf Neural Networks, https:\/\/doi.org\/10.1109\/IJCNN.2013.6707049","DOI":"10.1109\/IJCNN.2013.6707049"},{"key":"13153_CR113","doi-asserted-by":"publisher","unstructured":"Maze B et al. (2018) IARPA Janus Benchmark - C: Face Dataset and Protocol, in 2018 International Conference on Biometrics (ICB), IEEE, pp. 158\u2013165, https:\/\/doi.org\/10.1109\/ICB2018.2018.00033","DOI":"10.1109\/ICB2018.2018.00033"},{"key":"13153_CR114","doi-asserted-by":"publisher","unstructured":"Mehedi Shamrat FMJ, Al Jubair M, Billah MM, Chakraborty S, Alauddin M, Ranjan R (2021) A Deep Learning Approach for Face Detection using Max Pooling, in 2021 5th International Conference on Trends in Electronics and Informatics (ICOEI), IEEE, no. June, pp 760\u2013764, https:\/\/doi.org\/10.1109\/ICOEI51242.2021.9452896","DOI":"10.1109\/ICOEI51242.2021.9452896"},{"key":"13153_CR115","doi-asserted-by":"crossref","unstructured":"Mehta R, Ozturk C (2019) Object Detection at 200 Frames per Second, in Lecture Notes in Computer Science, 11133 LNCS, Springer, Springer, 659\u2013675","DOI":"10.1007\/978-3-030-11021-5_41"},{"issue":"11","key":"13153_CR116","doi-asserted-by":"publisher","first-page":"2874","DOI":"10.1109\/TNNLS.2015.2399233","volume":"26","author":"X Mei","year":"2015","unstructured":"Mei X, Hong Z, Prokhorov D, Tao D (2015, IEEE) Robust multitask multiview tracking in videos. IEEE Trans Neural Networks Learn Syst 26(11):2874\u20132890. https:\/\/doi.org\/10.1109\/TNNLS.2015.2399233","journal-title":"IEEE Trans Neural Networks Learn Syst"},{"issue":"11","key":"13153_CR117","doi-asserted-by":"publisher","first-page":"7977","DOI":"10.1007\/s00500-019-04083-3","volume":"24","author":"P Melnyk","year":"2020","unstructured":"Melnyk P, You Z, Li K (2020, Springer Berlin Heidelberg) A high-performance CNN method for offline handwritten Chinese character recognition and visualization. Soft Comput 24(11):7977\u20137987. https:\/\/doi.org\/10.1007\/s00500-019-04083-3","journal-title":"Soft Comput"},{"issue":"9","key":"13153_CR118","doi-asserted-by":"publisher","first-page":"79","DOI":"10.1016\/j.ifacol.2019.08.128","volume":"52","author":"IY Merkulova","year":"2019","unstructured":"Merkulova IY, Shavetov SV, Borisov OI, Gromov VS (2019, Elsevier Ltd) Object detection and tracking basics: Student education. IFAC-PapersOnLine 52(9):79\u201384. https:\/\/doi.org\/10.1016\/j.ifacol.2019.08.128","journal-title":"IFAC-PapersOnLine"},{"key":"13153_CR119","doi-asserted-by":"publisher","unstructured":"Mishra A, Alahari K, Jawahar C (2012) Scene Text Recognition using Higher Order Language Priors, in Procedings of the British Machine Vision Conference 2012, British Machine Vision Association, pp. 127.1\u2013127.11, https:\/\/doi.org\/10.5244\/C.26.127","DOI":"10.5244\/C.26.127"},{"issue":"4","key":"13153_CR120","doi-asserted-by":"publisher","first-page":"1484","DOI":"10.1109\/TITS.2012.2209421","volume":"13","author":"A Mogelmose","year":"2012","unstructured":"Mogelmose A, Trivedi MM, Moeslund TB (2012) Vision-based traffic sign detection and analysis for intelligent driver assistance systems: perspectives and survey. IEEE Trans Intell Transp Syst 13(4):1484\u20131497. https:\/\/doi.org\/10.1109\/TITS.2012.2209421","journal-title":"IEEE Trans Intell Transp Syst"},{"key":"13153_CR121","doi-asserted-by":"publisher","unstructured":"Murdock M, Reid S, Hamilton B, Reese J (2015) ICDAR 2015 competition on text line detection in historical documents, in 2015 13th International Conference on Document Analysis and Recognition (ICDAR), IEEE, pp. 1171\u20131175, https:\/\/doi.org\/10.1109\/ICDAR.2015.7333945","DOI":"10.1109\/ICDAR.2015.7333945"},{"key":"13153_CR122","doi-asserted-by":"publisher","unstructured":"Nada H, Sindagi VA, Zhang H, Patel VM (2018) Pushing the Limits of Unconstrained Face Detection: a Challenge Dataset and Baseline Results, in 2018 IEEE 9th International Conference on Biometrics Theory, Applications and Systems (BTAS), IEEE, pp. 1\u201310, https:\/\/doi.org\/10.1109\/BTAS.2018.8698561","DOI":"10.1109\/BTAS.2018.8698561"},{"issue":"2020","key":"13153_CR123","doi-asserted-by":"publisher","first-page":"114549","DOI":"10.1016\/j.eswa.2020.114549","volume":"170","author":"F Naiemi","year":"2021","unstructured":"Naiemi F, Ghods V, Khalesi H (2021, Elsevier Ltd) A novel pipeline framework for multi oriented scene text image detection and recognition. Expert Syst Appl 170(2020):114549. https:\/\/doi.org\/10.1016\/j.eswa.2020.114549","journal-title":"Expert Syst Appl"},{"issue":"9","key":"13153_CR124","first-page":"8290","volume":"10","author":"M Nayagam","year":"2015","unstructured":"Nayagam M, Ramar K (2015) A survey on real time object detection and tracking algorithms. International Journal of Applied Engineering Research 10(9):8290\u20138297","journal-title":"International Journal of Applied Engineering Research"},{"issue":"2","key":"13153_CR125","doi-asserted-by":"publisher","first-page":"464","DOI":"10.3390\/s22020464","volume":"22","author":"U Nepal","year":"2022","unstructured":"Nepal U, Eslamiat H (2022) Comparing YOLOv3, YOLOv4 and YOLOv5 for Autonomous Landing Spot Detection in Faulty UAVs. Sensors 22(2):464. https:\/\/doi.org\/10.3390\/s22020464","journal-title":"Sensors"},{"key":"13153_CR126","doi-asserted-by":"crossref","unstructured":"Neumann L et al. (2019) NightOwls: A Pedestrians at Night Dataset\u201d, in Computer Vision \u2013 ACCV 2018, vol. 11361, H. Li, G. Mori, and K. Schindler, Eds. Springer International Publishing, Springer International Publishing, pp. 691\u2013705","DOI":"10.1007\/978-3-030-20887-5_43"},{"issue":"2","key":"13153_CR127","doi-asserted-by":"publisher","first-page":"135","DOI":"10.15625\/1813-9663\/35\/2\/13315","volume":"35","author":"CC Nguyen","year":"2019","unstructured":"Nguyen CC, Tran GS, Nghiem TP, Burie J-C, Luong CM (2019) Real-time smile detection using deep learning. J Comput Sci Cybern 35(2):135\u2013145. https:\/\/doi.org\/10.15625\/1813-9663\/35\/2\/13315","journal-title":"J Comput Sci Cybern"},{"key":"13153_CR128","doi-asserted-by":"publisher","first-page":"1","DOI":"10.1155\/2020\/3189691","volume":"2020","author":"N-D Nguyen","year":"2020","unstructured":"Nguyen N-D, Do T, Ngo TD, Le D-D (2020) An evaluation of deep learning methods for small object detection. J Electr Comput Eng 2020:1\u201318. https:\/\/doi.org\/10.1155\/2020\/3189691","journal-title":"J Electr Comput Eng"},{"issue":"10","key":"13153_CR129","doi-asserted-by":"publisher","first-page":"35","DOI":"10.1002\/ecj.12268","volume":"103","author":"R Ogura","year":"2020","unstructured":"Ogura R, Nagasaki T, Matsubara H (2020) Improving the visibility of nighttime images for pedestrian recognition using in-vehicle camera. Electron Commun Japan 103(10):35\u201343. https:\/\/doi.org\/10.1002\/ecj.12268","journal-title":"Electron Commun Japan"},{"key":"13153_CR130","doi-asserted-by":"publisher","unstructured":"Padilla R, Netto SL, da Silva EABB (2020) A Survey on Performance Metrics for Object-Detection Algorithms\u201d, in 2020 International Conference on Systems, Signals and Image Processing (IWSSIP), IEEE, vol. 2020-July, 237\u2013242, https:\/\/doi.org\/10.1109\/IWSSIP48289.2020.9145130","DOI":"10.1109\/IWSSIP48289.2020.9145130"},{"issue":"1","key":"13153_CR131","doi-asserted-by":"publisher","first-page":"15","DOI":"10.1023\/A:1008162616689","volume":"38","author":"C Papageorgiou","year":"2000","unstructured":"Papageorgiou C, Poggio T (2000, Springer) Trainable system for object detection. Int J Comput Vis 38(1):15\u201333. https:\/\/doi.org\/10.1023\/A:1008162616689","journal-title":"Int J Comput Vis"},{"issue":"04","key":"13153_CR132","first-page":"231","volume":"06","author":"T Pattewar","year":"2019","unstructured":"Pattewar T, Chaudhari A, Marathe M, Bhol M (2019) Real-time object detection : a survey. Int Res J Eng Technol 06(04):231\u2013237","journal-title":"Int Res J Eng Technol"},{"key":"13153_CR133","first-page":"1","volume":"57","author":"V Paul","year":"2001","unstructured":"Paul V, Michael J (2001) Robust real-time object detection. Int J Comput Vis 57:1\u201325","journal-title":"Int J Comput Vis"},{"key":"13153_CR134","unstructured":"Qian R, Lai X, Li X (2021) 3D object detection for autonomous driving: A Survey 14(8), 1\u201324, [Online]. Available: http:\/\/arxiv.org\/abs\/2106.10823"},{"key":"13153_CR135","doi-asserted-by":"publisher","unstructured":"Qin S, Liu S (2021) Towards end-to-end car license plate location and recognition in unconstrained scenarios. Neural Comput Appl, pp. 1\u201311, Springer, https:\/\/doi.org\/10.1007\/s00521-021-06147-8","DOI":"10.1007\/s00521-021-06147-8"},{"key":"13153_CR136","doi-asserted-by":"crossref","unstructured":"Rahman MM, Al Mamun S, Kaiser MS, Islam MS, Rahman MA (2021) Cascade classification of face liveliness detection using heart beat measurement, in Advances in Intelligent Systems and Computing, vol. 1309, Springer, Springer, pp. 581\u2013590","DOI":"10.1007\/978-981-33-4673-4_47"},{"key":"13153_CR137","doi-asserted-by":"crossref","unstructured":"Ravishankar V, Vinod V, Kumar T, Bhalla K (2022) Sensor integration and facial recognition deployment in a smart home system, Springer, Springer, pp. 759\u2013771","DOI":"10.1007\/978-981-16-6407-6_65"},{"key":"13153_CR138","doi-asserted-by":"publisher","unstructured":"Razakarivony S, Jurie F (2016) Vehicle detection in aerial imagery : a small target detection benchmark. J Vis Commun Image Represent 34, 187\u2013203, Elsevier, https:\/\/doi.org\/10.1016\/j.jvcir.2015.11.002","DOI":"10.1016\/j.jvcir.2015.11.002"},{"key":"13153_CR139","doi-asserted-by":"publisher","unstructured":"Redmon J, Farhadi A (2017) YOLO9000: Better, Faster, Stronger, in 2017 IEEE conference on computer vision and pattern recognition (CVPR), IEEE, pp. 6517\u20136525, https:\/\/doi.org\/10.1109\/CVPR.2017.690.","DOI":"10.1109\/CVPR.2017.690"},{"key":"13153_CR140","unstructured":"Redmon J, Farhadi A (2018) YOLOv3: An Incremental Improvement, Comput Vis Pattern Recognit, 1\u20136, arXiv preprint arXiv:1804.02767, [Online]. Available: http:\/\/arxiv.org\/abs\/1804.02767"},{"key":"13153_CR141","doi-asserted-by":"publisher","unstructured":"Redmon J, Divvala S, Girshick R, Farhadi A (2016) You only look once: Unified, Real-Time Object Detection, in 2016 IEEE conference on computer vision and pattern recognition (CVPR), IEEE, 779\u2013788, https:\/\/doi.org\/10.1109\/CVPR.2016.91","DOI":"10.1109\/CVPR.2016.91"},{"issue":"6","key":"13153_CR142","doi-asserted-by":"publisher","first-page":"1137","DOI":"10.1109\/TPAMI.2016.2577031","volume":"39","author":"S Ren","year":"2017","unstructured":"Ren S, He K, Girshick R, Sun J (2017) Faster R-CNN: towards real-time object detection with region proposal networks. IEEE Trans Pattern Anal Mach Intell 39(6):1137\u20131149. https:\/\/doi.org\/10.1109\/TPAMI.2016.2577031","journal-title":"IEEE Trans Pattern Anal Mach Intell"},{"issue":"18","key":"13153_CR143","doi-asserted-by":"publisher","first-page":"8027","DOI":"10.1016\/j.eswa.2014.07.008","volume":"41","author":"A Risnumawan","year":"2014","unstructured":"Risnumawan A, Shivakumara P, Chan CS, Tan CL (2014) A robust arbitrary text detection system for natural scene images. Expert Syst Appl 41(18):8027\u20138048, Elsevier. https:\/\/doi.org\/10.1016\/j.eswa.2014.07.008","journal-title":"Expert Syst Appl"},{"issue":"3","key":"13153_CR144","doi-asserted-by":"publisher","first-page":"211","DOI":"10.1007\/s11263-015-0816-y","volume":"115","author":"O Russakovsky","year":"2015","unstructured":"Russakovsky O, Deng J, Su H, Krause J, Satheesh S, Ma S, Huang Z, Karpathy A, Khosla A, Bernstein M, Berg AC, Fei-Fei L (2015) ImageNet large scale visual recognition challenge. Int J Comput Vis 115(3):211\u2013252. https:\/\/doi.org\/10.1007\/s11263-015-0816-y","journal-title":"Int J Comput Vis"},{"issue":"1\u20133","key":"13153_CR145","doi-asserted-by":"publisher","first-page":"157","DOI":"10.1007\/s11263-007-0090-8","volume":"77","author":"BC Russell","year":"2008","unstructured":"Russell BC, Torralba A, Murphy KP, Freeman WT (2008) LabelMe: a database and web-based tool for image annotation. Int J Comput Vis 77(1\u20133):157\u2013173. https:\/\/doi.org\/10.1007\/s11263-007-0090-8","journal-title":"Int J Comput Vis"},{"key":"13153_CR146","doi-asserted-by":"publisher","first-page":"165818","DOI":"10.1016\/j.ijleo.2020.165818","volume":"225","author":"SJ S","year":"2021","unstructured":"S SJ, P ER (2021, Elsevier GmbH) LittleYOLO-SPP: A delicate real-time vehicle detection algorithm. Optik (Stuttg) 225:165818. https:\/\/doi.org\/10.1016\/j.ijleo.2020.165818","journal-title":"Optik (Stuttg)"},{"key":"13153_CR147","unstructured":"Saathoff C, Schenk S, Scherb A (2008) KAT : the K-space annotation tool. Proccedings SAMT, 1\u20132"},{"issue":"2019","key":"13153_CR148","doi-asserted-by":"publisher","first-page":"207","DOI":"10.1016\/j.procs.2020.04.022","volume":"171","author":"NGS Sai Srinath","year":"2020","unstructured":"Sai Srinath NGS, Joseph AZ, Umamaheswaran S, Priyanka CL, Malavika Nair M, Sankaran P (2020, Elsevier BV) NITCAD - Developing an object detection, classification and stereo vision dataset for autonomous navigation in Indian roads. Procedia Comput Sci 171(2019):207\u2013216. https:\/\/doi.org\/10.1016\/j.procs.2020.04.022","journal-title":"Procedia Comput Sci"},{"key":"13153_CR149","doi-asserted-by":"publisher","unstructured":"Sanchez JA, Toselli AH, Romero V, Vidal E (2015) ICDAR 2015 competition HTRtS: Handwritten Text Recognition on the tranScriptorium dataset, in 2015 13th International Conference on Document Analysis and Recognition (ICDAR), IEEE, pp. 1166\u20131170, https:\/\/doi.org\/10.1109\/ICDAR.2015.7333944.","DOI":"10.1109\/ICDAR.2015.7333944"},{"key":"13153_CR150","doi-asserted-by":"publisher","unstructured":"Sanchez JA, Romero V, Toselli AH, Villegas M, Vidal E (2017) ICDAR2017 Competition on Handwritten Text Recognition on the READ Dataset, in 2017 14th IAPR International Conference on Document Analysis and Recognition (ICDAR), IEEE, pp. 1383\u20131388, https:\/\/doi.org\/10.1109\/ICDAR.2017.226.","DOI":"10.1109\/ICDAR.2017.226"},{"key":"13153_CR151","doi-asserted-by":"publisher","unstructured":"Santra S, Roy S, Sardar P, Deyasi A (2019) Real-time vehicle detection from captured images, 2019 Int. Conf. Opto-electronics. Appl Opt Optronix 2019, 1\u20134, IEEE, https:\/\/doi.org\/10.1109\/OPTRONIX.2019.8862323","DOI":"10.1109\/OPTRONIX.2019.8862323"},{"key":"13153_CR152","doi-asserted-by":"publisher","unstructured":"Sch\u00f6ller FET, Plenge-Feidenhans\u2019L MK, Stets JD, Blanke M (2019) Assessing deep-learning methods for object detection at sea from LWIR images, in IFAC-PapersOnLine, Elsevier Ltd, 52(21), 64\u201371, https:\/\/doi.org\/10.1016\/j.ifacol.2019.12.284","DOI":"10.1016\/j.ifacol.2019.12.284"},{"key":"13153_CR153","doi-asserted-by":"publisher","first-page":"505","DOI":"10.1007\/978-981-16-2937-2_32","volume":"71","author":"S Setta","year":"2022","unstructured":"Setta S, Sinha S, Mishra M, Choudhury P (2022) Real-time facial recognition using SURF-FAST. Lecture Notes on Data Engineering and Communications Technologies 71:505\u2013522","journal-title":"Lecture Notes on Data Engineering and Communications Technologies"},{"key":"13153_CR154","doi-asserted-by":"publisher","unstructured":"Shahab A, Shafait F, Dengel A (2011) ICDAR 2011 Robust Reading Competition Challenge 2: Reading Text in Scene Images, in 2011 International Conference on Document Analysis and Recognition, IEEE, pp. 1491\u20131496, https:\/\/doi.org\/10.1109\/ICDAR.2011.296","DOI":"10.1109\/ICDAR.2011.296"},{"key":"13153_CR155","doi-asserted-by":"publisher","unstructured":"Shao S et al. (2019) Objects365: A Large-Scale, High-Quality Dataset for Object Detection, in 2019 IEEE\/CVF International Conference on Computer Vision (ICCV), IEEE, pp. 8429\u20138438, https:\/\/doi.org\/10.1109\/ICCV.2019.00852","DOI":"10.1109\/ICCV.2019.00852"},{"key":"13153_CR156","doi-asserted-by":"publisher","unstructured":"Shao Z, Cheng G, Ma J, Wang Z, Wang J, Li D (2021) Real-time and accurate UAV pedestrian detection for social distancing monitoring in COVID-19 pandemic. IEEE Trans Multimed, pp. 1\u20131, https:\/\/doi.org\/10.1109\/TMM.2021.3075566.","DOI":"10.1109\/TMM.2021.3075566"},{"key":"13153_CR157","doi-asserted-by":"publisher","unstructured":"Sharma N, Mandal R, Sharma R, Pal U, Blumenstein M (2015) ICDAR2015 Competition on Video Script Identification (CVSI 2015), in 2015 13th International Conference on Document Analysis and Recognition (ICDAR), IEEE, pp. 1196\u20131200, https:\/\/doi.org\/10.1109\/ICDAR.2015.7333950","DOI":"10.1109\/ICDAR.2015.7333950"},{"key":"13153_CR158","doi-asserted-by":"publisher","unstructured":"Shashirangana J et al (2021, wiley) License plate recognition using neural architecture search for edge devices. Int J Intell Syst:1\u201338. https:\/\/doi.org\/10.1002\/int.22471","DOI":"10.1002\/int.22471"},{"key":"13153_CR159","doi-asserted-by":"publisher","first-page":"1","DOI":"10.1016\/j.jvcir.2019.102740","volume":"70","author":"Y Shi","year":"2020","unstructured":"Shi Y, Zhang Z, Huang K, Ma W, Tu S (2020, Elsevier Inc) Human-computer interaction based on face feature localization. J vis Commun Image represent 70:1\u20136. https:\/\/doi.org\/10.1016\/j.jvcir.2019.102740","journal-title":"J vis Commun Image represent"},{"key":"13153_CR160","doi-asserted-by":"publisher","unstructured":"Song X et al. (2019) APOLLOCAR3D: a large 3D car instance understanding benchmark for autonomous driving, Proc IEEE Comput Soc Conf Comput Vis Pattern Recognit vol. 2019-June, pp. 5447\u20135457, IEEE, https:\/\/doi.org\/10.1109\/CVPR.2019.00560","DOI":"10.1109\/CVPR.2019.00560"},{"issue":"22","key":"13153_CR161","doi-asserted-by":"publisher","first-page":"17417","DOI":"10.1007\/s00500-020-05042-z","volume":"24","author":"D Sudha","year":"2020","unstructured":"Sudha D, Priyadarshini J (2020, Springer Berlin Heidelberg) An intelligent multiple vehicle detection and tracking using modified vibe algorithm and deep learning algorithm. Soft Comput 24(22):17417\u201317429. https:\/\/doi.org\/10.1007\/s00500-020-05042-z","journal-title":"Soft Comput"},{"key":"13153_CR162","doi-asserted-by":"publisher","unstructured":"Sun Y et al. (2019) ICDAR 2019 Competition on Large-Scale Street View Text with Partial Labeling - RRC-LSVT, in 2019 International Conference on Document Analysis and Recognition (ICDAR), IEEE, pp. 1557\u20131562, https:\/\/doi.org\/10.1109\/ICDAR.2019.00250","DOI":"10.1109\/ICDAR.2019.00250"},{"key":"13153_CR163","doi-asserted-by":"publisher","first-page":"1","DOI":"10.1016\/j.imavis.2020.104036","volume":"103","author":"P Sun","year":"2020","unstructured":"Sun P, Zheng Y, Zhou Z, Xu W, Ren Q (2020, Elsevier B.V) R4 Det: refined single-stage detector with feature recursion and refinement for rotating object detection in aerial images. Image Vis Comput 103:1\u201326. https:\/\/doi.org\/10.1016\/j.imavis.2020.104036","journal-title":"Image Vis Comput"},{"issue":"1","key":"13153_CR164","doi-asserted-by":"publisher","first-page":"102","DOI":"10.1080\/22797254.2021.1880975","volume":"54","author":"F Sun","year":"2021","unstructured":"Sun F, Li H, Liu Z, Li X, Wu Z (2021, Taylor & Francis) Arbitrary-angle bounding box based location for object detection in remote sensing image. Eur J Remote Sens 54(1):102\u2013116. https:\/\/doi.org\/10.1080\/22797254.2021.1880975","journal-title":"Eur J Remote Sens"},{"key":"13153_CR165","doi-asserted-by":"publisher","first-page":"50","DOI":"10.1016\/j.isprsjprs.2020.12.015","volume":"173","author":"X Sun","year":"2021","unstructured":"Sun X, Wang P, Wang C, Liu Y, Fu K (2021, Elsevier) PBNet: part-based convolutional neural network for complex composite object detection in remote sensing imagery. ISPRS J Photogramm Remote Sens 173:50\u201365. https:\/\/doi.org\/10.1016\/j.isprsjprs.2020.12.015","journal-title":"ISPRS J Photogramm Remote Sens"},{"key":"13153_CR166","doi-asserted-by":"publisher","unstructured":"Susanto ER, Analia R, Sutopo PD, Soebakti H (2017) The deep learning development for real-time ball and goal detection of barelang-FC, in 2017 International Electronics Symposium on Engineering Technology and Applications (IES-ETA), IEEE, pp. 146\u2013151, https:\/\/doi.org\/10.1109\/ELECSYM.2017.8240393.","DOI":"10.1109\/ELECSYM.2017.8240393"},{"issue":"10","key":"13153_CR167","doi-asserted-by":"publisher","first-page":"1","DOI":"10.1002\/tee.23215","volume":"15","author":"T Suzuki","year":"2020","unstructured":"Suzuki T, Kageyama Y, Ishizawa C (2020, wiley) Recognition method for speed limit signs and its applicability in recognition of vehicle entry prohibition signs at night. IEEJ Trans Electr Electron Eng 15(10):1\u20139. https:\/\/doi.org\/10.1002\/tee.23215","journal-title":"IEEJ Trans Electr Electron Eng"},{"issue":"6","key":"13153_CR168","doi-asserted-by":"publisher","first-page":"4307","DOI":"10.1016\/j.aej.2021.09.043","volume":"61","author":"M Tamilselvi","year":"2022","unstructured":"Tamilselvi M, Karthikeyan S (2022, Elsevier) An ingenious face recognition system based on HRPSM_CNN under unrestrained environmental condition. Alexandria Eng J 61(6):4307\u20134321. https:\/\/doi.org\/10.1016\/j.aej.2021.09.043","journal-title":"Alexandria Eng J"},{"key":"13153_CR169","doi-asserted-by":"publisher","unstructured":"Tanner F et al. (2009) Overhead imagery research data set \u2014 an annotated data library & tools to aid in the development of computer vision algorithms, in 2009 IEEE Applied Imagery Pattern Recognition Workshop (AIPR 2009), IEEE, 1\u20138, https:\/\/doi.org\/10.1109\/AIPR.2009.5466304","DOI":"10.1109\/AIPR.2009.5466304"},{"key":"13153_CR170","doi-asserted-by":"publisher","unstructured":"Tarchoun B, Jegham I, Ben Khalifa A, Alouani I, Mahjoub MA (2020) Deep CNN-based Pedestrian Detection for Intelligent Infrastructure, in 2020 5th International Conference on Advanced Technologies for Signal and Image Processing (ATSIP), IEEE, pp. 1\u20136, https:\/\/doi.org\/10.1109\/ATSIP49331.2020.9231712","DOI":"10.1109\/ATSIP49331.2020.9231712"},{"issue":"5","key":"13153_CR171","doi-asserted-by":"publisher","first-page":"416","DOI":"10.1080\/2150704X.2020.1722330","volume":"11","author":"Z Tian","year":"2020","unstructured":"Tian Z, Zhan R, Wang W, He Z, Zhang J, Zhuang Z (2020, Taylor & Francis) Object detection in optical remote sensing images by integrating object-to-object relationships. Remote Sens Lett 11(5):416\u2013425. https:\/\/doi.org\/10.1080\/2150704X.2020.1722330","journal-title":"Remote Sens Lett"},{"key":"13153_CR172","doi-asserted-by":"publisher","unstructured":"Timofte R, Zimmermann K, Van Gool L (2014) Multi-view traffic sign detection, recognition, and 3D localisation, in Machine Vision and Applications, Springer, 25(3), 633\u2013647, https:\/\/doi.org\/10.1007\/s00138-011-0391-3","DOI":"10.1007\/s00138-011-0391-3"},{"key":"13153_CR173","doi-asserted-by":"publisher","unstructured":"Tousch A-M, Herbin S, Audibert J-Y (2012) Semantic hierarchies for image annotation: A survey, in pattern recognition, Elsevier, 45(1), 333\u2013345, https:\/\/doi.org\/10.1016\/j.patcog.2011.05.017","DOI":"10.1016\/j.patcog.2011.05.017"},{"key":"13153_CR174","doi-asserted-by":"crossref","unstructured":"Tran P, Pattichis M, Celed\u00f3n-Pattichis S, L\u00f3pezLeiva C (2021) Facial recognition in collaborative learning videos, in Lecture Notes in Computer Science (including subseries Lecture Notes in Artificial Intelligence and Lecture Notes in Bioinformatics), vol. 13053, no. 1613637, Springer, Springer, pp. 252\u2013261","DOI":"10.1007\/978-3-030-89131-2_23"},{"key":"13153_CR175","unstructured":"Tzutalin (2015) Labelimg, https:\/\/github.com\/tzutalin\/label."},{"issue":"2","key":"13153_CR176","doi-asserted-by":"publisher","first-page":"721","DOI":"10.1007\/s12652-020-02845-8","volume":"13","author":"S Umer","year":"2022","unstructured":"Umer S, Rout RK, Pero C, Nappi M (2022, Springer) Facial expression recognition with trade-offs between data augmentation and deep learning features. J Ambient Intell Humaniz Comput 13(2):721\u2013735. https:\/\/doi.org\/10.1007\/s12652-020-02845-8","journal-title":"J Ambient Intell Humaniz Comput"},{"key":"13153_CR177","doi-asserted-by":"publisher","unstructured":"Varma S, Sreeraj M (2013) Object detection and classification in surveillance system, in 2013 IEEE Recent Advances in Intelligent Computational Systems (RAICS), IEEE, 299\u2013303, https:\/\/doi.org\/10.1109\/RAICS.2013.6745491","DOI":"10.1109\/RAICS.2013.6745491"},{"key":"13153_CR178","unstructured":"Veit A, Matera T, Neumann L, Matas J, Belongie S (2016) COCO-Text: Dataset and Benchmark for Text Detection and Recognition in Natural Images, [Online]. Available: http:\/\/arxiv.org\/abs\/1601.07140."},{"key":"13153_CR179","doi-asserted-by":"publisher","unstructured":"Vennelakanti A, Shreya S, Rajendran R, Sarkar D, Muddegowda D, Hanagal P (2019) Traffic Sign Detection and Recognition using a CNN Ensemble, in 2019 IEEE International Conference on Consumer Electronics (ICCE), IEEE, pp. 1\u20134, https:\/\/doi.org\/10.1109\/ICCE.2019.8662019","DOI":"10.1109\/ICCE.2019.8662019"},{"key":"13153_CR180","doi-asserted-by":"publisher","unstructured":"Viola P, Jones M (2001) Rapid object detection using a boosted cascade of simple features, in Proceedings of the 2001 IEEE Computer Society Conference on Computer Vision and Pattern Recognition. CVPR 2001, IEEE Comput. Soc, pp I-511-I\u2013518, https:\/\/doi.org\/10.1109\/CVPR.2001.990517","DOI":"10.1109\/CVPR.2001.990517"},{"issue":"2","key":"13153_CR181","doi-asserted-by":"publisher","first-page":"137","DOI":"10.1023\/B:VISI.0000013087.49260.fb","volume":"57","author":"P Viola","year":"2003","unstructured":"Viola P, Jones MJ (2003, Springer) Robust real-time face detection. Int J Comput Vis 57(2):137\u2013154. https:\/\/doi.org\/10.1023\/B:VISI.0000013087.49260.fb","journal-title":"Int J Comput Vis"},{"key":"13153_CR182","unstructured":"VoTT: Vott (visual object tagging tool) (2019) https:\/\/github.com\/microsoft\/VoTT\/blob\/master\/README.md."},{"key":"13153_CR183","doi-asserted-by":"crossref","unstructured":"Wang K, Belongie S (2010) Word Spotting in the Wild, in 11th European Conference on Computer Vision, Springer, Springer, 591\u2013604","DOI":"10.1007\/978-3-642-15549-9_43"},{"issue":"1","key":"13153_CR184","doi-asserted-by":"publisher","first-page":"71","DOI":"10.1080\/22797254.2021.2018944","volume":"55","author":"H Wang","year":"2022","unstructured":"Wang H, Miao F (2022, Taylor & Francis) Building extraction from remote sensing images using deep residual U-Net. Eur J Remote Sens 55(1):71\u201385. https:\/\/doi.org\/10.1080\/22797254.2021.2018944","journal-title":"Eur J Remote Sens"},{"issue":"1","key":"13153_CR185","doi-asserted-by":"publisher","first-page":"20","DOI":"10.1109\/TPAMI.2017.2662005","volume":"40","author":"W Wang","year":"2018","unstructured":"Wang W, Shen J, Yang R, Porikli F (2018, IEEE) A unified spatiotemporal prior based on geodesic distance for video object segmentation. IEEE Trans Pattern Anal Mach Intell 40(1):20\u201333. https:\/\/doi.org\/10.1109\/TPAMI.2017.2662005","journal-title":"IEEE Trans Pattern Anal Mach Intell"},{"key":"13153_CR186","doi-asserted-by":"publisher","unstructured":"Wang J, Jiang S, Song W, Yang Y (2019) A Comparative Study of Small Object Detection Algorithms, in 2019 Chinese Control Conference (CCC), IEEE, vol. 2019-July, pp. 8507\u20138512, https:\/\/doi.org\/10.23919\/ChiCC.2019.8865157","DOI":"10.23919\/ChiCC.2019.8865157"},{"key":"13153_CR187","doi-asserted-by":"publisher","unstructured":"Wang Y, Xie H, Zha Z, Xing M, Fu Z, Zhang Y (2020) ContourNet: Taking a Further Step Toward Accurate Arbitrary-Shaped Scene Text Detection, in 2020 IEEE\/CVF Conference on Computer Vision and Pattern Recognition (CVPR), IEEE, pp. 11753\u201311762, https:\/\/doi.org\/10.1109\/CVPR42600.2020.01177","DOI":"10.1109\/CVPR42600.2020.01177"},{"issue":"c","key":"13153_CR188","doi-asserted-by":"publisher","first-page":"1","DOI":"10.1109\/TGRS.2021.3064599","volume":"60","author":"G Wang","year":"2022","unstructured":"Wang G, Zhuang Y, Chen H, Liu X, Zhang T, Li L, Dong S, Sang Q (2022) FSoD-net: full-scale object detection from optical remote sensing imagery. IEEE Trans Geosci Remote Sens 60(c):1\u201318. https:\/\/doi.org\/10.1109\/TGRS.2021.3064599","journal-title":"IEEE Trans Geosci Remote Sens"},{"key":"13153_CR189","doi-asserted-by":"publisher","first-page":"107195","DOI":"10.1016\/j.patcog.2020.107195","volume":"103","author":"X Wei","year":"2020","unstructured":"Wei X, Zhang H, Liu S, Lu Y (2020, Elsevier Ltd) Pedestrian detection in underground mines via parallel feature transfer network. Pattern Recognit 103:107195. https:\/\/doi.org\/10.1016\/j.patcog.2020.107195","journal-title":"Pattern Recognit"},{"key":"13153_CR190","doi-asserted-by":"publisher","unstructured":"Womg A, Shafiee MJ, Li F, Chwyl B (2018) Tiny SSD: A Tiny Single-Shot Detection Deep Convolutional Neural Network for Real-Time Embedded Object Detection, in 2018 15th conference on computer and robot vision (CRV), IEEE, 95\u2013101, https:\/\/doi.org\/10.1109\/CRV.2018.00023.","DOI":"10.1109\/CRV.2018.00023"},{"key":"13153_CR191","doi-asserted-by":"publisher","unstructured":"Wu S, Zhang L (2018) Using popular object detection methods for real time forest fire detection, in 2018 11th International Symposium on Computational Intelligence and Design (ISCID), IEEE, pp. 280\u2013284, https:\/\/doi.org\/10.1109\/ISCID.2018.00070","DOI":"10.1109\/ISCID.2018.00070"},{"key":"13153_CR192","doi-asserted-by":"publisher","first-page":"39","DOI":"10.1016\/j.neucom.2020.01.085","volume":"396","author":"X Wu","year":"2020","unstructured":"Wu X, Sahoo D, Hoi SCH (2020, Elsevier B.V.) Recent advances in deep learning for object detection. Neurocomputing 396:39\u201364. https:\/\/doi.org\/10.1016\/j.neucom.2020.01.085","journal-title":"Neurocomputing"},{"key":"13153_CR193","doi-asserted-by":"publisher","unstructured":"Wu J, Zhou C, Zhang Q, Yang M, Yuan J (2020) Self-mimic learning for small-scale pedestrian detection, in Proceedings of the 28th ACM International Conference on Multimedia, ACM, pp. 1\u20139, https:\/\/doi.org\/10.1145\/3394171.3413634","DOI":"10.1145\/3394171.3413634"},{"key":"13153_CR194","doi-asserted-by":"publisher","first-page":"113889","DOI":"10.1109\/ACCESS.2021.3103522","volume":"9","author":"K Wu","year":"2021","unstructured":"Wu K, Bai C, Wang D, Liu Z, Huang T, Zheng H (2021, IEEE) Improved object detection algorithm of YOLOv3 remote sensing image. IEEE Access 9:113889\u2013113900. https:\/\/doi.org\/10.1109\/ACCESS.2021.3103522","journal-title":"IEEE Access"},{"issue":"108214","key":"13153_CR195","doi-asserted-by":"publisher","first-page":"1","DOI":"10.1016\/j.patcog.2021.108214","volume":"122","author":"J Wu","year":"2022","unstructured":"Wu J et al (2022, Elsevier) A multimodal attention fusion network with a dynamic vocabulary for TextVQA. Pattern Recognit 122(108214):1\u201310. https:\/\/doi.org\/10.1016\/j.patcog.2021.108214","journal-title":"Pattern Recognit"},{"key":"13153_CR196","doi-asserted-by":"publisher","unstructured":"Xia GS et al. (2018) DOTA: a large-scale dataset for object detection in aerial images, Proc IEEE Comput Soc Conf Comput Vis Pattern Recognit, 3974\u20133983, https:\/\/doi.org\/10.1109\/CVPR.2018.00418","DOI":"10.1109\/CVPR.2018.00418"},{"issue":"33\u201334","key":"13153_CR197","doi-asserted-by":"publisher","first-page":"23729","DOI":"10.1007\/s11042-020-08976-6","volume":"79","author":"Y Xiao","year":"2020","unstructured":"Xiao Y et al (2020) A review of object detection based on deep learning. Multimed. Tools Appl. 79(33\u201334):23729\u201323791. https:\/\/doi.org\/10.1007\/s11042-020-08976-6","journal-title":"Multimed. Tools Appl."},{"key":"13153_CR198","doi-asserted-by":"publisher","unstructured":"Xu H, Guo M, Nedjah N, Zhang J, Li P (2022) Vehicle and pedestrian detection algorithm based on lightweight YOLOv3-promote and semi-precision acceleration. IEEE Trans Intell Transp Syst, 1\u201312, https:\/\/doi.org\/10.1109\/TITS.2021.3137253","DOI":"10.1109\/TITS.2021.3137253"},{"key":"13153_CR199","doi-asserted-by":"publisher","first-page":"106675","DOI":"10.1016\/j.compag.2021.106675","volume":"193","author":"B Xu","year":"2022","unstructured":"Xu B et al (2022, Elsevier) CattleFaceNet: a cattle face identification approach based on RetinaFace and ArcFace loss. Comput. Electron Agric. 193:106675. https:\/\/doi.org\/10.1016\/j.compag.2021.106675","journal-title":"Comput. Electron Agric."},{"key":"13153_CR200","doi-asserted-by":"publisher","first-page":"1","DOI":"10.1016\/j.patcog.2021.108494","volume":"124","author":"C Xue","year":"2022","unstructured":"Xue C, Lu S, Hoi S (2022, Elsevier) Detection and rectification of arbitrary shaped scene texts by using text keypoints and links. Pattern Recognit 124:1\u201331. https:\/\/doi.org\/10.1016\/j.patcog.2021.108494","journal-title":"Pattern Recognit"},{"key":"13153_CR201","doi-asserted-by":"publisher","unstructured":"Yang B, Yan J, Lei Z, Li SZ (2015) Fine-grained evaluation on face detection in the wild, in 2015 11th IEEE International Conference and Workshops on Automatic Face and Gesture Recognition (FG), IEEE, 1\u20137, https:\/\/doi.org\/10.1109\/FG.2015.7163158","DOI":"10.1109\/FG.2015.7163158"},{"key":"13153_CR202","doi-asserted-by":"publisher","unstructured":"Yang S, Luo P, Loy CC, Tang X (2016) WIDER FACE: A Face Detection Benchmark, in 2016 IEEE conference on computer vision and pattern recognition (CVPR), IEEE, 5525\u20135533, https:\/\/doi.org\/10.1109\/CVPR.2016.596.","DOI":"10.1109\/CVPR.2016.596"},{"key":"13153_CR203","doi-asserted-by":"publisher","unstructured":"Yao C, Bai X, Liu W, Ma Y, Zhuowen Tu (2012) Detecting texts of arbitrary orientations in natural images, in 2012 IEEE conference on computer vision and pattern recognition, IEEE, 1083\u20131090, https:\/\/doi.org\/10.1109\/CVPR.2012.6247787.","DOI":"10.1109\/CVPR.2012.6247787"},{"issue":"7","key":"13153_CR204","doi-asserted-by":"publisher","first-page":"1480","DOI":"10.1109\/TPAMI.2014.2366765","volume":"37","author":"Q Ye","year":"2015","unstructured":"Ye Q, Doermann D (Jul. 2015) Text detection and recognition in imagery: a survey. IEEE Trans Pattern Anal Mach Intell 37(7):1480\u20131500. https:\/\/doi.org\/10.1109\/TPAMI.2014.2366765","journal-title":"IEEE Trans Pattern Anal Mach Intell"},{"key":"13153_CR205","doi-asserted-by":"publisher","unstructured":"Yuan L, Lu F (2018) Real-time ear detection based on embedded systems, in 2018 International Conference on Machine Learning and Cybernetics (ICMLC), IEEE, 115\u2013120, https:\/\/doi.org\/10.1109\/ICMLC.2018.8526987","DOI":"10.1109\/ICMLC.2018.8526987"},{"key":"13153_CR206","unstructured":"Yucel MK, Bilge YC, Oguz O, Ikizler-Cinbis N, Duygulu P, Cinbis RG (2018) Wildest Faces: Face Detection and Recognition in Violent Settings, [Online]. Available: http:\/\/arxiv.org\/abs\/1805.07566"},{"key":"13153_CR207","unstructured":"Yuliang L, Lianwen J, Shuaitao Z, Sheng Z (2017) Detecting curve text in the wild: new dataset and new solution, [Online]. Available: http:\/\/arxiv.org\/abs\/1712.02170."},{"key":"13153_CR208","doi-asserted-by":"publisher","first-page":"1039","DOI":"10.1109\/JSTARS.2022.3140776","volume":"15","author":"Z Zakria","year":"2022","unstructured":"Zakria Z, Deng J, Kumar R, Khokhar MS, Cai J, Kumar J (2022) Multiscale and direction target detecting in remote sensing images via modified YOLO-v4. IEEE J Sel Top Appl Earth Obs Remote Sens 15:1039\u20131048. https:\/\/doi.org\/10.1109\/JSTARS.2022.3140776","journal-title":"IEEE J Sel Top Appl Earth Obs Remote Sens"},{"key":"13153_CR209","doi-asserted-by":"publisher","unstructured":"Zhang H, Hong X (2019) Recent progresses on object detection : a brief review, in Multimedia Tools and Applications, Multimedia Tools and Applications 78, no. June, 27809\u201327847, https:\/\/doi.org\/10.1007\/s11042-019-07898-2.","DOI":"10.1007\/s11042-019-07898-2"},{"issue":"11","key":"13153_CR210","doi-asserted-by":"publisher","first-page":"9682","DOI":"10.1109\/TGRS.2020.3045708","volume":"59","author":"L Zhang","year":"2021","unstructured":"Zhang L, Ma J (2021) Salient object detection based on progressively supervised learning for remote sensing images. IEEE Trans Geosci Remote Sens 59(11):9682\u20139696. https:\/\/doi.org\/10.1109\/TGRS.2020.3045708","journal-title":"IEEE Trans Geosci Remote Sens"},{"key":"13153_CR211","doi-asserted-by":"publisher","unstructured":"Zhang S, Benenson R, Schiele B (2017) CityPersons: a diverse dataset for pedestrian detection, in 2017 IEEE Conference on Computer Vision and Pattern Recognition (CVPR), IEEE, pp. 4457\u20134465, https:\/\/doi.org\/10.1109\/CVPR.2017.474","DOI":"10.1109\/CVPR.2017.474"},{"key":"13153_CR212","doi-asserted-by":"publisher","first-page":"29742","DOI":"10.1109\/ACCESS.2020.2972338","volume":"8","author":"J Zhang","year":"2020","unstructured":"Zhang J, Xie Z, Sun J, Zou X, Wang J (2020, IEEE) A cascaded R-CNN with multiscale attention and imbalanced samples for traffic sign detection. IEEE access 8:29742\u201329754. https:\/\/doi.org\/10.1109\/ACCESS.2020.2972338","journal-title":"IEEE access"},{"key":"13153_CR213","doi-asserted-by":"publisher","first-page":"384","DOI":"10.1016\/j.neucom.2021.10.068","volume":"468","author":"X Zhang","year":"2022","unstructured":"Zhang X, Liu Y, Huo C, Xu N, Wang L, Pan C (2022) PSNet: perspective-sensitive convolutional network for object detection. Neurocomputing 468:384\u2013395. https:\/\/doi.org\/10.1016\/j.neucom.2021.10.068","journal-title":"Neurocomputing"},{"issue":"11","key":"13153_CR214","doi-asserted-by":"publisher","first-page":"3212","DOI":"10.1109\/TNNLS.2018.2876865","volume":"30","author":"Z-QQ Zhao","year":"2019","unstructured":"Zhao Z-QQ, Zheng P, Xu S-TT, Wu X (2019, IEEE) Object detection with deep learning: A Review. IEEE Trans. Neural Networks Learn. Syst. 30(11):3212\u20133232. https:\/\/doi.org\/10.1109\/TNNLS.2018.2876865","journal-title":"IEEE Trans. Neural Networks Learn. Syst."},{"issue":"15","key":"13153_CR215","doi-asserted-by":"publisher","first-page":"5764","DOI":"10.1080\/01431161.2021.1931537","volume":"42","author":"X Zhao","year":"2021","unstructured":"Zhao X, Zhang J, Tian J, Zhuo L, Zhang J (2021, Taylor & Francis) Multiscale object detection in high-resolution remote sensing images via rotation invariant deep features driven by channel attention. Int J Remote Sens 42(15):5764\u20135783. https:\/\/doi.org\/10.1080\/01431161.2021.1931537","journal-title":"Int J Remote Sens"},{"key":"13153_CR216","unstructured":"Zhou J, Yuqiao T, Li W, Wang R, Luan Z, Qian D (2019) LADet : A Light-weight and Adaptive Network for Multi-scale Object Detection, in Proceedings of The Eleventh Asian Conference on Machine Learning, 912\u2013923."},{"key":"13153_CR217","doi-asserted-by":"publisher","first-page":"107336","DOI":"10.1016\/j.patcog.2020.107336","volume":"110","author":"Y Zhu","year":"2021","unstructured":"Zhu Y, Du J (2021, Elsevier) TextMountain: accurate scene text detection via instance segmentation. Pattern Recognit 110:107336. https:\/\/doi.org\/10.1016\/j.patcog.2020.107336","journal-title":"Pattern Recognit"},{"key":"13153_CR218","doi-asserted-by":"publisher","first-page":"104023","DOI":"10.1016\/j.imavis.2020.104023","volume":"104","author":"Y Zhu","year":"2020","unstructured":"Zhu Y, Jiang Y (2020, Elsevier BV) Optimization of face recognition algorithm based on deep learning multi feature fusion driven by big data. Image Vis Comput 104:104023. https:\/\/doi.org\/10.1016\/j.imavis.2020.104023","journal-title":"Image Vis Comput"},{"key":"13153_CR219","doi-asserted-by":"publisher","unstructured":"Zhu H, Chen X, Dai W, Fu K, Ye Q, Jiao J (2015) Orientation robust object detection in aerial images using deep convolutional neural network, in 2015 IEEE International Conference on Image Processing (ICIP), IEEE, pp. 3735\u20133739, https:\/\/doi.org\/10.1109\/ICIP.2015.7351502.","DOI":"10.1109\/ICIP.2015.7351502"},{"key":"13153_CR220","doi-asserted-by":"publisher","unstructured":"Zhu Z, Liang D, Zhang S, Huang X, Li B, Hu S (2016) Traffic-sign detection and classification in the wild, in 2016 IEEE conference on computer vision and pattern recognition (CVPR), IEEE, 2110\u20132118, https:\/\/doi.org\/10.1109\/CVPR.2016.232","DOI":"10.1109\/CVPR.2016.232"},{"issue":"3","key":"13153_CR221","doi-asserted-by":"publisher","first-page":"1100","DOI":"10.1109\/TIP.2017.2773199","volume":"27","author":"Z Zou","year":"2018","unstructured":"Zou Z, Shi Z (2018) Random access memories: a new paradigm for target detection in high resolution aerial remote sensing images. IEEE Trans Image Process 27(3):1100\u20131111. https:\/\/doi.org\/10.1109\/TIP.2017.2773199","journal-title":"IEEE Trans Image Process"}],"container-title":["Multimedia Tools and Applications"],"original-title":[],"language":"en","link":[{"URL":"https:\/\/link.springer.com\/content\/pdf\/10.1007\/s11042-022-13153-y.pdf","content-type":"application\/pdf","content-version":"vor","intended-application":"text-mining"},{"URL":"https:\/\/link.springer.com\/article\/10.1007\/s11042-022-13153-y\/fulltext.html","content-type":"text\/html","content-version":"vor","intended-application":"text-mining"},{"URL":"https:\/\/link.springer.com\/content\/pdf\/10.1007\/s11042-022-13153-y.pdf","content-type":"application\/pdf","content-version":"vor","intended-application":"similarity-checking"}],"deposited":{"date-parts":[[2025,4,9]],"date-time":"2025-04-09T12:04:50Z","timestamp":1744200290000},"score":1,"resource":{"primary":{"URL":"https:\/\/link.springer.com\/10.1007\/s11042-022-13153-y"}},"subtitle":[],"short-title":[],"issued":{"date-parts":[[2022,4,23]]},"references-count":221,"journal-issue":{"issue":"27","published-print":{"date-parts":[[2022,11]]}},"alternative-id":["13153"],"URL":"https:\/\/doi.org\/10.1007\/s11042-022-13153-y","relation":{},"ISSN":["1380-7501","1573-7721"],"issn-type":[{"value":"1380-7501","type":"print"},{"value":"1573-7721","type":"electronic"}],"subject":[],"published":{"date-parts":[[2022,4,23]]},"assertion":[{"value":"16 April 2021","order":1,"name":"received","label":"Received","group":{"name":"ArticleHistory","label":"Article History"}},{"value":"24 February 2022","order":2,"name":"revised","label":"Revised","group":{"name":"ArticleHistory","label":"Article History"}},{"value":"10 April 2022","order":3,"name":"accepted","label":"Accepted","group":{"name":"ArticleHistory","label":"Article History"}},{"value":"23 April 2022","order":4,"name":"first_online","label":"First Online","group":{"name":"ArticleHistory","label":"Article History"}},{"order":1,"name":"Ethics","group":{"name":"EthicsHeading","label":"Declarations"}},{"value":"The authors have no conflicts of interest to declare relevant to this article\u2019s content.","order":2,"name":"Ethics","group":{"name":"EthicsHeading","label":"Conflict of interest"}},{"value":"This article does not contain any studies with human participants or animals performed by any of the authors.","order":3,"name":"Ethics","group":{"name":"EthicsHeading","label":"Ethical approval"}}]}}