{"status":"ok","message-type":"work","message-version":"1.0.0","message":{"indexed":{"date-parts":[[2026,6,5]],"date-time":"2026-06-05T20:59:34Z","timestamp":1780693174423,"version":"3.54.1"},"reference-count":252,"publisher":"Springer Science and Business Media LLC","issue":"8","license":[{"start":{"date-parts":[[2020,4,21]],"date-time":"2020-04-21T00:00:00Z","timestamp":1587427200000},"content-version":"tdm","delay-in-days":0,"URL":"https:\/\/www.springer.com\/tdm"},{"start":{"date-parts":[[2020,4,21]],"date-time":"2020-04-21T00:00:00Z","timestamp":1587427200000},"content-version":"vor","delay-in-days":0,"URL":"https:\/\/www.springer.com\/tdm"}],"content-domain":{"domain":["link.springer.com"],"crossmark-restriction":false},"short-container-title":["Artif Intell Rev"],"published-print":{"date-parts":[[2020,12]]},"DOI":"10.1007\/s10462-020-09825-6","type":"journal-article","created":{"date-parts":[[2020,4,21]],"date-time":"2020-04-21T09:03:22Z","timestamp":1587459802000},"page":"5455-5516","update-policy":"https:\/\/doi.org\/10.1007\/springer_crossmark_policy","source":"Crossref","is-referenced-by-count":2414,"title":["A survey of the recent architectures of deep convolutional neural networks"],"prefix":"10.1007","volume":"53","author":[{"given":"Asifullah","family":"Khan","sequence":"first","affiliation":[],"role":[{"vocabulary":"crossref","role":"author"}]},{"given":"Anabia","family":"Sohail","sequence":"additional","affiliation":[],"role":[{"vocabulary":"crossref","role":"author"}]},{"given":"Umme","family":"Zahoora","sequence":"additional","affiliation":[],"role":[{"vocabulary":"crossref","role":"author"}]},{"given":"Aqsa Saeed","family":"Qureshi","sequence":"additional","affiliation":[],"role":[{"vocabulary":"crossref","role":"author"}]}],"member":"297","published-online":{"date-parts":[[2020,4,21]]},"reference":[{"key":"9825_CR1","doi-asserted-by":"publisher","first-page":"39","DOI":"10.1007\/s10462-018-9633-3","volume":"52","author":"Q Abbas","year":"2019","unstructured":"Abbas Q, Ibrahim MEA, Jaffar MA (2019) A comprehensive review of recent advances on deep vision systems. Artif Intell Rev 52:39\u201376. https:\/\/doi.org\/10.1007\/s10462-018-9633-3","journal-title":"Artif Intell Rev"},{"key":"9825_CR2","doi-asserted-by":"publisher","unstructured":"Abdel-Hamid O, Mohamed AR, Jiang H, Penn G (2012) Applying convolutional neural networks concepts to hybrid NN-HMM model for speech recognition. In: ICASSP, IEEE international conference on acoustics speech and signal processing, pp 4277\u20134280. https:\/\/doi.org\/10.1007\/978-3-319-96145-3_2","DOI":"10.1007\/978-3-319-96145-3_2"},{"key":"9825_CR3","doi-asserted-by":"crossref","unstructured":"Abdel-Hamid O, Deng L, Yu D (2013) Exploring convolutional neural network structures and optimization techniques for speech recognition. In: Interspeech, pp 1173\u20131175","DOI":"10.21437\/Interspeech.2013-744"},{"key":"9825_CR4","doi-asserted-by":"publisher","DOI":"10.1016\/j.jsv.2016.10.043","author":"O Abdeljaber","year":"2017","unstructured":"Abdeljaber O, Avci O, Kiranyaz S et al (2017) Real-time vibration-based structural damage detection using one-dimensional convolutional neural networks. J Sound Vib. https:\/\/doi.org\/10.1016\/j.jsv.2016.10.043","journal-title":"J Sound Vib"},{"key":"9825_CR5","unstructured":"Abdulkader A (2006) Two-tier approach for Arabic offline handwriting recognition. In: Tenth international workshop on frontiers in handwriting recognition"},{"key":"9825_CR6","doi-asserted-by":"crossref","unstructured":"Ahmed U, Khan A, Khan SH et al (2019) Transfer learning and meta classification based deep churn prediction system for telecom industry, pp 1\u201310","DOI":"10.14569\/IJACSA.2019.0100918"},{"key":"9825_CR7","doi-asserted-by":"crossref","unstructured":"Akar E, Marques O, Andrews WA, Furht B (2019) Cloud-based skin lesion diagnosis system using convolutional neural networks. In: Intelligent computing-proceedings of the computing conference, pp 982\u20131000","DOI":"10.1007\/978-3-030-22871-2_70"},{"key":"9825_CR8","doi-asserted-by":"publisher","first-page":"527","DOI":"10.1007\/s10462-019-09706-7","volume":"52","author":"M Amer","year":"2019","unstructured":"Amer M, Maul T (2019) A review of modularization techniques in artificial neural networks. Artif Intell Rev 52:527\u2013561. https:\/\/doi.org\/10.1007\/s10462-019-09706-7","journal-title":"Artif Intell Rev"},{"key":"9825_CR9","doi-asserted-by":"publisher","DOI":"10.1088\/1748-0221\/11\/09\/P09001","author":"A Aurisano","year":"2016","unstructured":"Aurisano A, Radovic A, Rocco D et al (2016) A convolutional neural network neutrino event classifier. J Instrum. https:\/\/doi.org\/10.1088\/1748-0221\/11\/09\/P09001","journal-title":"J Instrum"},{"key":"9825_CR253","doi-asserted-by":"crossref","unstructured":"Aziz A, Sohail A, Fahad L, et al (2020) Channel Boosted Convolutional Neural Network for Classification of Mitotic Nuclei using Histopathological Images. In: 2020 17th International Bhurban Conference on Applied Sciences and Technology (IBCAST). pp 277\u2013284","DOI":"10.1109\/IBCAST47879.2020.9044583"},{"key":"9825_CR10","doi-asserted-by":"publisher","DOI":"10.1109\/TPAMI.2016.2644615","author":"V Badrinarayanan","year":"2017","unstructured":"Badrinarayanan V, Kendall A, Cipolla R (2017) SegNet: a Deep convolutional encoder-decoder architecture for image segmentation. IEEE Trans Pattern Anal Mach Intell. https:\/\/doi.org\/10.1109\/TPAMI.2016.2644615","journal-title":"IEEE Trans Pattern Anal Mach Intell"},{"key":"9825_CR11","doi-asserted-by":"publisher","first-page":"1","DOI":"10.1007\/s10462-018-9654-y","volume":"52","author":"Z Batmaz","year":"2019","unstructured":"Batmaz Z, Yurekli A, Bilge A, Kaleli C (2019) A review on deep learning for recommender systems: challenges and remedies. Artif Intell Rev 52:1\u201337. https:\/\/doi.org\/10.1007\/s10462-018-9654-y","journal-title":"Artif Intell Rev"},{"key":"9825_CR12","doi-asserted-by":"publisher","first-page":"346","DOI":"10.1016\/j.cviu.2007.09.014","volume":"110","author":"H Bay","year":"2008","unstructured":"Bay H, Ess A, Tuytelaars T, Van Gool L (2008) Speeded-up robust features (SURF). Comput Vis Image Underst 110:346\u2013359. https:\/\/doi.org\/10.1016\/j.cviu.2007.09.014","journal-title":"Comput Vis Image Underst"},{"key":"9825_CR13","doi-asserted-by":"publisher","first-page":"1","DOI":"10.1561\/2200000006","volume":"2","author":"Y Bengio","year":"2009","unstructured":"Bengio Y (2009) Learning deep architectures for AI. Found Trends\u00ae Mach Learn 2:1\u2013127. https:\/\/doi.org\/10.1561\/2200000006","journal-title":"Found Trends\u00ae Mach Learn"},{"key":"9825_CR14","doi-asserted-by":"crossref","unstructured":"Bengio Y (2013) Deep learning of representations: looking forward. In: International conference on statistical language and speech processing. Springer, pp 1\u201337","DOI":"10.1007\/978-3-642-39593-2_1"},{"key":"9825_CR15","doi-asserted-by":"crossref","unstructured":"Bengio Y, Lamblin P, Popovici D, Larochelle H (2007) Greedy layer-wise training of deep networks. In: Advances in neural information processing systems. The MIT Press, pp 153\u2013160","DOI":"10.7551\/mitpress\/7503.003.0024"},{"key":"9825_CR16","doi-asserted-by":"publisher","first-page":"1798","DOI":"10.1109\/TPAMI.2013.50","volume":"35","author":"Y Bengio","year":"2013","unstructured":"Bengio Y, Courville A, Vincent P (2013) Representation learning: a review and new perspectives. IEEE Trans Pattern Anal Mach Intell 35:1798\u20131828. https:\/\/doi.org\/10.1109\/TPAMI.2013.50","journal-title":"IEEE Trans Pattern Anal Mach Intell"},{"key":"9825_CR17","unstructured":"Berg A, Deng J, Fei-Fei L (2010) Large scale visual recognition challenge 2010"},{"key":"9825_CR18","doi-asserted-by":"publisher","unstructured":"Bettoni M, Urgese G, Kobayashi Y, et al (2017) A convolutional neural network fully implemented on FPGA for embedded platforms. IEEE, pp 49\u201352. https:\/\/doi.org\/10.1109\/ngcas.2017.16","DOI":"10.1109\/ngcas.2017.16"},{"key":"9825_CR19","doi-asserted-by":"publisher","first-page":"172","DOI":"10.1016\/j.patcog.2018.07.034","volume":"85","author":"AK Bhunia","year":"2019","unstructured":"Bhunia AK, Konwer A, Bhunia AK et al (2019) Script identification in natural scene image and video frames using an attention based Convolutional-LSTM network. Pattern Recognit 85:172\u2013184","journal-title":"Pattern Recognit"},{"key":"9825_CR20","unstructured":"Boureau Y (2009) Icml2010B.Pdf. doi: citeulike-article-id:8496352"},{"key":"9825_CR21","doi-asserted-by":"crossref","unstructured":"Bouvrie J (2006) 1 Introduction Notes on Convolutional Neural Networks. doi: http:\/\/dx.doi.org\/10.1016\/j.protcy.2014.09.007","DOI":"10.1016\/j.protcy.2014.09.007"},{"key":"9825_CR22","first-page":"717","volume-title":"Computer vision\u2014ECCV","author":"A Bulat","year":"2016","unstructured":"Bulat A, Tzimiropoulos G (2016) Human pose estimation via convolutional part heatmap regression BT. In: Leibe B, Matas J, Sebe N, Welling M (eds) Computer vision\u2014ECCV. Springer, Cham, pp 717\u2013732"},{"key":"9825_CR23","doi-asserted-by":"publisher","DOI":"10.1109\/tpami.2019.2956516","author":"Z Cai","year":"2019","unstructured":"Cai Z, Vasconcelos N (2019) Cascade R-CNN: high quality object detection and instance segmentation. IEEE Trans Pattern Anal Mach Intell. https:\/\/doi.org\/10.1109\/tpami.2019.2956516","journal-title":"IEEE Trans Pattern Anal Mach Intell"},{"key":"9825_CR24","doi-asserted-by":"publisher","first-page":"1055","DOI":"10.1109\/72.788646","volume":"10","author":"O Chapelle","year":"1998","unstructured":"Chapelle O (1998) Support vector machines for image classification. Stage deuxi\u00e8me ann\u00e9e magist\u00e8re d\u2019informatique l\u2019\u00c9cole Norm Sup\u00e9rieur Lyon 10:1055\u20131064. https:\/\/doi.org\/10.1109\/72.788646","journal-title":"Stage deuxi\u00e8me ann\u00e9e magist\u00e8re d\u2019informatique l\u2019\u00c9cole Norm Sup\u00e9rieur Lyon"},{"key":"9825_CR25","unstructured":"Chellapilla K, Puri S, Simard P (2006) High performance convolutional neural networks for document processing. In: Tenth international workshop on frontiers in handwriting recognition"},{"key":"9825_CR26","unstructured":"Chen Y-N, Han C-C, Wang C-T et al (2006) The application of a convolution neural network on face and license plate detection. In: 18th international conference on pattern recognition, 2006. ICPR 2006, pp 552\u2013555"},{"key":"9825_CR27","unstructured":"Chen W, Wilson JT, Tyree S et al (2015) Compressing neural networks with the hashing trick. In: 32nd international conference on machine learning, ICML 2015"},{"key":"9825_CR28","doi-asserted-by":"crossref","unstructured":"Chevalier M, Thome N, Cord M et al (2015) LR-CNN for fine-grained classification with varying resolution. In: 2015 IEEE international conference on image processing (ICIP). IEEE, pp 3101\u20133105","DOI":"10.1109\/ICIP.2015.7351374"},{"key":"9825_CR29","doi-asserted-by":"crossref","unstructured":"Chollet F (2017) Xception: deep learning with depthwise separable convolutions. arXiv:1610.02357","DOI":"10.1109\/CVPR.2017.195"},{"key":"9825_CR30","doi-asserted-by":"publisher","first-page":"105612","DOI":"10.1016\/j.asoc.2019.105612","volume":"83","author":"N Chouhan","year":"2019","unstructured":"Chouhan N, Khan A (2019) Network anomaly detection using channel boosted and residual learning based deep convolutional neural network. Appl Soft Comput 83:105612","journal-title":"Appl Soft Comput"},{"key":"9825_CR31","doi-asserted-by":"publisher","first-page":"3207","DOI":"10.1162\/NECO_a_00052","volume":"22","author":"DC Cire\u015fan","year":"2010","unstructured":"Cire\u015fan DC, Meier U, Gambardella LM, Schmidhuber J (2010) Deep, big, simple neural nets for handwritten. Neural Comput 22:3207\u20133220","journal-title":"Neural Comput"},{"key":"9825_CR32","unstructured":"Cire\u015fan DC, Meier U, Masci J et al (2011) High-performance neural networks for visual object classification. Preprint arXiv:1102.0183"},{"key":"9825_CR33","doi-asserted-by":"publisher","first-page":"333","DOI":"10.1016\/j.neunet.2012.02.023","volume":"32","author":"D Cire\u015fan","year":"2012","unstructured":"Cire\u015fan D, Meier U, Masci J, Schmidhuber J (2012a) Multi-column deep neural network for traffic sign classification. Neural Netw 32:333\u2013338. https:\/\/doi.org\/10.1016\/j.neunet.2012.02.023","journal-title":"Neural Netw"},{"key":"9825_CR34","unstructured":"Cire\u015fan D, Giusti A, Gambardella LM, Schmidhuber J (2012b) Deep neural networks segment neuronal membranes in electron microscopy images. In: Advances in neural information processing systems, pp 2843\u20132851"},{"key":"9825_CR35","unstructured":"Cire\u015fan DC, Giusti A, Gambardella LM, Schmidhuber J (2013) Mitosis detection in breast cancer histology images with deep neural networks BT. In: Proceedings of medical image computing and computer-assisted intervention, MICCAI 2013, pp 411\u2013418"},{"key":"9825_CR36","unstructured":"Cire\u015fan DC, Cire\u015fan DC, Meier U, Schmidhuber J (2018) Multi-column deep neural networks for image classification. In: IEEE conference on computer vision and pattern recognition"},{"key":"9825_CR37","doi-asserted-by":"crossref","unstructured":"Collobert R, Weston J (2008) A unified architecture for natural language processing: Deep neural networks with multitask learning. In: Proceedings of the 25th international conference on Machine learning. ACM, pp 160\u2013167","DOI":"10.1145\/1390156.1390177"},{"key":"9825_CR38","unstructured":"Cs\u00e1ji B (2001) Approximation with artificial neural networks. M.Sc. Thesis 45"},{"key":"9825_CR39","unstructured":"Dahl G, Mohamed A, Hinton GE (2010) Phone recognition with the mean-covariance restricted Boltzmann machine. In: Advances in neural information processing systems, pp 469\u2013477"},{"key":"9825_CR40","doi-asserted-by":"crossref","unstructured":"Dahl GE, Sainath TN, Hinton GE (2013) Improving deep neural networks for LVCSR using rectified linear units and dropout. In: 2013 IEEE international conference on acoustics, speech and signal processing (ICASSP). IEEE, pp 8609\u20138613","DOI":"10.1109\/ICASSP.2013.6639346"},{"key":"9825_CR41","doi-asserted-by":"publisher","DOI":"10.1016\/j.jpowsour.2007.02.075","author":"J Dai","year":"2016","unstructured":"Dai J, Li Y, He K, Sun J (2016) R-FCN: object detection via region-based fully convolutional networks. J Power Sources. https:\/\/doi.org\/10.1016\/j.jpowsour.2007.02.075","journal-title":"J Power Sources"},{"key":"9825_CR42","doi-asserted-by":"publisher","unstructured":"Dalal N, Triggs W (2004) Histograms of oriented gradients for human detection. In: IEEE computer society conference on computer vision and pattern recognition CVPR05, vol. 1, pp 886\u2013893. https:\/\/doi.org\/10.1109\/cvpr.2005.177","DOI":"10.1109\/cvpr.2005.177"},{"key":"9825_CR43","unstructured":"Dauphin YN, De Vries H, Bengio Y (2015) Equilibrated adaptive learning rates for non-convex optimization. In: Advances in neural information processing system 2015, January, pp 1504\u20131512"},{"key":"9825_CR44","unstructured":"Dauphin YN, Fan A, Auli M, Grangier D (2017) Language modeling with gated convolutional networks. In: Proceedings of the 34th international conference on machine learning, vol 70, pp 933\u2013941"},{"key":"9825_CR45","unstructured":"de Vries H, Memisevic R, Courville A (2016) Deep learning vector quantization. In: European symposium on artificial neural networks, computational intelligence and machine learning"},{"key":"9825_CR46","doi-asserted-by":"publisher","first-page":"161","DOI":"10.1023\/A:1012454411458","volume":"46","author":"D Decoste","year":"2002","unstructured":"Decoste D, Sch\u00f6lkopf B (2002) Training invariant support vector machines. Mach Learn 46:161\u2013190","journal-title":"Mach Learn"},{"key":"9825_CR47","unstructured":"Delalleau O, Bengio Y (2011) Shallow versus deep sum-product networks. In: Advances in neural information processing systems, pp 666\u2013674"},{"key":"9825_CR48","doi-asserted-by":"publisher","first-page":"141","DOI":"10.1109\/MSP.2012.2211477","volume":"29","author":"L Deng","year":"2012","unstructured":"Deng L (2012) The MNIST database of handwritten digit images for machine learning research [best of the web]. IEEE Signal Process Mag 29:141\u2013142","journal-title":"IEEE Signal Process Mag"},{"key":"9825_CR49","doi-asserted-by":"publisher","first-page":"3","DOI":"10.1561\/2000000039","volume":"7","author":"L Deng","year":"2013","unstructured":"Deng L, Yu D, Delft B (2013) Deep learning: methods and applications foundations and trends R in signal processing. Sig Process 7:3\u20134. https:\/\/doi.org\/10.1561\/2000000039","journal-title":"Sig Process"},{"key":"9825_CR50","doi-asserted-by":"publisher","first-page":"2091","DOI":"10.1109\/TIP.2005.859376","volume":"14","author":"MN Do","year":"2005","unstructured":"Do MN, Vetterli M (2005) The contourlet transform: an efficient directional multiresolution image representation. IEEE Trans Image Process 14:2091\u20132106","journal-title":"IEEE Trans Image Process"},{"key":"9825_CR51","doi-asserted-by":"crossref","unstructured":"Doll\u00e1r P, Tu Z, Perona P, Belongie S (2009) Integral channel features","DOI":"10.5244\/C.23.91"},{"key":"9825_CR52","doi-asserted-by":"crossref","unstructured":"Donahue J, Anne Hendricks L, Guadarrama S et al (2015) Long-term recurrent convolutional networks for visual recognition and description. In: Proceedings of the IEEE conference on computer vision and pattern recognition, pp 2625\u20132634","DOI":"10.1109\/CVPR.2015.7298878"},{"key":"9825_CR53","doi-asserted-by":"publisher","first-page":"295","DOI":"10.1109\/TPAMI.2015.2439281","volume":"38","author":"C Dong","year":"2016","unstructured":"Dong C, Loy CC, He K, Tang X (2016) Image super-resolution using deep convolutional networks. IEEE Trans Pattern Anal Mach Intell 38:295\u2013307","journal-title":"IEEE Trans Pattern Anal Mach Intell"},{"key":"9825_CR54","first-page":"1","volume":"1341","author":"D Erhan","year":"2009","unstructured":"Erhan D, Bengio Y, Courville A, Vincent P (2009) Visualizing higher-layer features of a deep network. Univ Montr 1341:1","journal-title":"Univ Montr"},{"key":"9825_CR55","doi-asserted-by":"crossref","unstructured":"Farfade SS, Saberian MJ, Li L-J (2015) Multi-view face detection using deep convolutional neural networks. In: Proceedings of the 5th ACM on international conference on multimedia retrieval\u2014ICMR\u201915. ACM Press, New York, USA, pp 643\u2013650","DOI":"10.1145\/2671188.2749408"},{"key":"9825_CR56","doi-asserted-by":"crossref","unstructured":"Fasel B (2002) Facial expression analysis using shape and motion information extracted by convolutional neural networks. In: Proceedings of the 2002 12th IEEE workshop on neural networks for signal processing, 2002, pp 607\u2013616","DOI":"10.1109\/NNSP.2002.1030072"},{"key":"9825_CR57","doi-asserted-by":"crossref","unstructured":"Frizzi S, Kaabi R, Bouchouicha M et al (2016) Convolutional neural network for video fire and smoke detection. In: IECON 2016-42nd annual conference of the IEEE industrial electronics society. IEEE, pp 877\u2013882","DOI":"10.1109\/IECON.2016.7793196"},{"key":"9825_CR58","doi-asserted-by":"crossref","unstructured":"Frome A, Cheung G, Abdulkader A, et al (2009) Large-scale privacy protection in Google Street View. In: Proceedings of the IEEE international conference on computer vision","DOI":"10.1109\/ICCV.2009.5459413"},{"key":"9825_CR59","unstructured":"Frosst N, Hinton G (2018) Distilling a neural network into a soft decision tree. In: CEUR workshop proceedings"},{"key":"9825_CR60","doi-asserted-by":"publisher","first-page":"119","DOI":"10.1016\/0893-6080(88)90014-7","volume":"1","author":"K Fukushima","year":"1988","unstructured":"Fukushima K (1988) Neocognitron: a hierarchical neural network capable of visual pattern recognition. Neural Netw 1:119\u2013130","journal-title":"Neural Netw"},{"key":"9825_CR61","doi-asserted-by":"crossref","unstructured":"Fukushima K, Miyake S (1982) Neocognitron: a self-organizing neural network model for a mechanism of visual pattern recognition. In: Competition and cooperation in neural nets. Springer, pp 267\u2013285","DOI":"10.1007\/978-3-642-46466-9_18"},{"key":"9825_CR62","doi-asserted-by":"publisher","DOI":"10.1109\/TPAMI.2004.97","author":"C Garcia","year":"2004","unstructured":"Garcia C, Delakis M (2004) Convolutional face finder: a neural architecture for fast and robust face detection. IEEE Trans Pattern Anal Mach Intell. https:\/\/doi.org\/10.1109\/TPAMI.2004.97","journal-title":"IEEE Trans Pattern Anal Mach Intell"},{"key":"9825_CR63","doi-asserted-by":"publisher","first-page":"2627","DOI":"10.1016\/S1352-2310(97)00447-0","volume":"32","author":"MW Gardner","year":"1998","unstructured":"Gardner MW, Dorling SR (1998) Artificial neural networks (the multilayer perceptron)\u2014a review of applications in the atmospheric sciences. Atmos Environ 32:2627\u20132636","journal-title":"Atmos Environ"},{"key":"9825_CR64","doi-asserted-by":"crossref","unstructured":"Geng X, Lin J, Zhao B et al (2019) Hardware-aware softmax approximation for deep neural networks. In: Lecture notes in computer science. Lecture notes in artificial intelligence, Lecture notes in bioinformatics. pp 107\u2013122","DOI":"10.1007\/978-3-030-20870-7_7"},{"key":"9825_CR66","doi-asserted-by":"publisher","unstructured":"Gidaris S, Komodakis N (2015) Object detection via a multi-region and semantic segmentation-aware U model. In: Proceedings of IEEE international conference on computer vision 2015, pp 1134\u20131142. https:\/\/doi.org\/10.1109\/iccv.2015.135","DOI":"10.1109\/iccv.2015.135"},{"key":"9825_CR67","doi-asserted-by":"crossref","unstructured":"Girshick R (2015) Fast R-CNN. In: Proceedings of the IEEE international conference on computer vision","DOI":"10.1109\/ICCV.2015.169"},{"key":"9825_CR68","doi-asserted-by":"crossref","unstructured":"Giusti A, Cire\u015fan DC, Masci J et al (2013) Fast image scanning with deep max-pooling convolutional neural networks. In: 2013 IEEE international conference on image processing. IEEE, pp 4034\u20134038","DOI":"10.1109\/ICIP.2013.6738831"},{"key":"9825_CR69","unstructured":"Glorot X, Bengio Y (2010) Understanding the difficulty of training deep feedforward neural networks. In: Proceedings of the thirteenth international conference on artificial intelligence and statistics, pp 249\u2013256"},{"key":"9825_CR70","unstructured":"Goh H, Thome N, Cord M, Lim J-H (2013) Top-down regularization of deep belief networks. In: Advances in neural information processing systems (NIPS). pp 1878\u20131886"},{"key":"9825_CR71","doi-asserted-by":"publisher","first-page":"35","DOI":"10.1038\/nmeth.3707","volume":"13","author":"I Goodfellow","year":"2017","unstructured":"Goodfellow I, Bengio Y, Courville A (2017) Deep learning. Nat Methods 13:35. https:\/\/doi.org\/10.1038\/nmeth.3707","journal-title":"Nat Methods"},{"key":"9825_CR72","doi-asserted-by":"publisher","first-page":"20180013","DOI":"10.1098\/rsfs.2018.0013","volume":"8","author":"K Grill-Spector","year":"2018","unstructured":"Grill-Spector K, Weiner KS, Gomez J et al (2018) The functional neuroanatomy of face perception: from brain measurements to deep neural networks. Interface Focus 8:20180013. https:\/\/doi.org\/10.1098\/rsfs.2018.0013","journal-title":"Interface Focus"},{"key":"9825_CR73","doi-asserted-by":"publisher","unstructured":"Gr\u00fcn F, Rupprecht C, Navab N, Tombari F (2016) A taxonomy and library for visualizing learned features in convolutional neural networks. https:\/\/doi.org\/10.1080\/10962247.2014.948229","DOI":"10.1080\/10962247.2014.948229"},{"key":"9825_CR74","doi-asserted-by":"publisher","first-page":"354","DOI":"10.1016\/j.patcog.2017.10.013","volume":"77","author":"J Gu","year":"2018","unstructured":"Gu J, Wang Z, Kuen J et al (2018) Recent advances in convolutional neural networks. Pattern Recognit 77:354\u2013377. https:\/\/doi.org\/10.1016\/j.patcog.2017.10.013","journal-title":"Pattern Recognit"},{"key":"9825_CR75","doi-asserted-by":"publisher","first-page":"27","DOI":"10.1016\/j.neucom.2015.09.116","volume":"187","author":"Y Guo","year":"2016","unstructured":"Guo Y, Liu Y, Oerlemans A et al (2016) Deep learning for visual understanding: a review. Neurocomputing 187:27\u201348. https:\/\/doi.org\/10.1016\/j.neucom.2015.09.116","journal-title":"Neurocomputing"},{"key":"9825_CR76","unstructured":"Hamel P, Eck D (2010) Learning features from music audio with deep belief networks. In: ISMIR, Utrecht, The Netherlands, pp 339\u2013344"},{"key":"9825_CR77","unstructured":"Han S, Mao H, Dally WJ (2016) Deep compression: compressing deep neural networks with pruning, trained quantization and Huffman coding. In: 4th international conference on learning representations, ICLR 2016\u2014conference track proceedings"},{"key":"9825_CR78","doi-asserted-by":"crossref","unstructured":"Han D, Kim J, Kim J (2017) Deep pyramidal residual networks. In: 2017 IEEE conference on computer vision and pattern recognition (CVPR). IEEE, pp 6307\u20136315","DOI":"10.1109\/CVPR.2017.668"},{"key":"9825_CR79","doi-asserted-by":"publisher","unstructured":"Han W, Feng R, Wang L, Gao L (2018) Adaptive spatial-scale-aware deep convolutional neural network for high-resolution remote sensing imagery scene classification. In: IGARSS 2018\u20132018 IEEE international geoscience and remote sensing symposium, pp 4736\u20134739. https:\/\/doi.org\/10.1109\/igarss.2018.8518290","DOI":"10.1109\/igarss.2018.8518290"},{"key":"9825_CR80","unstructured":"Hanin B, Sellke M (2017) Approximating continuous functions by ReLU Nets of minimal width. Preprint. arXiv:1710.11278"},{"key":"9825_CR81","doi-asserted-by":"publisher","first-page":"10437","DOI":"10.1007\/s11042-017-4440-4","volume":"77","author":"K He","year":"2015","unstructured":"He K, Zhang X, Ren S, Sun J (2015a) Deep residual learning for image recognition. Multimed Tools Appl 77:10437\u201310453. https:\/\/doi.org\/10.1007\/s11042-017-4440-4","journal-title":"Multimed Tools Appl"},{"key":"9825_CR82","doi-asserted-by":"publisher","first-page":"1904","DOI":"10.1109\/TPAMI.2015.2389824","volume":"37","author":"K He","year":"2015","unstructured":"He K, Zhang X, Ren S, Sun J (2015b) Spatial pyramid pooling in deep convolutional networks for visual recognition. IEEE Trans Pattern Anal Mach Intell 37:1904\u20131916","journal-title":"IEEE Trans Pattern Anal Mach Intell"},{"key":"9825_CR83","doi-asserted-by":"crossref","unstructured":"He K, Gkioxari G, Dollar P, Girshick R (2017) Mask R-CNN. In: Proceedings of the IEEE international conference on computer vision","DOI":"10.1109\/ICCV.2017.322"},{"key":"9825_CR84","doi-asserted-by":"publisher","first-page":"425","DOI":"10.1016\/j.patcog.2008.08.014","volume":"42","author":"M Heikkil\u00e4","year":"2009","unstructured":"Heikkil\u00e4 M, Pietik\u00e4inen M, Schmid C (2009) Description of interest regions with local binary patterns. Pattern Recognit 42:425\u2013436. https:\/\/doi.org\/10.1016\/j.patcog.2008.08.014","journal-title":"Pattern Recognit"},{"key":"9825_CR85","doi-asserted-by":"publisher","first-page":"1527","DOI":"10.1162\/neco.2006.18.7.1527","volume":"18","author":"GE Hinton","year":"2006","unstructured":"Hinton GE, Osindero S, Teh Y-W (2006) A fast learning algorithm for deep belief nets. Neural Comput 18:1527\u20131554","journal-title":"Neural Comput"},{"key":"9825_CR86","doi-asserted-by":"crossref","unstructured":"Hinton GE, Krizhevsky A, Wang SD (2011) Transforming auto-encoders. In: International conference on artificial neural networks. Springer, pp 44\u201351","DOI":"10.1007\/978-3-642-21735-7_6"},{"key":"9825_CR87","doi-asserted-by":"publisher","first-page":"82","DOI":"10.1109\/MSP.2012.2205597","volume":"29","author":"G Hinton","year":"2012","unstructured":"Hinton G, Deng L, Yu D et al (2012a) Deep neural networks for acoustic modeling in speech recognition: the shared views of four research groups. IEEE Signal Process Mag 29:82\u201397","journal-title":"IEEE Signal Process Mag"},{"key":"9825_CR88","unstructured":"Hinton GE, Srivastava N, Krizhevsky A, et al (2012b) Improving neural networks by preventing co-adaptation of feature detectors. pp 1\u201318. arXiv:12070580"},{"key":"9825_CR89","unstructured":"Hinton G, Sabour S, Frosst N (2018) Matrix capsules with EM routing. In: 6th international conference on learning representations, ICLR 2018 - conference track proceedings"},{"key":"9825_CR90","doi-asserted-by":"publisher","first-page":"107","DOI":"10.1142\/S0218488598000094","volume":"6","author":"S Hochreiter","year":"1998","unstructured":"Hochreiter S (1998) The vanishing gradient problem during learning recurrent neural nets and problem solutions. Int J Uncertain Fuzziness Knowl-Based Syst 6:107\u2013116","journal-title":"Int J Uncertain Fuzziness Knowl-Based Syst"},{"key":"9825_CR91","unstructured":"Howard AG, Zhu M, Chen B, et al (2017) MobileNets: Efficient Convolutional Neural Networks for Mobile Vision Applications. arXiv:170404861"},{"key":"9825_CR92","unstructured":"Hu B, Lu Z, Li H, Chen Q (2011) Topic modeling for named entity queries. In: Proceedings of the 20th ACM international conference on Information and knowledge management\u2014CIKM\u201911. ACM Press, New York, New York, USA, 2009"},{"key":"9825_CR93","doi-asserted-by":"crossref","unstructured":"Hu J, Shen L, Sun G (2018a) Squeeze-and-excitation networks. In: 2018 IEEE\/CVF conference on computer vision and pattern recognition. IEEE, pp 7132\u20137141","DOI":"10.1109\/CVPR.2018.00745"},{"key":"9825_CR94","unstructured":"Hu Y, Wen G, Luo M, et al (2018b) Competitive inner-imaging squeeze and excitation for residual network. arXiv:1807.08920v3"},{"key":"9825_CR96","doi-asserted-by":"crossref","unstructured":"Huang G, Sun Y, Liu Z et al (2016a) Deep networks with stochastic depth. In: European conference on computer vision. Springer, pp 646\u2013661","DOI":"10.1007\/978-3-319-46493-0_39"},{"key":"9825_CR97","doi-asserted-by":"crossref","unstructured":"Huang G, Sun Y, Liu Z et al (2016b) Deep networks with stochastic depth BT. In: European conference on computer vision ECCV 2016. Springer, pp 646\u2013661","DOI":"10.1007\/978-3-319-46493-0_39"},{"key":"9825_CR98","doi-asserted-by":"publisher","unstructured":"Huang G, Liu Z, Van Der Maaten L, Weinberger KQ (2017) Densely connected convolutional networks. In: Proceedings of 30th IEEE conference on computer vision and pattern recognition, CVPR 2017, pp 2261\u20132269. https:\/\/doi.org\/10.1109\/cvpr.2017.243","DOI":"10.1109\/cvpr.2017.243"},{"key":"9825_CR99","unstructured":"Huang Y, Cheng Y, Chen D et al (2018) GPipe: efficient training of giant neural networks using pipeline parallelism. arXiv:1811.06965v3"},{"key":"9825_CR100","doi-asserted-by":"crossref","unstructured":"Huang KY, Wu CH, Hong QB et al (2019) Speech emotion recognition using deep neural network considering verbal and nonverbal speech sounds. In: Proceedings of IEEE international conference on acoustics, speech and signal processing ICASSP","DOI":"10.1109\/ICASSP.2019.8682283"},{"key":"9825_CR101","doi-asserted-by":"publisher","DOI":"10.1113\/jphysiol.1959.sp006308","author":"DH Hubel","year":"1959","unstructured":"Hubel DH, Wiesel TN (1959) Receptive fields of single neurones in the cat\u2019s striate cortex. J Physiol. https:\/\/doi.org\/10.1113\/jphysiol.1959.sp006308","journal-title":"J Physiol"},{"key":"9825_CR102","doi-asserted-by":"publisher","first-page":"106","DOI":"10.1113\/jphysiol.1962.sp006837","volume":"160","author":"DH Hubel","year":"1962","unstructured":"Hubel DH, Wiesel TN (1962) Receptive fields, binocular interaction and functional architecture in the cat\u2019s visual cortex. J Physiol 160:106\u2013154. https:\/\/doi.org\/10.1113\/jphysiol.1962.sp006837","journal-title":"J Physiol"},{"key":"9825_CR103","doi-asserted-by":"publisher","first-page":"215","DOI":"10.1113\/jphysiol.1968.sp008455","volume":"195","author":"DH Hubel","year":"1968","unstructured":"Hubel DH, Wiesel TN (1968) Receptive fields and functional architecture of monkey striate cortex. J Physiol 195:215\u2013243. https:\/\/doi.org\/10.1113\/jphysiol.1968.sp008455","journal-title":"J Physiol"},{"key":"9825_CR104","doi-asserted-by":"publisher","DOI":"10.1016\/j.molstruc.2016.12.061","author":"S Ioffe","year":"2015","unstructured":"Ioffe S, Szegedy C (2015) Batch normalization: accelerating deep network training by reducing internal covariate shift. J Mol Struct. https:\/\/doi.org\/10.1016\/j.molstruc.2016.12.061","journal-title":"J Mol Struct"},{"key":"9825_CR105","doi-asserted-by":"publisher","DOI":"10.1038\/nbt.3343","author":"M Jaderberg","year":"2015","unstructured":"Jaderberg M, Simonyan K, Zisserman A, Kavukcuoglu K (2015) Spatial transformer networks. Nature. https:\/\/doi.org\/10.1038\/nbt.3343","journal-title":"Nature"},{"key":"9825_CR106","doi-asserted-by":"crossref","unstructured":"Jarrett K, Kavukcuoglu K, Ranzato M, LeCun Y (2009) What is the best multi-stage architecture for object recognition? In: IEEE 12th international conference on comput vision, 2009, pp 2146\u20132153","DOI":"10.1109\/ICCV.2009.5459469"},{"key":"9825_CR107","doi-asserted-by":"publisher","first-page":"221","DOI":"10.1109\/TPAMI.2012.59","volume":"35","author":"S Ji","year":"2010","unstructured":"Ji S, Yang M, Yu K, Xu W (2010) 3D convolutional neural networks for human action recognition. Int Conf Mach Learn 35:221\u2013231. https:\/\/doi.org\/10.1109\/TPAMI.2012.59","journal-title":"Int Conf Mach Learn"},{"key":"9825_CR108","doi-asserted-by":"crossref","unstructured":"Joachims T (1998) Text categorization with support vector machines: Learning with many relevant features. In: European conference on machine learning. pp 137\u2013142","DOI":"10.1007\/BFb0026683"},{"key":"9825_CR109","unstructured":"Justus D, Brennan J, Bonner S, McGough AS (2019) Predicting the computational cost of deep learning models. In: Proceedings of 2018 IEEE international conference on big data, Big Data 2018"},{"key":"9825_CR110","doi-asserted-by":"publisher","first-page":"37","DOI":"10.1016\/j.rvsc.2015.01.001","volume":"99","author":"M Kafi","year":"2015","unstructured":"Kafi M, Maleki M, Davoodian N (2015) Functional histology of the ovarian follicles as determined by follicular fluid concentrations of steroids and IGF-1 in Camelus dromedarius. Res Vet Sci 99:37\u201340. https:\/\/doi.org\/10.1016\/j.rvsc.2015.01.001","journal-title":"Res Vet Sci"},{"key":"9825_CR111","doi-asserted-by":"publisher","first-page":"310","DOI":"10.1109\/TVCG.2018.2864500","volume":"25","author":"M Kahng","year":"2019","unstructured":"Kahng M, Thorat N, Chau DHP et al (2019) GAN Lab: understanding complex deep generative models using interactive visual experimentation. IEEE Trans Vis Comput Graph\u00a025:310\u2013320","journal-title":"IEEE Trans Vis Comput Graph"},{"key":"9825_CR112","doi-asserted-by":"crossref","unstructured":"Kalchbrenner N, Grefenstette E, Blunsom P (2014) A convolutional neural network for modelling sentences. Preprint arXiv:1404.2188","DOI":"10.3115\/v1\/P14-1062"},{"key":"9825_CR114","doi-asserted-by":"crossref","unstructured":"Kawashima T, Kawanishi Y, Ide I et al (2017) Action recognition from extremely low-resolution thermal image sequence. In: 2017 14th IEEE international conference on advanced video and signal based surveillance, AVSS 2017. IEEE, pp 1\u20136","DOI":"10.1109\/AVSS.2017.8078497"},{"key":"9825_CR113","doi-asserted-by":"publisher","first-page":"1462","DOI":"10.1162\/neco_a_01195","volume":"31","author":"K Kawaguchi","year":"2019","unstructured":"Kawaguchi K, Huang J, Kaelbling LP (2019) Effect of depth and width on local minima in deep learning. Neural Comput 31:1462\u20131498. https:\/\/doi.org\/10.1162\/neco_a_01195","journal-title":"Neural Comput"},{"key":"9825_CR115","unstructured":"Khan A, Sohail A, Ali A (2018a) A New channel boosted convolutional neural network using transfer learning. Preprint arXiv:1804.08528"},{"key":"9825_CR116","unstructured":"Khan A, Zameer A, Jamal T, Raza A (2018b) Deep belief networks based feature generation and regression for predicting wind power. Preprint arXiv:1807.11682"},{"key":"9825_CR117","unstructured":"Khan A, Qureshi AS, Hussain M et al (2019) A recent survey on the applications of genetic programming in image processing. Preprint arXiv:1901.07387"},{"key":"9825_CR118","doi-asserted-by":"publisher","DOI":"10.1061\/(ASCE)GT.1943-5606.0001284","author":"A Krizhevsky","year":"2012","unstructured":"Krizhevsky A, Sutskever I, Hinton GE (2012) ImageNet classification with deep convolutional neural networks. Adv Neural Inf Process Syst. https:\/\/doi.org\/10.1061\/(ASCE)GT.1943-5606.0001284","journal-title":"Adv Neural Inf Process Syst"},{"key":"9825_CR119","doi-asserted-by":"crossref","unstructured":"Kuen J, Kong X, Wang G et al (2017) DelugeNets: deep networks with efficient and flexible cross-layer information inflows. In: 2017 IEEE international conference on computer vision workshop (ICCVW), pp 958\u2013966","DOI":"10.1109\/ICCVW.2017.117"},{"key":"9825_CR120","doi-asserted-by":"publisher","unstructured":"Kuen J, Kong X, Wang G, Tan YP (2018) DelugeNets: deep networks with efficient and flexible cross-layer information inflows. In: Proceedings of IEEE international conference on computer vision work ICCVW 2017, pp 958\u2013966. https:\/\/doi.org\/10.1109\/iccvw.2017.117","DOI":"10.1109\/iccvw.2017.117"},{"key":"9825_CR121","unstructured":"Lacey G, Taylor GW, Areibi S (2016) Deep learning on FPGAs: past, present, and future. arXiv:160204283"},{"key":"9825_CR122","unstructured":"Larsson G, Maire M, Shakhnarovich G (2016) Fractalnet: ultra-deep neural networks without residuals. Preprint 1605.07648, pp 1\u201311"},{"key":"9825_CR123","unstructured":"Laskar MNU, Giraldo LGS, Schwartz O (2018) Correspondence of deep neural networks and the brain for visual textures, pp 1\u201317"},{"key":"9825_CR124","doi-asserted-by":"publisher","unstructured":"Le QV, Ranzato M, Monga R et al (2011) Building high-level features using large scale unsupervised learning. In: IEEE International conference on acoustics speech and signal processing ICASSP, pp 8595\u20138598. https:\/\/doi.org\/10.1109\/icassp.2013.6639343","DOI":"10.1109\/icassp.2013.6639343"},{"key":"9825_CR125","doi-asserted-by":"publisher","first-page":"23","DOI":"10.1037\/0096-3445.136.1.23","volume":"136","author":"Y LeCun","year":"2007","unstructured":"LeCun Y (2007) Effcient BackPrp. J Exp Psychol Gen 136:23\u201342","journal-title":"J Exp Psychol Gen"},{"key":"9825_CR126","doi-asserted-by":"publisher","first-page":"541","DOI":"10.1162\/neco.1989.1.4.541","volume":"1","author":"Y LeCun","year":"1989","unstructured":"LeCun Y, Boser B, Denker JS et al (1989) Backpropagation applied to handwritten zip code recognition. Neural Comput 1:541\u2013551","journal-title":"Neural Comput"},{"key":"9825_CR127","first-page":"276","volume":"261","author":"Y LeCun","year":"1995","unstructured":"LeCun Y, Jackel LD, Bottou L et al (1995) Learning algorithms for classification: a comparison on handwritten digit recognition. Neural Netw Stat Mech Perspect 261:276","journal-title":"Neural Netw Stat Mech Perspect"},{"key":"9825_CR128","doi-asserted-by":"publisher","first-page":"2278","DOI":"10.1109\/5.726791","volume":"86","author":"Y LeCun","year":"1998","unstructured":"LeCun Y, Bottou L, Bengio Y, Haffner P (1998) Gradient-based learning applied to document recognition. Proc IEEE 86:2278\u20132324","journal-title":"Proc IEEE"},{"key":"9825_CR129","doi-asserted-by":"crossref","unstructured":"LeCun Y, Kavukcuoglu K, Farabet CC et al (2010) Convolutional networks and applications in vision. In: ISCAS. IEEE, pp 253\u2013256","DOI":"10.1109\/ISCAS.2010.5537907"},{"key":"9825_CR130","doi-asserted-by":"publisher","first-page":"436","DOI":"10.1038\/nature14539","volume":"521","author":"Y LeCun","year":"2015","unstructured":"LeCun Y, Bengio Y, Hinton G (2015) Deep learning. Nature 521:436\u2013444. https:\/\/doi.org\/10.1038\/nature14539","journal-title":"Nature"},{"key":"9825_CR131","unstructured":"Lee C-Y, Gallagher PW, Tu Z (2016) Generalizing pooling functions in convolutional neural networks: mixed, gated, and tree. In: Artificial intelligence and statistics, pp 464\u2013472"},{"key":"9825_CR132","doi-asserted-by":"crossref","unstructured":"Lee S, Son K, Kim H, Park J (2017) Car plate recognition based on CNN using embedded system with GPU, pp 239\u2013241","DOI":"10.1109\/HSI.2017.8005037"},{"key":"9825_CR133","doi-asserted-by":"publisher","DOI":"10.1109\/CVPRW.2015.7301352","author":"G Levi","year":"2009","unstructured":"Levi G, Hassner T (2009) Sicherheit und Medien. Sicherheit und Medien. https:\/\/doi.org\/10.1109\/CVPRW.2015.7301352","journal-title":"Sicherheit und Medien"},{"key":"9825_CR134","doi-asserted-by":"crossref","unstructured":"Li S, Liu Z-Q, Chan AB (2014) Heterogeneous multi-task learning for human pose estimation with deep convolutional neural network. In: 2014 IEEE conference on computer vision and pattern recognition workshops. IEEE, pp 488\u2013495","DOI":"10.1109\/CVPRW.2014.78"},{"key":"9825_CR135","doi-asserted-by":"crossref","unstructured":"Li H, Lin Z, Shen X et al (2015) A convolutional neural network cascade for face detection. In: Proceedings of the IEEE conference on computer vision and pattern recognition, pp 5325\u20135334","DOI":"10.1109\/CVPR.2015.7299170"},{"key":"9825_CR136","doi-asserted-by":"crossref","unstructured":"Li X, Bing L, Lam W, Shi B (2018) Transformation networks for target-oriented sentiment classification, pp 946\u2013956","DOI":"10.18653\/v1\/P18-1087"},{"key":"9825_CR137","doi-asserted-by":"publisher","unstructured":"Lin M, Chen Q, Yan S (2013) Network in network, pp 1\u201310. https:\/\/doi.org\/10.1109\/asru.2015.7404828","DOI":"10.1109\/asru.2015.7404828"},{"key":"9825_CR138","unstructured":"Lin T-Y, Maire M, Belongie S et al (2014) Microsoft coco: common objects in context. In: European conference on computer vision. Springer, pp 740\u2013755"},{"key":"9825_CR139","doi-asserted-by":"crossref","unstructured":"Lin TY, Doll\u00e1r P, Girshick R et al (2017) Feature pyramid networks for object detection. In: Proceedings of 30th IEEE conference on computer vision and pattern recognition, CVPR 2017","DOI":"10.1109\/CVPR.2017.106"},{"key":"9825_CR140","doi-asserted-by":"publisher","first-page":"39","DOI":"10.1109\/MM.2008.31","volume":"28","author":"E Lindholm","year":"2008","unstructured":"Lindholm E, Nickolls J, Oberman S, Montrym J (2008) NVIDIA TESLA: a unified graphics and computing architecture. IEEE Micro 28:39\u201355. https:\/\/doi.org\/10.1109\/MM.2008.31","journal-title":"IEEE Micro"},{"key":"9825_CR141","unstructured":"Linnainmaa S (1970) The representation of the cumulative rounding error of an algorithm as a Taylor expansion of the local rounding errors. Master\u2019s Thesis (in Finnish), Univ Helsinki 6\u20137"},{"key":"9825_CR142","doi-asserted-by":"publisher","first-page":"2271","DOI":"10.1016\/S0031-3203(03)00085-2","volume":"36","author":"C-L Liu","year":"2003","unstructured":"Liu C-L, Nakashima K, Sako H, Fujisawa H (2003) Handwritten digit recognition: benchmarking of state-of-the-art techniques. Pattern Recognit 36:2271\u20132285","journal-title":"Pattern Recognit"},{"key":"9825_CR143","doi-asserted-by":"publisher","first-page":"11","DOI":"10.1016\/j.neucom.2016.12.038","volume":"234","author":"W Liu","year":"2017","unstructured":"Liu W, Wang Z, Liu X et al (2017) A survey of deep neural network architectures and their applications. Neurocomputing 234:11\u201326. https:\/\/doi.org\/10.1016\/j.neucom.2016.12.038","journal-title":"Neurocomputing"},{"key":"9825_CR144","doi-asserted-by":"publisher","first-page":"1089","DOI":"10.1007\/s10462-018-9641-3","volume":"52","author":"X Liu","year":"2019","unstructured":"Liu X, Deng Z, Yang Y (2019) Recent progress in semantic image segmentation. Artif Intell Rev 52:1089\u20131106. https:\/\/doi.org\/10.1007\/s10462-018-9641-3","journal-title":"Artif Intell Rev"},{"key":"9825_CR145","doi-asserted-by":"publisher","unstructured":"Long ZM, Guo SQ, Chen GJ, Yin BL (2012) Modeling and simulation for the articulated robotic arm test system of the combination drive. In: 2011 international conference on mechatronics and materials engineering ICMME 2011, pp 151:480\u2013483. https:\/\/doi.org\/10.4028\/www.scientific.net\/AMM.151.480","DOI":"10.4028\/www.scientific.net\/AMM.151.480"},{"key":"9825_CR146","doi-asserted-by":"crossref","unstructured":"Long J, Shelhamer E, Darrell T (2015) Fully convolutional networks for semantic segmentation. In: 2015 IEEE conference on computer vision and pattern recognition (CVPR). IEEE, pp 3431\u20133440","DOI":"10.1109\/CVPR.2015.7298965"},{"key":"9825_CR147","doi-asserted-by":"publisher","unstructured":"Lowe DG (1999) Object recognition from local scale-invariant features. In: Proceedings of Seventh IEEE International Conference on Computer Vision, vol 2, pp 1150\u20131157. https:\/\/doi.org\/10.1109\/iccv.1999.790410","DOI":"10.1109\/iccv.1999.790410"},{"key":"9825_CR148","doi-asserted-by":"publisher","first-page":"91","DOI":"10.1023\/B:VISI.0000029664.99615.94","volume":"60","author":"DG Lowe","year":"2004","unstructured":"Lowe DG (2004) Distinctive image features from scale-invariant keypoints. Int J Comput Vis 60:91\u2013110","journal-title":"Int J Comput Vis"},{"key":"9825_CR149","doi-asserted-by":"publisher","first-page":"e3927","DOI":"10.1002\/cpe.3927","volume":"29","author":"H Lu","year":"2017","unstructured":"Lu H, Li B, Zhu J et al (2017a) Wound intensity correction and segmentation with convolutional neural networks. Concurr Comput Pract Exp 29:e3927","journal-title":"Concurr Comput Pract Exp"},{"key":"9825_CR150","unstructured":"Lu Z, Pu H, Wang F et al (2017b) The expressive power of neural networks: a view from the width. In: Advances in neural information processing systems, pp 6231\u20136239"},{"key":"9825_CR151","doi-asserted-by":"publisher","first-page":"151","DOI":"10.1007\/s10462-019-09708-5","volume":"52","author":"E Lv","year":"2019","unstructured":"Lv E, Wang X, Cheng Y, Yu Q (2019) Deep ensemble network based on multi-path fusion. Artif Intell Rev 52:151\u2013168. https:\/\/doi.org\/10.1007\/s10462-019-09708-5","journal-title":"Artif Intell Rev"},{"key":"9825_CR152","doi-asserted-by":"publisher","DOI":"10.1051\/epjconf\/201921406017","author":"CF Madrazo","year":"2019","unstructured":"Madrazo CF, Heredia I, Lloret L, Marco de Lucas J (2019) Application of a convolutional neural network for image classification for the analysis of collisions in high energy physics. EPJ Web Conf. https:\/\/doi.org\/10.1051\/epjconf\/201921406017","journal-title":"EPJ Web Conf"},{"key":"9825_CR153","unstructured":"Mao X, Shen C, Yang Y-B (2016) Image restoration using very deep convolutional encoder-decoder networks with symmetric skip connections. In: Advances in neural information processing systems, pp 2802\u20132810"},{"key":"9825_CR154","doi-asserted-by":"publisher","first-page":"473","DOI":"10.5194\/isprsannals-III-3-473-2016","volume":"3","author":"D Marmanis","year":"2016","unstructured":"Marmanis D, Wegner JD, Galliani S et al (2016) Semantic segmentation of aerial images with an ensemble of CNNs. ISPRS Ann Photogramm Remote Sens Spat Inf Sci 3:473","journal-title":"ISPRS Ann Photogramm Remote Sens Spat Inf Sci"},{"key":"9825_CR155","doi-asserted-by":"crossref","unstructured":"Matsugu M, Mori K, Ishii M, Mitarai Y (2002) Convolutional spiking neural network model for robust face detection. In: Proceedings of the 9th international conference on neural information processing, 2002. ICONIP\u201902, pp 660\u2013664","DOI":"10.1109\/ICONIP.2002.1198140"},{"key":"9825_CR156","doi-asserted-by":"crossref","unstructured":"Mikolov T, Karafi\u00e1t M, Burget L et al (2010) Recurrent neural network based language model. In: Eleventh annual conference of the international speech communication association","DOI":"10.1109\/ICASSP.2011.5947611"},{"key":"9825_CR157","unstructured":"Misra D (2019) Mish: a self regularized non-monotonic neural activation function. arXiv:190808681"},{"key":"9825_CR158","doi-asserted-by":"publisher","first-page":"14","DOI":"10.1109\/TASL.2011.2109382","volume":"20","author":"A Mohamed","year":"2012","unstructured":"Mohamed A, Dahl GE, Hinton G (2012) Acoustic modeling using deep belief networks. IEEE Trans Audio Speech Lang Process 20:14\u201322","journal-title":"IEEE Trans Audio Speech Lang Process"},{"key":"9825_CR159","unstructured":"Montufar GF, Pascanu R, Cho K, Bengio Y (2014) On the number of linear regions of deep neural networks. In: Advances in neural information processing systems, pp 2924\u20132932"},{"key":"9825_CR160","doi-asserted-by":"publisher","first-page":"903","DOI":"10.1109\/JSSC.2016.2636225","volume":"52","author":"B Moons","year":"2017","unstructured":"Moons B, Verhelst M (2017) An energy-efficient precision-scalable ConvNet processor in 40-nm CMOS. IEEE J Solid-State Circuits 52:903\u2013914","journal-title":"IEEE J Solid-State Circuits"},{"key":"9825_CR161","doi-asserted-by":"publisher","unstructured":"Morar A, Moldoveanu F, Gr\u00f6ller E (2012) Image segmentation based on active contours without edges. In: IEEE 8th international conference on intelligent computer communication processing ICCP 2012, pp 213\u2013220. https:\/\/doi.org\/10.1109\/iccp.2012.6356188","DOI":"10.1109\/iccp.2012.6356188"},{"key":"9825_CR162","unstructured":"Nair V, Hinton GE (2010) Rectified linear units improve restricted Boltzmann machines. In: ICML 27th international conference on machine learning"},{"key":"9825_CR163","doi-asserted-by":"publisher","first-page":"1","DOI":"10.1186\/s40537-014-0007-7","volume":"2","author":"MM Najafabadi","year":"2015","unstructured":"Najafabadi MM, Villanustre F, Khoshgoftaar TM et al (2015) Deep learning applications and challenges in big data analytics. J Big Data 2:1\u201321. https:\/\/doi.org\/10.1186\/s40537-014-0007-7","journal-title":"J Big Data"},{"key":"9825_CR164","unstructured":"Nguyen Q, Mukkamala M, Hein M (2018) Neural networks should be wide enough to learn disconnected decision regions. Preprint arXiv:1803.00094"},{"key":"9825_CR165","doi-asserted-by":"publisher","first-page":"77","DOI":"10.1007\/s10462-018-09679-z","volume":"52","author":"G Nguyen","year":"2019","unstructured":"Nguyen G, Dlugolinsky S, Bob\u00e1k M et al (2019) Machine learning and deep learning frameworks and libraries for large-scale data mining: a survey. Artif Intell Rev 52:77\u2013124. https:\/\/doi.org\/10.1007\/s10462-018-09679-z","journal-title":"Artif Intell Rev"},{"key":"9825_CR166","doi-asserted-by":"crossref","unstructured":"Nickolls J, Buck I, Garland M, Skadron K (2008) Scalable parallel programming with CUDA. In: ACM SIGGRAPH 2008 classes on SIGGRAPH\u201908. ACM Press, New York, New York, USA, p 1","DOI":"10.1145\/1401132.1401152"},{"key":"9825_CR167","unstructured":"Nwankpa C, Ijomah W, Gachagan A, Marshall S (2018) Activation functions: comparison of trends in practice and research for deep learning. Preprint arXiv:1811.03378"},{"key":"9825_CR168","doi-asserted-by":"publisher","first-page":"1311","DOI":"10.1016\/j.patcog.2004.01.013","volume":"37","author":"K-S Oh","year":"2004","unstructured":"Oh K-S, Jung K (2004) GPU implementation of neural networks. Pattern Recognit 37:1311\u20131314","journal-title":"Pattern Recognit"},{"key":"9825_CR169","doi-asserted-by":"publisher","first-page":"51","DOI":"10.1016\/0031-3203(95)00067-4","volume":"29","author":"T Ojala","year":"1996","unstructured":"Ojala T, Pietik\u00e4inen M, Harwood D (1996) A comparative study of texture measures with classification based on feature distributions. Pattern Recognit 29:51\u201359. https:\/\/doi.org\/10.1016\/0031-3203(95)00067-4","journal-title":"Pattern Recognit"},{"key":"9825_CR170","doi-asserted-by":"publisher","first-page":"971","DOI":"10.1109\/TPAMI.2002.1017623","volume":"247","author":"T Ojala","year":"2002","unstructured":"Ojala T, PeitiKainen M, Maenp\u00e3 T (2002) Multiresolution gray-scale and rotation invariant texture classification with local binary patterns. IEEE Trans Pattern Anal Mach Intell 247:971\u2013987","journal-title":"IEEE Trans Pattern Anal Mach Intell"},{"key":"9825_CR171","doi-asserted-by":"crossref","unstructured":"Oquab M, Bottou L, Laptev I, Sivic J (2014) Learning and transferring mid-level image representations using convolutional neural networks. In: Proceedings of the IEEE computer society conference on computer vision and pattern recognition. IEEE, pp 1717\u20131724","DOI":"10.1109\/CVPR.2014.222"},{"key":"9825_CR172","doi-asserted-by":"crossref","unstructured":"Pang J, Chen K, Shi J et al (2020) Libra R-CNN: towards balanced learning for object detection","DOI":"10.1109\/CVPR.2019.00091"},{"key":"9825_CR173","unstructured":"Pascanu R, Mikolov T, Bengio Y (2012) Understanding the exploding gradient problem. arXiv:1211.5063"},{"key":"9825_CR174","doi-asserted-by":"crossref","unstructured":"Peng X, Hoffman J, Yu SX, Saenko K (2016) Fine-to-coarse knowledge transfer for low-res image classification. In: 2016 IEEE international conference on image processing (ICIP). IEEE, pp 3683\u20133687","DOI":"10.1109\/ICIP.2016.7533047"},{"key":"9825_CR175","doi-asserted-by":"crossref","unstructured":"Potluri S, Fasih A, Vutukuru LK et al (2011) CNN based high performance computing for real time image processing on GPU. In: Proceedings of the joint INDS\u201911 & ISTET\u201911, pp 1\u20137","DOI":"10.1109\/INDS.2011.6024781"},{"key":"9825_CR176","unstructured":"Qureshi AS, Khan A (2018) Adaptive transfer learning in deep neural networks: wind power prediction using knowledge transfer from region to region and between different task domains. Preprint arXiv:1810.12611"},{"key":"9825_CR177","doi-asserted-by":"publisher","first-page":"742","DOI":"10.1016\/j.asoc.2017.05.031","volume":"58","author":"AS Qureshi","year":"2017","unstructured":"Qureshi AS, Khan A, Zameer A, Usman A (2017) Wind power prediction using deep neural network based meta regression and transfer learning. Appl Soft Comput J 58:742\u2013755. https:\/\/doi.org\/10.1016\/j.asoc.2017.05.031","journal-title":"Appl Soft Comput J"},{"key":"9825_CR178","unstructured":"Ramachandran P, Zoph B, Le QV (2017) Swish: a self-gated activation function"},{"key":"9825_CR179","doi-asserted-by":"crossref","unstructured":"Ranjan R, Patel VM, Chellappa R (2015) A deep pyramid deformable part model for face detection. Preprint arXiv:1508.04389","DOI":"10.1109\/BTAS.2015.7358755"},{"key":"9825_CR95","doi-asserted-by":"crossref","unstructured":"Ranzato M, Huang FJ, Boureau YL, LeCun Y (2007) Unsupervised learning of invariant feature hierarchies with applications to object recognition. In: Proceedings of the IEEE computer society conference on computer vision and pattern recognition. IEEE, pp 1\u20138","DOI":"10.1109\/CVPR.2007.383157"},{"key":"9825_CR180","doi-asserted-by":"publisher","first-page":"1120","DOI":"10.1162\/NECO","volume":"61","author":"W Rawat","year":"2016","unstructured":"Rawat W, Wang Z (2016) Deep convolutional neural networks for image classification: a comprehensive review. Neural Comput 61:1120\u20131132. https:\/\/doi.org\/10.1162\/NECO","journal-title":"Neural Comput"},{"key":"9825_CR181","doi-asserted-by":"publisher","DOI":"10.1109\/tpami.2016.2577031","author":"S Ren","year":"2015","unstructured":"Ren S, He K, Girshick R, Sun J (2015) Faster R-CNN: towards real-time object detection with region proposal networks. Adv Neural Inf Process Syst. https:\/\/doi.org\/10.1109\/tpami.2016.2577031","journal-title":"Adv Neural Inf Process Syst"},{"key":"9825_CR182","doi-asserted-by":"crossref","unstructured":"Ronneberger O, Fischer P, Brox T (2015) U-net: convolutional networks for biomedical image segmentation. In: Lecture Notes in Computer Science (including subseries Lecture Notes in Artificial Intelligence and Lecture Notes in Bioinformatics)","DOI":"10.1007\/978-3-319-24574-4_28"},{"key":"9825_CR183","doi-asserted-by":"publisher","unstructured":"Roy AG, Navab N, Wachinger C (2018) Concurrent spatial and channel \u2018squeeze & excitation\u2019 in fully convolutional networks. Lecture Notes in Computer Science (including Subser Lectue Notes in Artificial Intelligence Lecture Notes in Bioinformatics) 11070 LNCS:421\u2013429. https:\/\/doi.org\/10.1007\/978-3-030-00928-1_48","DOI":"10.1007\/978-3-030-00928-1_48"},{"key":"9825_CR184","doi-asserted-by":"publisher","DOI":"10.1007\/s11263-015-0816-y","author":"O Russakovsky","year":"2015","unstructured":"Russakovsky O, Deng J, Su H et al (2015) imagenet large scale visual recognition challenge. Int J Comput Vis. https:\/\/doi.org\/10.1007\/s11263-015-0816-y","journal-title":"Int J Comput Vis"},{"key":"9825_CR185","unstructured":"Salakhutdinov R, Larochelle H (2010) Efficient learning of deep Boltzmann machines. In: Proceedings of the thirteenth international conference on artificial intelligence and statistics, pp 693\u2013700"},{"key":"9825_CR186","doi-asserted-by":"crossref","unstructured":"Scherer D, M\u00fcller A, Behnke S (2010) Evaluation of pooling operations in convolutional architectures for object recognition. In: Artificial neural networks\u2013ICANN 2010. Springer, pp 92\u2013101","DOI":"10.1007\/978-3-642-15825-4_10"},{"key":"9825_CR187","doi-asserted-by":"crossref","unstructured":"Schmidhuber J (2007) New millennium AI and the convergence of history. In: Challenges for computational intelligence. Springer, pp 15\u201335","DOI":"10.1007\/978-3-540-71984-7_2"},{"key":"9825_CR188","unstructured":"Sermanet P, Chintala S, Lecun Y (2012) Convolutional neural networks applied to house numbers digit classification. In: Proceedings of the 21st international conference on pattern recognition (ICPR2012), Tsukuba. IEEE, pp 3288\u20133291"},{"key":"9825_CR189","doi-asserted-by":"crossref","unstructured":"Shakeel MF, Bajwa NA, Anwaar AM et al (2019) Detecting driver drowsiness in real time through deep learning based object detection. In: Lecture Notes in Computer Science (including subseries Lecture Notes in Artificial Intelligence and Lecture Notes in Bioinformatics)","DOI":"10.1007\/978-3-030-20521-8_24"},{"key":"9825_CR190","doi-asserted-by":"publisher","unstructured":"Sharma A, Muttoo SK (2018) Spatial image steganalysis based on ResNeXt. In: 2018 IEEE 18th International conference on communication technology, pp 1213\u20131216. https:\/\/doi.org\/10.1109\/icct.2018.8600132","DOI":"10.1109\/icct.2018.8600132"},{"key":"9825_CR191","doi-asserted-by":"publisher","first-page":"1510","DOI":"10.1109\/TMM.2017.2666540","volume":"19","author":"Y Shi","year":"2017","unstructured":"Shi Y, Tian Y, Wang Y, Huang T (2017) Sequential deep trajectory descriptor for action recognition with three-stream CNN. IEEE Trans Multimed 19:1510\u20131520","journal-title":"IEEE Trans Multimed"},{"key":"9825_CR192","doi-asserted-by":"publisher","first-page":"1285","DOI":"10.1109\/TMI.2016.2528162","volume":"35","author":"H-CC Shin","year":"2016","unstructured":"Shin H-CC, Roth HR, Gao M et al (2016) Deep convolutional neural networks for computer-aided detection: CNN architectures, dataset characteristics and transfer learning. IEEE Trans Med Imaging 35:1285\u20131298. https:\/\/doi.org\/10.1109\/TMI.2016.2528162","journal-title":"IEEE Trans Med Imaging"},{"key":"9825_CR193","unstructured":"Simard PY, Steinkraus D, Platt JC (2003) Best practices for convolutional neural networks applied to visual document analysis, p 958"},{"key":"9825_CR194","unstructured":"Simonyan K, Zisserman A (2014) Two-stream convolutional networks for action recognition in videos. In: Advances in neural information processing systems, pp 568\u2013576"},{"key":"9825_CR195","doi-asserted-by":"publisher","first-page":"398","DOI":"10.2146\/ajhp170251","volume":"75","author":"K Simonyan","year":"2015","unstructured":"Simonyan K, Zisserman A (2015) Very deep convolutional networks for large-scale image recognition. ICLR 75:398\u2013406. https:\/\/doi.org\/10.2146\/ajhp170251","journal-title":"ICLR"},{"key":"9825_CR196","doi-asserted-by":"publisher","unstructured":"Simonyan K, Vedaldi A, Zisserman A (2013) Deep inside convolutional networks: visualising image classification models and saliency maps, pp 1\u20138. https:\/\/doi.org\/10.1080\/00994480.2000.10748487","DOI":"10.1080\/00994480.2000.10748487"},{"key":"9825_CR197","doi-asserted-by":"publisher","unstructured":"Sinha T, Verma B, Haidar A (2018) Optimization of convolutional neural network parameters for image classification. In: 2017 IEEE symposium series on computational intelligence SSCI 2017, pp 1\u20137. https:\/\/doi.org\/10.1109\/ssci.2017.8285338","DOI":"10.1109\/ssci.2017.8285338"},{"key":"9825_CR198","doi-asserted-by":"publisher","first-page":"1455","DOI":"10.1109\/TBME.2015.2496264","volume":"63","author":"FA Spanhol","year":"2016","unstructured":"Spanhol FA, Oliveira LS, Petitjean C, Heutte L (2016a) A dataset for breast cancer histopathological image classification. IEEE Trans Biomed Eng 63:1455\u20131462","journal-title":"IEEE Trans Biomed Eng"},{"key":"9825_CR199","doi-asserted-by":"crossref","unstructured":"Spanhol FA, Oliveira LS, Petitjean C, Heutte L (2016b) Breast cancer histopathological image classification using convolutional neural networks. In: 2016 international joint conference on neural networks (IJCNN). IEEE, pp 2560\u20132567","DOI":"10.1109\/IJCNN.2016.7727519"},{"key":"9825_CR200","doi-asserted-by":"publisher","first-page":"1","DOI":"10.3389\/frobt.2015.00036","volume":"2","author":"S Srinivas","year":"2016","unstructured":"Srinivas S, Sarvadevabhatla RK, Mopuri KR et al (2016) A taxonomy of deep convolutional neural nets for computer vision. Front Robot AI 2:1\u201313. https:\/\/doi.org\/10.3389\/frobt.2015.00036","journal-title":"Front Robot AI"},{"key":"9825_CR201","doi-asserted-by":"publisher","first-page":"11","DOI":"10.1016\/j.micromeso.2003.09.025","volume":"1","author":"N Srivastava","year":"2014","unstructured":"Srivastava N, Hinton G, Krizhevsky A et al (2014) Dropout: a simple way to prevent neural networks from overfittin. J Mach Learn Res 1:11. https:\/\/doi.org\/10.1016\/j.micromeso.2003.09.025","journal-title":"J Mach Learn Res"},{"key":"9825_CR202","doi-asserted-by":"publisher","unstructured":"Srivastava RK, Greff K, Schmidhuber J (2015a) Highway networks. https:\/\/doi.org\/10.1002\/esp.3417","DOI":"10.1002\/esp.3417"},{"key":"9825_CR203","unstructured":"Srivastava RK, Greff K, Schmidhuber J (2015b) Training very deep networks. In: Advances in neural information processing systems"},{"key":"9825_CR204","doi-asserted-by":"crossref","unstructured":"Stefanini M, Lancellotti R, Baraldi L, Calderara S (2019) A deep-learning-based approach to vm behavior identification in cloud systems. In: Proceedings of the 9th international conference on cloud computing and services science. SCITEPRESS\u2014Science and Technology Publications, pp 308\u2013315","DOI":"10.5220\/0007708403080315"},{"key":"9825_CR205","doi-asserted-by":"crossref","unstructured":"Strigl D, Kofler K, Podlipnig S (2010) Performance and scalability of GPU-based convolutional neural networks. In: 2010 18th Euromicro international conference on parallel, distributed and network-based processing (PDP), pp 317\u2013324","DOI":"10.1109\/PDP.2010.43"},{"key":"9825_CR206","doi-asserted-by":"crossref","unstructured":"Suganuma M, Shirakawa S, Nagao T (2017) A genetic programming approach to designing convolutional neural network architectures. In: Proceedings of the genetic and evolutionary computation conference. ACM, pp 497\u2013504","DOI":"10.1145\/3071178.3071229"},{"key":"9825_CR207","doi-asserted-by":"crossref","unstructured":"Sun L, Jia K, Yeung D-Y, Shi BE (2015) Human action recognition using factorized spatio-temporal convolutional networks. In: Proceedings of the IEEE international conference on computer vision, pp 4597\u20134605","DOI":"10.1109\/ICCV.2015.522"},{"key":"9825_CR208","doi-asserted-by":"crossref","unstructured":"Sundermeyer M, Schl\u00fcter R, Ney H (2012) LSTM neural networks for language modeling. In: Thirteenth annual conference of the international speech communication association","DOI":"10.21437\/Interspeech.2012-65"},{"key":"9825_CR209","doi-asserted-by":"crossref","unstructured":"Sze V, Chen YH, Yang TJ, Emer JS (2017) Efficient processing of deep neural networks: a tutorial and survey. In: Proceedings of IEEE","DOI":"10.1109\/JPROC.2017.2761740"},{"key":"9825_CR210","unstructured":"Szegedy C, Zaremba W, Sutskever I et al (2014) Intriguing properties of neural networks. In: 2nd international conference on learning Representations, ICLR 2014 - conference track proceedings"},{"key":"9825_CR211","doi-asserted-by":"crossref","unstructured":"Szegedy C, Liu W, Jia Y et al (2015) Going deeper with convolutions. In: 2015 IEEE conference on computer vision and pattern recognition (CVPR). IEEE, pp 1\u20139","DOI":"10.1109\/CVPR.2015.7298594"},{"key":"9825_CR212","doi-asserted-by":"publisher","unstructured":"Szegedy C, Ioffe S, Vanhoucke V (2016a) Inception-v4, Inception-ResNet and the impact of residual connections on learning. Preprint arXiv:1602.07261v2 131:262\u2013263. https:\/\/doi.org\/10.1007\/s10236-015-0809-y","DOI":"10.1007\/s10236-015-0809-y"},{"key":"9825_CR213","doi-asserted-by":"crossref","unstructured":"Szegedy C, Vanhoucke V, Ioffe S et al (2016b) Rethinking the inception architecture for computer vision. In: Proceedings of the IEEE Computer Society conference on computer vision and pattern recognition. IEEE, pp 2818\u20132826","DOI":"10.1109\/CVPR.2016.308"},{"key":"9825_CR214","unstructured":"Targ S, Almeida D, Lyman K (2016) Resnet in Resnet: generalizing residual architectures. Preprint arXiv:1603.08029"},{"key":"9825_CR215","doi-asserted-by":"crossref","unstructured":"Tong W, Song L, Yang X, et al (2015) CNN-based shot boundary detection and video annotation. In: 2015 IEEE international symposium on broadband multimedia systems and broadcasting. IEEE, pp 1\u20135","DOI":"10.1109\/BMSB.2015.7177222"},{"key":"9825_CR216","doi-asserted-by":"crossref","unstructured":"Tong T, Li G, Liu X, Gao Q (2017) Image super-resolution using dense skip connections. In: 2017 IEEE international conference on computer vision (ICCV), pp 4809\u20134817","DOI":"10.1109\/ICCV.2017.514"},{"key":"9825_CR217","doi-asserted-by":"crossref","unstructured":"Tran D, Bourdev L, Fergus R, et al (2015) Learning spatiotemporal features with 3D convolutional networks. In: Proceedings of the IEEE international conference on computer vision, pp 4489\u20134497","DOI":"10.1109\/ICCV.2015.510"},{"key":"9825_CR218","doi-asserted-by":"publisher","first-page":"1155","DOI":"10.1109\/ACCESS.2017.2778011","volume":"6","author":"A Ullah","year":"2017","unstructured":"Ullah A, Ahmad J, Muhammad K et al (2017) Action recognition in video sequences using deep bi-directional LSTM with CNN features. IEEE Access 6:1155\u20131166","journal-title":"IEEE Access"},{"key":"9825_CR219","doi-asserted-by":"crossref","unstructured":"Vinayakumar R, Soman KP, Poornachandrany P (2017) Applying convolutional neural network for network intrusion detection. In: 2017 International conference on advances in computing, communications and informatics, ICACCI 2017","DOI":"10.1109\/ICACCI.2017.8126009"},{"key":"9825_CR220","doi-asserted-by":"crossref","unstructured":"Vincent P, Larochelle H, Bengio Y, Manzagol P-A (2008) Extracting and composing robust features with denoising autoencoders. In: Proceedings of the 25th international conference on machine learning. ACM, pp 1096\u20131103","DOI":"10.1145\/1390156.1390294"},{"key":"9825_CR221","doi-asserted-by":"publisher","DOI":"10.1109\/TPAMI.2016.2587640","author":"O Vinyals","year":"2017","unstructured":"Vinyals O, Toshev A, Bengio S, Erhan D (2017) Show and tell: lessons learned from the 2015 MSCOCO image captioning challenge. IEEE Trans Pattern Anal Mach Intell. https:\/\/doi.org\/10.1109\/TPAMI.2016.2587640","journal-title":"IEEE Trans Pattern Anal Mach Intell"},{"key":"9825_CR222","doi-asserted-by":"publisher","first-page":"86","DOI":"10.1016\/j.compbiomed.2017.04.012","volume":"85","author":"N Wahab","year":"2017","unstructured":"Wahab N, Khan A, Lee YS (2017) Two-phase deep convolutional neural network for reducing class skewness in histopathological images based breast cancer detection. Comput Biol Med 85:86\u201397. https:\/\/doi.org\/10.1016\/j.compbiomed.2017.04.012","journal-title":"Comput Biol Med"},{"key":"9825_CR223","doi-asserted-by":"publisher","first-page":"216","DOI":"10.1093\/jmicro\/dfz002","volume":"68","author":"N Wahab","year":"2019","unstructured":"Wahab N, Khan A, Lee YS (2019) Transfer learning based deep CNN for segmentation and detection of mitoses in breast cancer histopathological images. Microscopy 68:216\u2013233. https:\/\/doi.org\/10.1093\/jmicro\/dfz002","journal-title":"Microscopy"},{"key":"9825_CR224","doi-asserted-by":"publisher","unstructured":"Wang H, Raj B (2017) On the origin of deep learning, pp 1\u201372. https:\/\/doi.org\/10.1016\/0014-5793(91)81229-2","DOI":"10.1016\/0014-5793(91)81229-2"},{"key":"9825_CR225","doi-asserted-by":"crossref","unstructured":"Wang H, Schmid C (2013) Action recognition with improved trajectories. In: Proceedings of the IEEE international conference on computer vision, pp 3551\u20133558","DOI":"10.1109\/ICCV.2013.441"},{"key":"9825_CR226","unstructured":"Wang T, Wu DJDJ, Coates A, Ng AY (2012) End-to-end text recognition with convolutional neural networks. In: International Conference on Pattern Recognition ICPR, pp 3304\u20133308"},{"key":"9825_CR227","doi-asserted-by":"crossref","unstructured":"Wang F, Jiang M, Qian C et al (2017a) Residual attention network for image classification. In: 2017 IEEE conference on computer vision and pattern recognition (CVPR). IEEE, pp 6450\u20136458","DOI":"10.1109\/CVPR.2017.683"},{"key":"9825_CR228","doi-asserted-by":"publisher","first-page":"510","DOI":"10.1109\/LSP.2016.2611485","volume":"24","author":"X Wang","year":"2017","unstructured":"Wang X, Gao L, Song J, Shen H (2017b) Beyond frame-level CNN: saliency-aware 3-D CNN With LSTM for video action recognition. IEEE Signal Process Lett 24:510\u2013514. https:\/\/doi.org\/10.1109\/LSP.2016.2611485","journal-title":"IEEE Signal Process Lett"},{"key":"9825_CR229","doi-asserted-by":"publisher","first-page":"31959","DOI":"10.1109\/ACCESS.2019.2903582","volume":"7","author":"Y Wang","year":"2019","unstructured":"Wang Y, Wang L, Wang H, Li P (2019) End-to-end image super-resolution via deep and shallow convolutional networks. IEEE Access 7:31959\u201331970. https:\/\/doi.org\/10.1109\/ACCESS.2019.2903582","journal-title":"IEEE Access"},{"key":"9825_CR230","doi-asserted-by":"publisher","unstructured":"Woo S, Park J, Lee JY, Kweon IS (2018) CBAM: Convolutional block attention module. Lect Notes Comput Sci (including Subser Lect Notes Artif Intell Lect Notes Bioinformatics) 11211 LNCS:3\u201319. https:\/\/doi.org\/10.1007\/978-3-030-01234-2_1","DOI":"10.1007\/978-3-030-01234-2_1"},{"key":"9825_CR231","doi-asserted-by":"crossref","unstructured":"Wu J, Leng C, Wang Y, et al (2016) Quantized convolutional neural networks for mobile devices. In: Proceedings of the IEEE computer society conference on computer vision and pattern recognition","DOI":"10.1109\/CVPR.2016.521"},{"key":"9825_CR232","doi-asserted-by":"crossref","unstructured":"Xie S, Girshick R, Dollar P et al (2017) Aggregated residual transformations for deep neural networks. In: 2017 IEEE conference on computer vision and pattern recognition (CVPR). IEEE, pp 5987\u20135995","DOI":"10.1109\/CVPR.2017.634"},{"key":"9825_CR233","doi-asserted-by":"crossref","unstructured":"Xie W, Zhang C, Zhang Y et al (2018) An energy-efficient FPGA-based embedded system for CNN application. In: 2018 IEEE international conference on electron devices and solid state circuits (EDSSC). IEEE, pp 1\u20132","DOI":"10.1109\/EDSSC.2018.8487057"},{"key":"9825_CR234","unstructured":"Xiong Y, Kim HJ, Hedau V (2019) ANTNets: mobile convolutional neural networks for resource efficient image classification. arXiv:190403775"},{"key":"9825_CR235","doi-asserted-by":"publisher","first-page":"O22","DOI":"10.1186\/1757-1146-1-S1-O22","volume":"1","author":"B Xu","year":"2015","unstructured":"Xu B, Wang N, Chen T, Li M (2015a) Empirical evaluation of rectified activations in convolutional network. J Foot Ankle Res 1:O22. https:\/\/doi.org\/10.1186\/1757-1146-1-S1-O22","journal-title":"J Foot Ankle Res"},{"key":"9825_CR236","unstructured":"Xu K, Ba J, Kiros R et al (2015b) Show, attend and tell: neural image caption generation with visual attention. In: International conference on machine learning, pp 2048\u20132057"},{"key":"9825_CR237","unstructured":"Yamada Y, Iwamura M, Kise K (2016) Deep pyramidal residual networks with separated stochastic depth. Preprint arXiv:1612.01230"},{"key":"9825_CR238","doi-asserted-by":"publisher","first-page":"1","DOI":"10.1109\/TKDE.2009.191","volume":"1","author":"Q Yang","year":"2008","unstructured":"Yang Q, Pan SJ, Yang Q, Fellow QY (2008) A survey on transfer learning. IEEE Trans Knowl Data Eng 1:1\u201315. https:\/\/doi.org\/10.1109\/TKDE.2009.191","journal-title":"IEEE Trans Knowl Data Eng"},{"key":"9825_CR239","doi-asserted-by":"crossref","unstructured":"Yang S, Luo P, Loy C-C, Tang X (2015) From facial parts responses to face detection: a deep learning approach. In: Proceedings of the IEEE international conference on computer visio, pp 3676\u20133684","DOI":"10.1109\/ICCV.2015.419"},{"key":"9825_CR240","doi-asserted-by":"publisher","first-page":"224","DOI":"10.1016\/j.patcog.2018.08.017","volume":"86","author":"J Yang","year":"2019","unstructured":"Yang J, Xiong W, Li S, Xu C (2019) Learning structured and non-redundant representations with deep neural networks. Pattern Recognit 86:224\u2013235","journal-title":"Pattern Recognit"},{"key":"9825_CR241","doi-asserted-by":"publisher","DOI":"10.1016\/j.compbiomed.2018.09.009","author":"\u00d6 Y\u0131ld\u0131r\u0131m","year":"2018","unstructured":"Y\u0131ld\u0131r\u0131m \u00d6, P\u0142awiak P, Tan RS, Acharya UR (2018) Arrhythmia detection using deep convolutional neural network with long duration ECG signals. Comput Biol Med. https:\/\/doi.org\/10.1016\/j.compbiomed.2018.09.009","journal-title":"Comput Biol Med"},{"key":"9825_CR242","doi-asserted-by":"crossref","unstructured":"Young SR, Rose DC, Karnowski TP et al (2015) Optimizing deep learning hyper-parameters through an evolutionary algorithm. In: Proceedings of the workshop on machine learning in high-performance computing environments. ACM, p 4","DOI":"10.1145\/2834892.2834896"},{"issue":"1-87","key":"9825_CR243","doi-asserted-by":"publisher","first-page":"12","DOI":"10.5244\/C.30.87","volume":"87","author":"S Zagoruyko","year":"2016","unstructured":"Zagoruyko S, Komodakis N (2016) Wide residual networks. Proc Br Mach Vis Conf 87(1-87):12. https:\/\/doi.org\/10.5244\/C.30.87","journal-title":"Proc Br Mach Vis Conf"},{"key":"9825_CR244","doi-asserted-by":"publisher","unstructured":"Zeiler MD, Fergus R (2013) Visualizing and understanding convolutional networks. Preprint arXiv:1311.2901v3, vol 30, pp 225\u2013231. https:\/\/doi.org\/10.1111\/j.1475-4932.1954.tb03086.x","DOI":"10.1111\/j.1475-4932.1954.tb03086.x"},{"key":"9825_CR245","unstructured":"Zhang X, LeCun Y (2015) Text understanding from scratch. Preprint arXiv:1502.01710"},{"key":"9825_CR246","doi-asserted-by":"publisher","first-page":"1499","DOI":"10.1109\/LSP.2016.2603342","volume":"23","author":"K Zhang","year":"2016","unstructured":"Zhang K, Zhang Z, Li Z et al (2016) Joint face detection and alignment using multitask cascaded convolutional networks. IEEE Signal Process Lett 23:1499\u20131503","journal-title":"IEEE Signal Process Lett"},{"key":"9825_CR247","doi-asserted-by":"publisher","unstructured":"Zhang X, Li Z, Loy CC, Lin D (2017) PolyNet: a pursuit of structural diversity in very deep networks. In: Proceedings of 30th IEEE Conference on Computer Vision and Pattern Recognition, CVPR 2017, pp 3900\u20133908. https:\/\/doi.org\/10.1109\/cvpr.2017.415","DOI":"10.1109\/cvpr.2017.415"},{"key":"9825_CR248","doi-asserted-by":"crossref","unstructured":"Zhang X, Zhou X, Lin M, Sun J (2018a) ShuffleNet: an extremely efficient convolutional neural network for mobile devices. In: Proceedings of the IEEE computer society conference on computer vision and pattern recognition","DOI":"10.1109\/CVPR.2018.00716"},{"key":"9825_CR249","doi-asserted-by":"crossref","unstructured":"Zhang Y, Qiu Z, Yao T, et al (2018b) Fully convolutional adaptation networks for semantic segmentation. In: Proceedings of the IEEE computer society conference on computer vision and pattern recognition","DOI":"10.1109\/CVPR.2018.00712"},{"key":"9825_CR250","doi-asserted-by":"publisher","first-page":"37","DOI":"10.1016\/j.neucom.2018.09.038","volume":"323","author":"Q Zhang","year":"2019","unstructured":"Zhang Q, Zhang M, Chen T et al (2019) Recent advances in convolutional neural network acceleration. Neurocomputing 323:37\u201351. https:\/\/doi.org\/10.1016\/j.neucom.2018.09.038","journal-title":"Neurocomputing"},{"key":"9825_CR251","doi-asserted-by":"crossref","unstructured":"Zheng H, Fu J, Mei T, Luo J (2017) Learning multi-attention convolutional neural network for fine-grained image recognition. In: 2017 IEEE international conference on computer vision (ICCV), pp 5219\u20135227","DOI":"10.1109\/ICCV.2017.557"},{"key":"9825_CR252","doi-asserted-by":"crossref","unstructured":"Zhou B, Khosla A, Lapedriza A et al (2016) Learning deep features for discriminative localization. In: Proceedings of the IEEE conference on computer vision and pattern recognition, pp 2921\u20132929","DOI":"10.1109\/CVPR.2016.319"}],"container-title":["Artificial Intelligence Review"],"original-title":[],"language":"en","link":[{"URL":"https:\/\/link.springer.com\/content\/pdf\/10.1007\/s10462-020-09825-6.pdf","content-type":"application\/pdf","content-version":"vor","intended-application":"text-mining"},{"URL":"https:\/\/link.springer.com\/article\/10.1007\/s10462-020-09825-6\/fulltext.html","content-type":"text\/html","content-version":"vor","intended-application":"text-mining"},{"URL":"https:\/\/link.springer.com\/content\/pdf\/10.1007\/s10462-020-09825-6.pdf","content-type":"application\/pdf","content-version":"vor","intended-application":"similarity-checking"}],"deposited":{"date-parts":[[2023,9,30]],"date-time":"2023-09-30T04:52:48Z","timestamp":1696049568000},"score":1,"resource":{"primary":{"URL":"https:\/\/link.springer.com\/10.1007\/s10462-020-09825-6"}},"subtitle":[],"short-title":[],"issued":{"date-parts":[[2020,4,21]]},"references-count":252,"journal-issue":{"issue":"8","published-print":{"date-parts":[[2020,12]]}},"alternative-id":["9825"],"URL":"https:\/\/doi.org\/10.1007\/s10462-020-09825-6","relation":{},"ISSN":["0269-2821","1573-7462"],"issn-type":[{"value":"0269-2821","type":"print"},{"value":"1573-7462","type":"electronic"}],"subject":[],"published":{"date-parts":[[2020,4,21]]},"assertion":[{"value":"21 April 2020","order":1,"name":"first_online","label":"First Online","group":{"name":"ArticleHistory","label":"Article History"}}]}}