{"status":"ok","message-type":"work","message-version":"1.0.0","message":{"indexed":{"date-parts":[[2026,4,23]],"date-time":"2026-04-23T22:29:45Z","timestamp":1776983385083,"version":"3.51.4"},"reference-count":56,"publisher":"Springer Science and Business Media LLC","issue":"13","license":[{"start":{"date-parts":[[2021,1,4]],"date-time":"2021-01-04T00:00:00Z","timestamp":1609718400000},"content-version":"tdm","delay-in-days":0,"URL":"https:\/\/www.springer.com\/tdm"},{"start":{"date-parts":[[2021,1,4]],"date-time":"2021-01-04T00:00:00Z","timestamp":1609718400000},"content-version":"vor","delay-in-days":0,"URL":"https:\/\/www.springer.com\/tdm"}],"funder":[{"DOI":"10.13039\/100007065","name":"Nvidia","doi-asserted-by":"publisher","award":["GPU- 900-1G611-2500-000T"],"award-info":[{"award-number":["GPU- 900-1G611-2500-000T"]}],"id":[{"id":"10.13039\/100007065","id-type":"DOI","asserted-by":"publisher"}]}],"content-domain":{"domain":["link.springer.com"],"crossmark-restriction":false},"short-container-title":["Neural Comput &amp; Applic"],"published-print":{"date-parts":[[2021,7]]},"DOI":"10.1007\/s00521-020-05549-4","type":"journal-article","created":{"date-parts":[[2021,1,4]],"date-time":"2021-01-04T04:15:53Z","timestamp":1609733753000},"page":"8055-8065","update-policy":"https:\/\/doi.org\/10.1007\/springer_crossmark_policy","source":"Crossref","is-referenced-by-count":33,"title":["AutoFCL: automatically tuning fully connected layers for handling small dataset"],"prefix":"10.1007","volume":"33","author":[{"ORCID":"https:\/\/orcid.org\/0000-0002-8590-0897","authenticated-orcid":false,"given":"S. H. Shabbeer","family":"Basha","sequence":"first","affiliation":[],"role":[{"role":"author","vocabulary":"crossref"}]},{"given":"Sravan Kumar","family":"Vinakota","sequence":"additional","affiliation":[],"role":[{"role":"author","vocabulary":"crossref"}]},{"given":"Shiv Ram","family":"Dubey","sequence":"additional","affiliation":[],"role":[{"role":"author","vocabulary":"crossref"}]},{"given":"Viswanath","family":"Pulabaigari","sequence":"additional","affiliation":[],"role":[{"role":"author","vocabulary":"crossref"}]},{"given":"Snehasis","family":"Mukherjee","sequence":"additional","affiliation":[],"role":[{"role":"author","vocabulary":"crossref"}]}],"member":"297","published-online":{"date-parts":[[2021,1,4]]},"reference":[{"key":"5549_CR1","first-page":"1106","volume":"25","author":"GE Hinton","year":"2012","unstructured":"Hinton GE, Krizhevsky A, Sutskever I (2012) Imagenet classification with deep convolutional neural networks. Adv Neural Inf Process Syst 25:1106\u20131114","journal-title":"Adv Neural Inf Process Syst"},{"key":"5549_CR2","doi-asserted-by":"crossref","unstructured":"Szegedy C, Liu W, Jia Y, Sermanet P, Reed S, Anguelov D, Erhan D, Vanhoucke V, Rabinovich A (2015) Going deeper with convolutions. In: Proceedings of the IEEE conference on computer vision and pattern recognition, pp 1\u20139","DOI":"10.1109\/CVPR.2015.7298594"},{"issue":"6","key":"5549_CR3","doi-asserted-by":"publisher","first-page":"82","DOI":"10.1109\/MSP.2012.2205597","volume":"29","author":"G Hinton","year":"2012","unstructured":"Hinton G, Deng L, Yu D, Dahl G, Mohamed A-r, Jaitly N, Senior A, Vanhoucke V, Nguyen P, Sainath T, Kingsbury B (2012) Deep neural networks for acoustic modeling in speech recognition: the shared views of four research groups. IEEE Signal Process Mag 29(6):82\u201397","journal-title":"IEEE Signal Process Mag"},{"issue":"4","key":"5549_CR4","doi-asserted-by":"publisher","first-page":"278","DOI":"10.1109\/TETCI.2018.2829981","volume":"2","author":"M Wang","year":"2018","unstructured":"Wang M, Abdelfattah S, Moustafa N, Hu J (2018) Deep gaussian mixture-hidden markov model for classification of eeg signals. IEEE Trans Emerg Top Comput Intell 2(4):278\u2013287","journal-title":"IEEE Trans Emerg Top Comput Intell"},{"key":"5549_CR5","doi-asserted-by":"crossref","unstructured":"Zoph B, Vasudevan V, Shlens J, Le QV (2018) Learning transferable architectures for scalable image recognition. In: Proceedings of the IEEE conference on computer vision and pattern recognition, pp 8697\u20138710","DOI":"10.1109\/CVPR.2018.00907"},{"key":"5549_CR6","doi-asserted-by":"crossref","unstructured":"Liu C, Zoph B, Neumann M, Shlens J, Hua W, Li L-J, Fei-Fei L, Yuille A, Huang J, Murphy K (2018) Progressive neural architecture search. In: Proceedings of the European conference on computer vision (ECCV), pp 19\u201334","DOI":"10.1007\/978-3-030-01246-5_2"},{"key":"5549_CR7","doi-asserted-by":"crossref","unstructured":"Elsken T, Metzen JH, Hutter F (2018) Neural architecture search: a survey. arXiv preprint arXiv:1808.05377","DOI":"10.1007\/978-3-030-05318-5_3"},{"key":"5549_CR8","doi-asserted-by":"publisher","first-page":"57","DOI":"10.1016\/j.imavis.2019.06.005","volume":"89","author":"Y Jaafra","year":"2019","unstructured":"Jaafra Y, Laurent JL, Deruyver A, Naceur MS (2019) Reinforcement learning for neural architecture search: a review. Image Vis Comput 89:57\u201366","journal-title":"Image Vis Comput"},{"key":"5549_CR9","doi-asserted-by":"publisher","first-page":"112","DOI":"10.1016\/j.neucom.2019.10.008","volume":"378","author":"SHS Basha","year":"2019","unstructured":"Basha SHS, Dubey SR, Pulabaigari V, Mukherjee S (2019) Impact of fully connected layers on performance of convolutional neural networks for image classification. Neurocomputing 378:112\u2013119","journal-title":"Neurocomputing"},{"key":"5549_CR10","doi-asserted-by":"crossref","unstructured":"Deng J, Dong W, Socher R, Li L-J, Li K, Fei-Fei L (2009) Imagenet: A large-scale hierarchical image database. In: Computer vision and pattern recognition (CVPR) 2009. IEEE Conference on IEEE, pp 248\u2013255","DOI":"10.1109\/CVPR.2009.5206848"},{"key":"5549_CR11","doi-asserted-by":"crossref","unstructured":"Zeiler MD, and Fergus R (2014) Visualizing and understanding convolutional networks. In: European conference on computer vision, Springer, pp 818\u2013833","DOI":"10.1007\/978-3-319-10590-1_53"},{"key":"5549_CR12","unstructured":"Simonyan K, Zisserman A (2014) Very deep convolutional networks for large-scale image recognition. arXiv preprint arXiv:1409.1556"},{"key":"5549_CR13","doi-asserted-by":"crossref","unstructured":"He K, Zhang X, Ren S, Sun J (2016) Deep residual learning for image recognition. In: Proceedings of the IEEE conference on computer vision and pattern recognition, pp 770\u2013778","DOI":"10.1109\/CVPR.2016.90"},{"key":"5549_CR14","doi-asserted-by":"crossref","unstructured":"Huang G, Liu Z, Van Der Maaten L, Weinberger KQ (2017) Densely connected convolutional networks. In: Proceedings of the IEEE conference on computer vision and pattern recognition, pp 4700\u20134708","DOI":"10.1109\/CVPR.2017.243"},{"key":"5549_CR15","doi-asserted-by":"publisher","first-page":"69","DOI":"10.1016\/j.neucom.2018.03.080","volume":"328","author":"Q Xu","year":"2019","unstructured":"Xu Q, Zhang M, Gu Z, Pan G (2019) Overfitting remedy by sparsifying regularization on fully-connected layers of cnns. Neurocomputing 328:69\u201374","journal-title":"Neurocomputing"},{"key":"5549_CR16","unstructured":"Mendoza H, Klein A, Feurer M, Springenberg JT, Hutter F (2016) Towards automatically-tuned neural networks. In: Workshop on automatic machine learning, pp 58\u201365"},{"key":"5549_CR17","doi-asserted-by":"crossref","unstructured":"Szegedy C, Vanhoucke V, Ioffe S, Shlens J, Wojna Z (2016) Rethinking the inception architecture for computer vision. In: Proceedings of the IEEE conference on computer vision and pattern recognition, pp 2818\u20132826","DOI":"10.1109\/CVPR.2016.308"},{"key":"5549_CR18","unstructured":"Howard AG, Zhu M, Chen B, Kalenichenko D, Wang W, Weyand T, Andreetto M, Adam H (2017) Mobilenets: efficient convolutional neural networks for mobile vision applications. arXiv preprint arXiv:1704.04861"},{"key":"5549_CR19","doi-asserted-by":"crossref","unstructured":"Ng H-W, Nguyen VD, Vonikakis V, Winkler S (2015) Deep learning for emotion recognition on small datasets using transfer learning. In: Proceedings of the 2015 ACM on international conference on multimodal interaction. ACM, pp 443\u2013449","DOI":"10.1145\/2818346.2830593"},{"key":"5549_CR20","unstructured":"Frazier PI (2018) A tutorial on bayesian optimization. arXiv preprint arXiv:1807.02811"},{"issue":"3","key":"5549_CR21","doi-asserted-by":"publisher","first-page":"211","DOI":"10.1007\/s11263-015-0816-y","volume":"115","author":"O Russakovsky","year":"2015","unstructured":"Russakovsky O, Deng J, Su H, Krause J, Satheesh S, Ma S, Huang Z, Karpathy A, Khosla A, Bernstein M, Berg AC, Fei-Fei L (2015) ImageNet large scale visual recognition challenge. Int J Comput Vis (IJCV) 115(3):211\u2013252","journal-title":"Int J Comput Vis (IJCV)"},{"key":"5549_CR22","doi-asserted-by":"publisher","first-page":"103853","DOI":"10.1016\/j.imavis.2019.103853","volume":"93","author":"X Li","year":"2020","unstructured":"Li X, Grandvalet Y, Davoine F, Cheng J, Cui Y, Zhang H, Belongie S, Tsai Y-H, Yang M-H (2020) Transfer learning in computer vision tasks: remember where you come from. Image Vis Comput 93:103853","journal-title":"Image Vis Comput"},{"key":"5549_CR23","doi-asserted-by":"publisher","first-page":"48","DOI":"10.1016\/j.imavis.2016.08.007","volume":"60","author":"J Hu","year":"2017","unstructured":"Hu J (2017) Discriminative transfer learning with sparsity regularization for single-sample face recognition. Image Vis Comput 60:48\u201357","journal-title":"Image Vis Comput"},{"key":"5549_CR24","doi-asserted-by":"publisher","first-page":"43","DOI":"10.1016\/j.eswa.2017.11.028","volume":"95","author":"D Han","year":"2018","unstructured":"Han D, Liu Q, Fan W (2018) A new image classification method using cnn transfer learning and web data augmentation. Expert Syst Appl 95:43\u201356","journal-title":"Expert Syst Appl"},{"issue":"Jul","key":"5549_CR25","first-page":"2121","volume":"12","author":"J Duchi","year":"2011","unstructured":"Duchi J, Hazan E, Singer Y (2011) Adaptive subgradient methods for online learning and stochastic optimization. J Mach Learn Res 12(Jul):2121\u20132159","journal-title":"J Mach Learn Res"},{"key":"5549_CR26","unstructured":"Kingma DP, Ba J (2014) Adam: a method for stochastic optimization. arXiv preprint arXiv:1412.6980"},{"key":"5549_CR27","unstructured":"Wistuba M (2017) Bayesian optimization combined with successive halving for neural network architecture optimization. In: AutoML@ PKDD\/ECML , pp 2\u201311"},{"issue":"5","key":"5549_CR28","doi-asserted-by":"publisher","first-page":"380","DOI":"10.1109\/TETCI.2018.2868326","volume":"3","author":"D Ji","year":"2019","unstructured":"Ji D, Jiang Y, Qian P, Wang S (2019) A novel doubly reweighting multisource transfer learning framework. IEEE Trans Emerg Top Comput Intell 3(5):380\u2013391","journal-title":"IEEE Trans Emerg Top Comput Intell"},{"issue":"1","key":"5549_CR29","doi-asserted-by":"publisher","first-page":"51","DOI":"10.1109\/TETCI.2017.2769104","volume":"2","author":"A Gupta","year":"2017","unstructured":"Gupta A, Ong Y-S, Feng L (2017) Insights on transfer optimization: because experience is the best teacher. IEEE Trans Emerg Top Comput Intell 2(1):51\u201364","journal-title":"IEEE Trans Emerg Top Comput Intell"},{"key":"5549_CR30","unstructured":"Yosinski J, Clune J, Bengio Y, Lipson H (2014) How transferable are features in deep neural networks?. In: Advances in neural information processing systems, pp 3320\u20133328"},{"key":"5549_CR31","doi-asserted-by":"crossref","unstructured":"Xie M, Jean N, Burke M, Lobell D, Ermon S (2016) Transfer learning from deep features for remote sensing and poverty mapping. In: 13th AAAI conference on artificial intelligence","DOI":"10.1609\/aaai.v30i1.9906"},{"key":"5549_CR32","unstructured":"Molchanov P, Tyree S, Karras T, Aila T, Kautz J (2016) Pruning convolutional neural networks for resource efficient transfer learning, vol 3. arXiv preprint arXiv:1611.06440"},{"key":"5549_CR33","unstructured":"Snoek J, Larochelle H, Adams RP (2012) Practical Bayesian optimization of machine learning algorithms. In: Advances in neural information processing systems, pp 2951\u20132959"},{"key":"5549_CR34","volume-title":"Gaussian processes for machine learning","author":"CK Williams","year":"2006","unstructured":"Williams CK, Rasmussen CE (2006) Gaussian processes for machine learning, vol 2. MIT press, Cambridge, MA"},{"key":"5549_CR35","first-page":"63","volume-title":"Summer school on machine learning","author":"CE Rasmussen","year":"2003","unstructured":"Rasmussen CE (2003) Gaussian processes in machine learning. In: Summer school on machine learning. Springer, Berlin, Heidelberg, pp 63\u201371"},{"issue":"4","key":"5549_CR36","doi-asserted-by":"publisher","first-page":"455","DOI":"10.1023\/A:1008306431147","volume":"13","author":"DR Jones","year":"1998","unstructured":"Jones DR, Schonlau M, Welch WJ (1998) Efficient global optimization of expensive black-box functions. J Glob Optim 13(4):455\u2013492","journal-title":"J Glob Optim"},{"key":"5549_CR37","unstructured":"Ioffe S, Szegedy C (2015) Batch normalization: accelerating deep network training by reducing internal covariate shift. arXiv preprint arXiv:1502.03167"},{"key":"5549_CR38","doi-asserted-by":"crossref","unstructured":"He K, Zhang X, Ren S, Sun J (2015) Delving deep into rectifiers: surpassing human-level performance on imagenet classification. In: Proceedings of the IEEE international conference on computer vision, pp 1026\u20131034","DOI":"10.1109\/ICCV.2015.123"},{"issue":"10","key":"5549_CR39","doi-asserted-by":"publisher","first-page":"947","DOI":"10.2514\/8.5282","volume":"30","author":"HJ Kelley","year":"1960","unstructured":"Kelley HJ (1960) Gradient theory of optimal flight paths. Ars J 30(10):947\u2013954","journal-title":"Ars J"},{"issue":"4","key":"5549_CR40","doi-asserted-by":"publisher","first-page":"594","DOI":"10.1109\/TPAMI.2006.79","volume":"28","author":"L Fei-Fei","year":"2006","unstructured":"Fei-Fei L, Fergus R, Perona P (2006) One-shot learning of object categories. IEEE Trans Pattern Anal Mach Intell 28(4):594\u2013611","journal-title":"IEEE Trans Pattern Anal Mach Intell"},{"key":"5549_CR41","doi-asserted-by":"crossref","unstructured":"Nilsback M-E, Zisserman A (2008) Automated flower classification over a large number of classes. In: Proceedings of the Indian conference on computer vision, graphics and image processing, Dec","DOI":"10.1109\/ICVGIP.2008.47"},{"key":"5549_CR42","doi-asserted-by":"crossref","unstructured":"Yang Y, Newsam S (2010) Bag-of-visual-words and spatial extensions for land-use classification. In: Proceedings of the 18th SIGSPATIAL international conference on advances in geographic information systems. ACM, pp 270\u2013279","DOI":"10.1145\/1869790.1869829"},{"key":"5549_CR43","doi-asserted-by":"crossref","unstructured":"Lee H, Grosse R, Ranganath R, Ng AY (2009) Convolutional deep belief networks for scalable unsupervised learning of hierarchical representations. In: Proceedings of the 26th annual international conference on machine learning. ACM, pp 609\u2013616","DOI":"10.1145\/1553374.1553453"},{"key":"5549_CR44","doi-asserted-by":"crossref","unstructured":"Cubuk ED, Zoph B, Mane D, Vasudevan V, and Le QV (2019) Autoaugment: learning augmentation strategies from data. In: Proceedings of the IEEE conference on computer vision and pattern recognition, pp 113\u2013123","DOI":"10.1109\/CVPR.2019.00020"},{"issue":"1","key":"5549_CR45","doi-asserted-by":"publisher","first-page":"128","DOI":"10.3390\/app9010128","volume":"9","author":"Y Sawada","year":"2019","unstructured":"Sawada Y, Sato Y, Nakada T, Yamaguchi S, Ujimoto K, Hayashi N (2019) Improvement in classification performance based on target vector modification for all-transfer deep learning. Appl Sci 9(1):128","journal-title":"Appl Sci"},{"key":"5549_CR46","doi-asserted-by":"crossref","unstructured":"Huang B, Hu Y, Sun Y, Hao X, Yan C (2018) A flower classification framework based on ensemble of CNNS. In: Pacific Rim Conference on Multimedia, Springer, pp 235\u2013244","DOI":"10.1007\/978-3-030-00764-5_22"},{"key":"5549_CR47","doi-asserted-by":"publisher","first-page":"97","DOI":"10.1016\/j.patrec.2017.09.026","volume":"109","author":"X Lv","year":"2018","unstructured":"Lv X, Duan F (2018) Metric learning via feature weighting for scalable image retrieval. Pattern Recognit Lett 109:97\u2013102","journal-title":"Pattern Recognit Lett"},{"key":"5549_CR48","doi-asserted-by":"publisher","first-page":"67","DOI":"10.1016\/j.cviu.2018.03.005","volume":"172","author":"F Murabito","year":"2018","unstructured":"Murabito F, Spampinato C, Palazzo S, Giordano D, Pogorelov K, Riegler M (2018) Top-down saliency detection driven by visual classification. Comput Vis Image Underst 172:67\u201376","journal-title":"Comput Vis Image Underst"},{"key":"5549_CR49","doi-asserted-by":"publisher","DOI":"10.1109\/TPAMI.2018.2885764","author":"M Simon","year":"2018","unstructured":"Simon M, Rodner E, Darrell T, Denzler J (2018) The whole is more than its parts? From explicit to implicit pose normalization. IEEE Trans Pattern Anal Mach Intell. https:\/\/doi.org\/10.1109\/TPAMI.2018.2885764","journal-title":"IEEE Trans Pattern Anal Mach Intell"},{"key":"5549_CR50","doi-asserted-by":"crossref","unstructured":"Karlinsky L, Shtok J, Harary S, Schwartz E, Aides A, Feris R, Giryes R, Bronstein AM (2019) Repmet: representative-based metric learning for classification and few-shot object detection. In: Proceedings of the IEEE conference on computer vision and pattern recognition, pp 5197\u20135206","DOI":"10.1109\/CVPR.2019.00534"},{"key":"5549_CR51","doi-asserted-by":"crossref","unstructured":"Shao W, Yang W, Xia G-S, Liu G (2013) A hierarchical scheme of multiple feature fusion for high-resolution satellite scene categorization. In: International conference on computer vision systems, Springer, pp 324\u2013333","DOI":"10.1007\/978-3-642-39402-7_33"},{"key":"5549_CR52","doi-asserted-by":"crossref","unstructured":"Yang MY, Al-Shaikhli S, Jiang T, Cao Y, Rosenhahn B (2016) Bi-layer dictionary learning for remote sensing image classification. In: IEEE International geoscience and remote sensing symposium (IGARSS), pp 3059\u20133062","DOI":"10.1109\/IGARSS.2016.7729791"},{"key":"5549_CR53","doi-asserted-by":"publisher","first-page":"199","DOI":"10.1016\/j.ins.2018.07.074","volume":"467","author":"T Akram","year":"2018","unstructured":"Akram T, Laurent B, Naqvi SR, Alex MM, Muhammad N et al (2018) A deep heterogeneous feature fusion approach for automatic land-use classification. Inf Sci 467:199\u2013218","journal-title":"Inf Sci"},{"issue":"6","key":"5549_CR54","doi-asserted-by":"publisher","first-page":"1130","DOI":"10.3390\/app9061130","volume":"9","author":"EK Wang","year":"2019","unstructured":"Wang EK, Li Y, Nie Z, Yu J, Liang Z, Zhang X, Yiu SM (2019) Deep fusion feature based object detection method for high resolution optical remote sensing images. Appl Sci 9(6):1130","journal-title":"Appl Sci"},{"issue":"11","key":"5549_CR55","doi-asserted-by":"publisher","first-page":"2278","DOI":"10.1109\/5.726791","volume":"86","author":"Y LeCun","year":"1998","unstructured":"LeCun Y, Bottou L, Bengio Y, Haffner P et al (1998) Gradient-based learning applied to document recognition. Proc IEEE 86(11):2278\u20132324","journal-title":"Proc IEEE"},{"key":"5549_CR56","unstructured":"Krizhevsky A, Hinton G (2009) Learning multiple layers of features from tiny images"}],"container-title":["Neural Computing and Applications"],"original-title":[],"language":"en","link":[{"URL":"https:\/\/link.springer.com\/content\/pdf\/10.1007\/s00521-020-05549-4.pdf","content-type":"application\/pdf","content-version":"vor","intended-application":"text-mining"},{"URL":"https:\/\/link.springer.com\/article\/10.1007\/s00521-020-05549-4\/fulltext.html","content-type":"text\/html","content-version":"vor","intended-application":"text-mining"},{"URL":"https:\/\/link.springer.com\/content\/pdf\/10.1007\/s00521-020-05549-4.pdf","content-type":"application\/pdf","content-version":"vor","intended-application":"similarity-checking"}],"deposited":{"date-parts":[[2022,12,10]],"date-time":"2022-12-10T09:19:49Z","timestamp":1670663989000},"score":1,"resource":{"primary":{"URL":"https:\/\/link.springer.com\/10.1007\/s00521-020-05549-4"}},"subtitle":[],"short-title":[],"issued":{"date-parts":[[2021,1,4]]},"references-count":56,"journal-issue":{"issue":"13","published-print":{"date-parts":[[2021,7]]}},"alternative-id":["5549"],"URL":"https:\/\/doi.org\/10.1007\/s00521-020-05549-4","relation":{},"ISSN":["0941-0643","1433-3058"],"issn-type":[{"value":"0941-0643","type":"print"},{"value":"1433-3058","type":"electronic"}],"subject":[],"published":{"date-parts":[[2021,1,4]]},"assertion":[{"value":"2 April 2020","order":1,"name":"received","label":"Received","group":{"name":"ArticleHistory","label":"Article History"}},{"value":"18 November 2020","order":2,"name":"accepted","label":"Accepted","group":{"name":"ArticleHistory","label":"Article History"}},{"value":"4 January 2021","order":3,"name":"first_online","label":"First Online","group":{"name":"ArticleHistory","label":"Article History"}},{"order":1,"name":"Ethics","group":{"name":"EthicsHeading","label":"Compliance with ethical standards"}},{"value":"The authors declare that they have no conflict of interest.","order":2,"name":"Ethics","group":{"name":"EthicsHeading","label":"Conflict of interest"}}]}}