{"status":"ok","message-type":"work","message-version":"1.0.0","message":{"indexed":{"date-parts":[[2025,10,8]],"date-time":"2025-10-08T16:29:37Z","timestamp":1759940977355,"version":"3.37.3"},"reference-count":52,"publisher":"Springer Science and Business Media LLC","issue":"2","license":[{"start":{"date-parts":[[2024,3,14]],"date-time":"2024-03-14T00:00:00Z","timestamp":1710374400000},"content-version":"tdm","delay-in-days":0,"URL":"https:\/\/www.springernature.com\/gp\/researchers\/text-and-data-mining"},{"start":{"date-parts":[[2024,3,14]],"date-time":"2024-03-14T00:00:00Z","timestamp":1710374400000},"content-version":"vor","delay-in-days":0,"URL":"https:\/\/www.springernature.com\/gp\/researchers\/text-and-data-mining"}],"funder":[{"DOI":"10.13039\/100007065","name":"NVidia","doi-asserted-by":"crossref","id":[{"id":"10.13039\/100007065","id-type":"DOI","asserted-by":"crossref"}]}],"content-domain":{"domain":["link.springer.com"],"crossmark-restriction":false},"short-container-title":["Multimedia Systems"],"published-print":{"date-parts":[[2024,4]]},"DOI":"10.1007\/s00530-024-01271-6","type":"journal-article","created":{"date-parts":[[2024,3,14]],"date-time":"2024-03-14T17:02:03Z","timestamp":1710435723000},"update-policy":"https:\/\/doi.org\/10.1007\/springer_crossmark_policy","source":"Crossref","is-referenced-by-count":4,"title":["Target aware network architecture search and compression for efficient knowledge transfer"],"prefix":"10.1007","volume":"30","author":[{"given":"S. H. Shabbeer","family":"Basha","sequence":"first","affiliation":[],"role":[{"role":"author","vocabulary":"crossref"}]},{"given":"Debapriya","family":"Tula","sequence":"additional","affiliation":[],"role":[{"role":"author","vocabulary":"crossref"}]},{"given":"Sravan Kumar","family":"Vinakota","sequence":"additional","affiliation":[],"role":[{"role":"author","vocabulary":"crossref"}]},{"given":"Shiv Ram","family":"Dubey","sequence":"additional","affiliation":[],"role":[{"role":"author","vocabulary":"crossref"}]}],"member":"297","published-online":{"date-parts":[[2024,3,14]]},"reference":[{"issue":"7553","key":"1271_CR1","doi-asserted-by":"publisher","first-page":"436","DOI":"10.1038\/nature14539","volume":"521","author":"Y LeCun","year":"2015","unstructured":"LeCun, Y., Bengio, Y., Hinton, G.: Deep learning. Nature 521(7553), 436\u2013444 (2015)","journal-title":"Nature"},{"key":"1271_CR2","doi-asserted-by":"crossref","unstructured":"Szegedy, C., Vanhoucke, V., Ioffe, S., Shlens, J., Wojna, Z.: Rethinking the inception architecture for computer vision. In: Proceedings of the IEEE Conference on Computer Vision and Pattern Recognition, pp. 2818\u20132826 (2016)","DOI":"10.1109\/CVPR.2016.308"},{"key":"1271_CR3","doi-asserted-by":"crossref","unstructured":"He, K., Zhang, X., Ren, S., Sun, J.: Deep residual learning for image recognition. In: Proceedings of the IEEE Conference on Computer Vision and Pattern Recognition, pp. 770\u2013778 (2016)","DOI":"10.1109\/CVPR.2016.90"},{"issue":"55","key":"1271_CR4","first-page":"1","volume":"20","author":"T Elsken","year":"2019","unstructured":"Elsken, T., Metzen, J.H., Hutter, F.: Neural architecture search: a survey. J. Mach. Learn. Res. 20(55), 1\u201321 (2019)","journal-title":"J. Mach. Learn. Res."},{"key":"1271_CR5","doi-asserted-by":"crossref","unstructured":"Deng, J., Dong, W., Socher, R., Li, L.-J., Li, K., Fei-Fei, L.: Imagenet: A large-scale hierarchical image database. In: IEEE Conference on Computer Vision and Pattern Recognition, 2009. CVPR 2009. pp. 248\u2013255. IEEE (2009)","DOI":"10.1109\/CVPR.2009.5206848"},{"key":"1271_CR6","unstructured":"Krizhevsky, A., Hinton, G., et al.: Learning multiple layers of features from tiny images (2009)"},{"issue":"10","key":"1271_CR7","doi-asserted-by":"publisher","first-page":"6469","DOI":"10.1007\/s00521-018-3468-3","volume":"31","author":"Z Yang","year":"2019","unstructured":"Yang, Z., Yu, W., Liang, P., Guo, H., Xia, L., Zhang, F., Ma, Y., Ma, J.: Deep transfer learning for military object recognition under small training set condition. Neural Comput. Appl. 31(10), 6469\u20136478 (2019)","journal-title":"Neural Comput. Appl."},{"key":"1271_CR8","unstructured":"Frazier, P.I.: A tutorial on bayesian optimization. arXiv preprint arXiv:1807.02811 (2018)"},{"issue":"5","key":"1271_CR9","doi-asserted-by":"publisher","first-page":"1285","DOI":"10.1109\/TMI.2016.2528162","volume":"35","author":"H-C Shin","year":"2016","unstructured":"Shin, H.-C., Roth, H.R., Gao, M., Lu, L., Xu, Z., Nogues, I., Yao, J., Mollura, D., Summers, R.M.: Deep convolutional neural networks for computer-aided detection: Cnn architectures, dataset characteristics and transfer learning. IEEE Trans. Med. Imaging 35(5), 1285\u20131298 (2016)","journal-title":"IEEE Trans. Med. Imaging"},{"key":"1271_CR10","doi-asserted-by":"publisher","first-page":"202","DOI":"10.1016\/j.neunet.2020.01.017","volume":"124","author":"S Raghu","year":"2020","unstructured":"Raghu, S., Sriraam, N., Temel, Y., Rao, S.V., Kubben, P.L.: Eeg based multi-class seizure type classification using convolutional neural network and transfer learning. Neural Netw. 124, 202\u2013212 (2020)","journal-title":"Neural Netw."},{"key":"1271_CR11","doi-asserted-by":"publisher","first-page":"70","DOI":"10.1016\/j.compag.2018.02.016","volume":"147","author":"A Kamilaris","year":"2018","unstructured":"Kamilaris, A., Prenafeta-Bold\u00fa, F.X.: Deep learning in agriculture: a survey. Comput. Electron. Agric. 147, 70\u201390 (2018)","journal-title":"Comput. Electron. Agric."},{"issue":"1","key":"1271_CR12","doi-asserted-by":"publisher","first-page":"571","DOI":"10.1007\/s10489-020-01826-w","volume":"51","author":"S Ahuja","year":"2021","unstructured":"Ahuja, S., Panigrahi, B.K., Dey, N., Rajinikanth, V., Gandhi, T.K.: Deep transfer learning-based automated detection of COVID-19 from lung CT scan slices. Appl. Intell. 51(1), 571\u2013585 (2021)","journal-title":"Appl. Intell."},{"key":"1271_CR13","unstructured":"Molchanov, P., Tyree, S., Karras, T., Aila, T., Kautz, J.: Pruning convolutional neural networks for resource efficient transfer learning. arXiv preprint arXiv:1611.064403 (2016)"},{"key":"1271_CR14","doi-asserted-by":"publisher","first-page":"43","DOI":"10.1016\/j.eswa.2017.11.028","volume":"95","author":"D Han","year":"2018","unstructured":"Han, D., Liu, Q., Fan, W.: A new image classification method using cnn transfer learning and web data augmentation. Expert Syst. Appl. 95, 43\u201356 (2018)","journal-title":"Expert Syst. Appl."},{"key":"1271_CR15","unstructured":"Yosinski, J., Clune, J., Bengio, Y., Lipson, H.: How transferable are features in deep neural networks? In: Advances in Neural Information Processing Systems, pp. 3320\u20133328 (2014)"},{"key":"1271_CR16","unstructured":"Bergstra, J.S., Bardenet, R., Bengio, Y., K\u00e9gl, B.: Algorithms for hyper-parameter optimization. In: Advances in Neural Information Processing Systems, pp. 2546\u20132554 (2011)"},{"key":"1271_CR17","unstructured":"Snoek, J., Larochelle, H., Adams, R.P.: Practical bayesian optimization of machine learning algorithms. In: Advances in Neural Information Processing Systems, pp. 2951\u20132959 (2012)"},{"key":"1271_CR18","unstructured":"Zoph, B., Le, Q.V.: Neural architecture search with reinforcement learning. arXiv preprint arXiv:1611.01578 (2016)"},{"key":"1271_CR19","doi-asserted-by":"crossref","unstructured":"Zoph, B., Vasudevan, V., Shlens, J., Le, Q.V.: Learning transferable architectures for scalable image recognition. In: Proceedings of the IEEE Conference on Computer Vision and Pattern Recognition, pp. 8697\u20138710 (2018)","DOI":"10.1109\/CVPR.2018.00907"},{"key":"1271_CR20","doi-asserted-by":"publisher","first-page":"305","DOI":"10.1016\/j.neunet.2019.12.005","volume":"123","author":"J Jiang","year":"2020","unstructured":"Jiang, J., Han, F., Ling, Q., Wang, J., Li, T., Han, H.: Efficient network architecture search via multiobjective particle swarm optimization based on decomposition. Neural Netw. 123, 305\u2013316 (2020)","journal-title":"Neural Netw."},{"key":"1271_CR21","unstructured":"Chen, W., Wilson, J., Tyree, S., Weinberger, K., Chen, Y.: Compressing neural networks with the hashing trick. In: International Conference on Machine Learning, pp. 2285\u20132294 (2015)"},{"key":"1271_CR22","unstructured":"Han, S., Mao, H., Dally, W.J.: Deep compression: Compressing deep neural networks with pruning, trained quantization and huffman coding. arXiv preprint arXiv:1510.00149 (2015)"},{"key":"1271_CR23","doi-asserted-by":"crossref","unstructured":"Rastegari, M., Ordonez, V., Redmon, J., Farhadi, A.: Xnor-net: Imagenet classification using binary convolutional neural networks. In: European Conference on Computer Vision, pp. 525\u2013542. Springer (2016)","DOI":"10.1007\/978-3-319-46493-0_32"},{"key":"1271_CR24","unstructured":"Polino, A., Pascanu, R., Alistarh, D.: Model compression via distillation and quantization. arXiv preprint arXiv:1802.05668 (2018)"},{"key":"1271_CR25","doi-asserted-by":"crossref","unstructured":"Singh, P., Verma, V.K., Rai, P., Namboodiri, V.: Leveraging filter correlations for deep model compression. In: The IEEE Winter Conference on Applications of Computer Vision, pp. 835\u2013844 (2020)","DOI":"10.1109\/WACV45572.2020.9093331"},{"key":"1271_CR26","doi-asserted-by":"crossref","unstructured":"Lin, M., Ji, R., Wang, Y., Zhang, Y., Zhang, B., Tian, Y., Shao, L.: Hrank: Filter pruning using high-rank feature map. In: Proceedings of the IEEE\/CVF Conference on Computer Vision and Pattern Recognition, pp. 1529\u20131538 (2020)","DOI":"10.1109\/CVPR42600.2020.00160"},{"issue":"10","key":"1271_CR27","doi-asserted-by":"publisher","first-page":"7016","DOI":"10.1007\/s10489-020-01968-x","volume":"51","author":"Y Fan","year":"2021","unstructured":"Fan, Y., Pang, W., Lu, S.: Hfpq: deep neural network compression by hardware-friendly pruning-quantization. Appl. Intell. 51(10), 7016\u20137028 (2021)","journal-title":"Appl. Intell."},{"key":"1271_CR28","unstructured":"Li, H., Kadav, A., Durdanovic, I., Samet, H., Graf, H.P.: Pruning filters for efficient convnets. arXiv preprint arXiv:1608.08710 (2016)"},{"issue":"1","key":"1271_CR29","doi-asserted-by":"publisher","first-page":"9","DOI":"10.1186\/s40537-016-0043-6","volume":"3","author":"K Weiss","year":"2016","unstructured":"Weiss, K., Khoshgoftaar, T.M., Wang, D.: A survey of transfer learning. J. Big data 3(1), 9 (2016)","journal-title":"J. Big data"},{"issue":"13","key":"1271_CR30","doi-asserted-by":"publisher","first-page":"8055","DOI":"10.1007\/s00521-020-05549-4","volume":"33","author":"SS Basha","year":"2021","unstructured":"Basha, S.S., Vinakota, S.K., Dubey, S.R., Pulabaigari, V., Mukherjee, S.: Autofcl: automatically tuning fully connected layers for handling small dataset. Neural Comput. Appl. 33(13), 8055\u201365 (2021)","journal-title":"Neural Comput. Appl."},{"key":"1271_CR31","doi-asserted-by":"publisher","first-page":"112","DOI":"10.1016\/j.neunet.2020.10.009","volume":"133","author":"SS Basha","year":"2021","unstructured":"Basha, S.S., Vinakota, S.K., Pulabaigari, V., Mukherjee, S., Dubey, S.R.: Autotune: Automatically tuning convolutional neural networks for improved transfer learning. Neural Netw. 133, 112\u2013122 (2021)","journal-title":"Neural Netw."},{"key":"1271_CR32","doi-asserted-by":"crossref","unstructured":"Rasmussen, C.E.: Gaussian processes in machine learning. In: Summer School on Machine Learning, pp. 63\u201371. Springer (2003)","DOI":"10.1007\/978-3-540-28650-9_4"},{"key":"1271_CR33","unstructured":"Basha, S., Farazuddin, M., Pulabaigari, V., Dubey, S.R., Mukherjee, S.: Deep model compression based on the training history. arXiv preprint arXiv:2102.00160 (2021)"},{"key":"1271_CR34","unstructured":"Phan, T.H., Yamamoto, K.: Resolving class imbalance in object detection with weighted cross entropy losses. arXiv preprint arXiv:2006.01413 (2020)"},{"key":"1271_CR35","unstructured":"Simonyan, K., Zisserman, A.: Very deep convolutional networks for large-scale image recognition. arXiv preprint arXiv:1409.1556 (2014)"},{"key":"1271_CR36","doi-asserted-by":"crossref","unstructured":"Huang, G., Liu, Z., Van Der\u00a0Maaten, L., Weinberger, K.Q.: Densely connected convolutional networks. In: Proceedings of the IEEE Conference on Computer Vision and Pattern Recognition, pp. 4700\u20134708 (2017)","DOI":"10.1109\/CVPR.2017.243"},{"issue":"11","key":"1271_CR37","doi-asserted-by":"publisher","first-page":"2278","DOI":"10.1109\/5.726791","volume":"86","author":"Y LeCun","year":"1998","unstructured":"LeCun, Y., Bottou, L., Bengio, Y., Haffner, P.: Gradient-based learning applied to document recognition. Proc. IEEE 86(11), 2278\u20132324 (1998)","journal-title":"Proc. IEEE"},{"key":"1271_CR38","unstructured":"Krizhevsky, A., Sutskever, I., Hinton, G.E.: Imagenet classification with deep convolutional neural networks. In: Advances in Neural Information Processing Systems, pp. 1097\u20131105 (2012)"},{"issue":"1","key":"1271_CR39","first-page":"1929","volume":"15","author":"N Srivastava","year":"2014","unstructured":"Srivastava, N., Hinton, G., Krizhevsky, A., Sutskever, I., Salakhutdinov, R.: Dropout: a simple way to prevent neural networks from overfitting. J. Mach. Learn. Res. 15(1), 1929\u20131958 (2014)","journal-title":"J. Mach. Learn. Res."},{"issue":"10","key":"1271_CR40","doi-asserted-by":"publisher","first-page":"6179","DOI":"10.1007\/s00521-018-3432-2","volume":"31","author":"G Qian","year":"2019","unstructured":"Qian, G., Zhang, L., Wang, Y.: Single-label and multi-label conceptor classifiers in pre-trained neural networks. Neural Comput. Appl. 31(10), 6179\u20136188 (2019)","journal-title":"Neural Comput. Appl."},{"key":"1271_CR41","doi-asserted-by":"crossref","unstructured":"Shah, M.A., Raj, B.: Deriving compact feature representations via annealed contraction. In: ICASSP 2020-2020 IEEE International Conference on Acoustics, Speech and Signal Processing (ICASSP), pp. 2068\u20132072. IEEE (2020)","DOI":"10.1109\/ICASSP40776.2020.9054527"},{"key":"1271_CR42","doi-asserted-by":"crossref","unstructured":"Gadosey, P.K., Li, Y., Yamak, P.T.: On pruned, quantized and compact cnn architectures for vision applications: an empirical study. In: Proceedings of the International Conference on Artificial Intelligence, Information Processing and Cloud Computing, pp. 1\u20138 (2019)","DOI":"10.1145\/3371425.3371481"},{"key":"1271_CR43","doi-asserted-by":"crossref","unstructured":"Liu, B., Cai, Y., Guo, Y., Chen, X.: Transtailor: Pruning the pre-trained model for improved transfer learning. arXiv preprint arXiv:2103.01542 (2021)","DOI":"10.1609\/aaai.v35i10.17046"},{"key":"1271_CR44","doi-asserted-by":"crossref","unstructured":"Xie, Z., Wen, Z., Liu, J., Liu, Z., Wu, X., Tan, M.: Deep transferring quantization. In: Computer Vision\u2013ECCV 2020: 16th European Conference, Glasgow, UK, August 23\u201328, 2020, Proceedings, Part VIII 16, pp. 625\u2013642. Springer (2020)","DOI":"10.1007\/978-3-030-58598-3_37"},{"key":"1271_CR45","first-page":"2121","volume":"12","author":"J Duchi","year":"2011","unstructured":"Duchi, J., Hazan, E., Singer, Y.: Adaptive subgradient methods for online learning and stochastic optimization. J. Mach. Learn. Res. 12, 2121\u20132159 (2011)","journal-title":"J. Mach. Learn. Res."},{"key":"1271_CR46","unstructured":"Fei-Fei, L., Fergus, R., Perona, P.: Learning generative visual models from few training examples: An incremental bayesian approach tested on 101 object categories. In: 2004 Conference on Computer Vision and Pattern Recognition Workshop, pp. 178\u2013178. IEEE (2004)"},{"key":"1271_CR47","unstructured":"Griffin, G., Holub, A., Perona, P.: Caltech-256 object category dataset (2007)"},{"key":"1271_CR48","unstructured":"Khosla, A., Jayadevaprakash, N., Yao, B., Li, F.-F.: Novel dataset for fine-grained image categorization: Stanford dogs. In: Proc. CVPR Workshop on Fine-Grained Visual Categorization (FGVC), vol. 2 (2011)"},{"key":"1271_CR49","doi-asserted-by":"crossref","unstructured":"Lang, K.: Newsweeder: Learning to filter netnews. In: Machine Learning Proceedings 1995, pp. 331\u2013339. Elsevier (1995)","DOI":"10.1016\/B978-1-55860-377-6.50048-7"},{"key":"1271_CR50","unstructured":"Maas, A., Daly, R.E., Pham, P.T., Huang, D., Ng, A.Y., Potts, C.: Learning word vectors for sentiment analysis. In: Proceedings of the 49th Annual Meeting of the Association for Computational Linguistics: Human Language Technologies, pp. 142\u2013150 (2011)"},{"key":"1271_CR51","doi-asserted-by":"crossref","unstructured":"Pennington, J., Socher, R., Manning, C.D.: Glove: Global vectors for word representation. In: Proceedings of the 2014 Conference on Empirical Methods in Natural Language Processing (EMNLP), pp. 1532\u20131543 (2014)","DOI":"10.3115\/v1\/D14-1162"},{"key":"1271_CR52","doi-asserted-by":"crossref","unstructured":"Kim, Y.: Convolutional neural networks for sentence classification. arXiv preprint arXiv:1408.5882 (2014)","DOI":"10.3115\/v1\/D14-1181"}],"container-title":["Multimedia Systems"],"original-title":[],"language":"en","link":[{"URL":"https:\/\/link.springer.com\/content\/pdf\/10.1007\/s00530-024-01271-6.pdf","content-type":"application\/pdf","content-version":"vor","intended-application":"text-mining"},{"URL":"https:\/\/link.springer.com\/article\/10.1007\/s00530-024-01271-6\/fulltext.html","content-type":"text\/html","content-version":"vor","intended-application":"text-mining"},{"URL":"https:\/\/link.springer.com\/content\/pdf\/10.1007\/s00530-024-01271-6.pdf","content-type":"application\/pdf","content-version":"vor","intended-application":"similarity-checking"}],"deposited":{"date-parts":[[2024,4,12]],"date-time":"2024-04-12T13:12:42Z","timestamp":1712927562000},"score":1,"resource":{"primary":{"URL":"https:\/\/link.springer.com\/10.1007\/s00530-024-01271-6"}},"subtitle":[],"short-title":[],"issued":{"date-parts":[[2024,3,14]]},"references-count":52,"journal-issue":{"issue":"2","published-print":{"date-parts":[[2024,4]]}},"alternative-id":["1271"],"URL":"https:\/\/doi.org\/10.1007\/s00530-024-01271-6","relation":{},"ISSN":["0942-4962","1432-1882"],"issn-type":[{"type":"print","value":"0942-4962"},{"type":"electronic","value":"1432-1882"}],"subject":[],"published":{"date-parts":[[2024,3,14]]},"assertion":[{"value":"21 March 2023","order":1,"name":"received","label":"Received","group":{"name":"ArticleHistory","label":"Article History"}},{"value":"17 January 2024","order":2,"name":"accepted","label":"Accepted","group":{"name":"ArticleHistory","label":"Article History"}},{"value":"14 March 2024","order":3,"name":"first_online","label":"First Online","group":{"name":"ArticleHistory","label":"Article History"}},{"order":1,"name":"Ethics","group":{"name":"EthicsHeading","label":"Declarations"}},{"value":"We declare the following conflicts of interest, 1. Indian Institute of Information Technology Sri City, Chittoor, India. 2. Lytx India Technologies Private Limited, Bangalore. 3. RV University Bangalore, India. 4. Tata Consultancy Services, Hyderabad, India. 5. New Jersey Institute of Technology, New Jersey, USA. 6. Google Research Bangalore, India. 7. Indian Institute of Information Technology Allahabad, India.","order":2,"name":"Ethics","group":{"name":"EthicsHeading","label":"Conflict of interest"}}],"article-number":"81"}}