{"status":"ok","message-type":"work","message-version":"1.0.0","message":{"indexed":{"date-parts":[[2025,3,27]],"date-time":"2025-03-27T12:48:47Z","timestamp":1743079727941,"version":"3.40.3"},"publisher-location":"Cham","reference-count":27,"publisher":"Springer International Publishing","isbn-type":[{"type":"print","value":"9783031127472"},{"type":"electronic","value":"9783031127489"}],"license":[{"start":{"date-parts":[[2022,1,1]],"date-time":"2022-01-01T00:00:00Z","timestamp":1640995200000},"content-version":"tdm","delay-in-days":0,"URL":"https:\/\/www.springer.com\/tdm"},{"start":{"date-parts":[[2022,1,1]],"date-time":"2022-01-01T00:00:00Z","timestamp":1640995200000},"content-version":"vor","delay-in-days":0,"URL":"https:\/\/www.springer.com\/tdm"}],"content-domain":{"domain":["link.springer.com"],"crossmark-restriction":false},"short-container-title":[],"published-print":{"date-parts":[[2022]]},"DOI":"10.1007\/978-3-031-12748-9_4","type":"book-chapter","created":{"date-parts":[[2022,7,29]],"date-time":"2022-07-29T14:29:33Z","timestamp":1659104973000},"page":"45-56","update-policy":"https:\/\/doi.org\/10.1007\/springer_crossmark_policy","source":"Crossref","is-referenced-by-count":1,"title":["Dynamic Pruning for\u00a0Parsimonious CNN Inference on\u00a0Embedded Systems"],"prefix":"10.1007","author":[{"given":"Paola","family":"Busia","sequence":"first","affiliation":[]},{"given":"Ilias","family":"Theodorakopoulos","sequence":"additional","affiliation":[]},{"given":"Vasileios","family":"Pothos","sequence":"additional","affiliation":[]},{"given":"Nikos","family":"Fragoulis","sequence":"additional","affiliation":[]},{"given":"Paolo","family":"Meloni","sequence":"additional","affiliation":[]}],"member":"297","published-online":{"date-parts":[[2022,7,30]]},"reference":[{"key":"4_CR1","doi-asserted-by":"publisher","first-page":"436","DOI":"10.1038\/nature14539","volume":"521","author":"Y LeCun","year":"2015","unstructured":"LeCun, Y., Bengio, Y., Hinton, G.: Deep learning. Nature 521, 436\u2013444 (2015)","journal-title":"Nature"},{"key":"4_CR2","doi-asserted-by":"crossref","unstructured":"He, K., Zhang, X., Ren, S., Sun, J.: Deep residual learning for image recognition (2015)","DOI":"10.1109\/CVPR.2016.90"},{"key":"4_CR3","doi-asserted-by":"publisher","unstructured":"Jouppi, N.P., et\u00a0al.: In-datacenter performance analysis of a tensor processing unit. In: ISCA 2017: Proceedings of the 44th Annual International Symposium on Computer Architecture, pp. 1\u201312, June 2017. https:\/\/doi.org\/10.1145\/3079856.3080246","DOI":"10.1145\/3079856.3080246"},{"issue":"2","key":"4_CR4","doi-asserted-by":"publisher","first-page":"420","DOI":"10.1109\/TPDS.2017.2752706","volume":"22","author":"E Azarkhish","year":"2018","unstructured":"Azarkhish, E., Rossi, D., Loi, I., Benini, L.: Neurostream: scalable and energy efficient deep learning with smart memory cubes. IEEE Trans. Parallel Distrib. Syst. 22(2), 420\u2013434 (2018)","journal-title":"IEEE Trans. Parallel Distrib. Syst."},{"key":"4_CR5","doi-asserted-by":"crossref","unstructured":"Desoli, G., et\u00a0al.: 14.1 a 2.9TOPS\/W deep convolutional neural network SoC in FD-SOI 28 nm for intelligent embedded systems. In: 2017 IEEE International Solid-State Circuits Conference (ISSCC), pp. 238\u2013239 (2017)","DOI":"10.1109\/ISSCC.2017.7870349"},{"key":"4_CR6","unstructured":"Movidius: Movidius neural compute stick: accelerate deep learning development at the edge (2020). https:\/\/developer.movidius.com\/"},{"key":"4_CR7","doi-asserted-by":"crossref","unstructured":"Chen, Y.-H., Emer, J., Sze, V.: Eyeriss: a spatial architecture for energy-efficient dataflow for convolutional neural networks. In: 2016 ACM\/IEEE 43rd Annual International Symposium on Computer Architecture (ISCA), pp. 367\u2013379 (2016)","DOI":"10.1109\/ISCA.2016.40"},{"key":"4_CR8","unstructured":"NVIDIA: Nvidia deep learning accelerator (2020). https:\/\/developer.nvidia.com\/embedded\/buy\/tegra-k1-processor"},{"key":"4_CR9","doi-asserted-by":"publisher","unstructured":"Blott, M., Preusser, T., Fraser, N., Gambardella, G., O\u2019Brien, K., Umuroglu, Y.: FINN-R: an end-to-end deep-learning framework for fast exploration of quantized neural networks. ACM Trans. Reconfigurable Technol. Syst. (TRETS) (2018). https:\/\/doi.org\/10.1145\/3242897","DOI":"10.1145\/3242897"},{"key":"4_CR10","doi-asserted-by":"publisher","unstructured":"Meloni, P., et al.: NEURAghe: exploiting CPU-FPGA synergies for efficient and flexible CNN inference acceleration on Zynq SoCs. ACM Trans. Reconfigurable Technol. Syst. (TRETS) (2018). https:\/\/doi.org\/10.1145\/3284357","DOI":"10.1145\/3284357"},{"key":"4_CR11","unstructured":"NVIDIA: cuDNN (2020). https:\/\/developer.nvidia.com\/cudnn"},{"key":"4_CR12","unstructured":"Lai, L., Suda, N., Chandra, V.: CMSIS-NN: efficient neural network kernels for Arm Cortex-M CPUs. CoRR, abs\/1801.06601 (2018). http:\/\/arxiv.org\/abs\/1801.06601"},{"key":"4_CR13","unstructured":"ARM-NN (2020). https:\/\/www.arm.com\/products\/silicon-ip-cpu\/machine-learning\/arm-nn"},{"key":"4_CR14","doi-asserted-by":"publisher","unstructured":"Han, S., et al.: EIE: efficient inference engine on compressed deep neural network. In: ISCA 2016: Proceedings of the 43rd International Symposium on Computer Architecture, pp. 243\u2013254, June 2016. https:\/\/doi.org\/10.1109\/ISCA.2016.30","DOI":"10.1109\/ISCA.2016.30"},{"key":"4_CR15","doi-asserted-by":"publisher","unstructured":"Han, S., et\u00a0al.: ESE: efficient speech recognition engine with sparse LSTM on FPGA. In: FPGA 2017: Proceedings of the 2017 ACM\/SIGDA International Symposium on Field-Programmable Gate Arrays, pp. 75\u201384, February 2017. https:\/\/doi.org\/10.1145\/3020078.3021745","DOI":"10.1145\/3020078.3021745"},{"key":"4_CR16","unstructured":"Theodorakopoulos, I., Pothos, V., Kastaniotis, D., Fragoulis, N.: Parsimonious inference on convolutional neural networks: learning and applying on-line kernel activation rules. CoRR, abs\/1701.05221 (2017). https:\/\/arxiv.org\/abs\/1701.05221"},{"key":"4_CR17","unstructured":"Krizhevsky, A.: Learning multiple layers of features from tiny images (2009). https:\/\/www.cs.toronto.edu\/~kriz\/learning-features-2009-TR.pdf"},{"key":"4_CR18","unstructured":"Iandola, F.N., et\u00a0al.: SqueezeNet: AlexNet-Level accuracy with 50x fewer parameters and $$<$$0.5 mb model size. CoRR, abs\/1602.07360 (2016). http:\/\/arxiv.org\/abs\/1602.07360"},{"key":"4_CR19","unstructured":"Zhang, Y., Suda, N., Lai, L., Chandra, V.: Hello edge: keyword spotting on microcontrollers. CoRR, arXiv:1711.07128 (2017)"},{"key":"4_CR20","unstructured":"Han, S., Mao, H., Dally, W.J.: Deep compression: compressing deep neural networks with pruning, trained quantization and Huffman coding. In: International Conference on Learning Representations 2016, October 2015. https:\/\/arxiv.org\/abs\/1510.00149"},{"key":"4_CR21","unstructured":"Gope, D., Dasika, G., Mattina, M.: Ternary hybrid neural-tree networks for highly constrained IoT applications (2019)"},{"key":"4_CR22","doi-asserted-by":"publisher","unstructured":"Hua, W., Zhou, Y., De\u00a0Sa, C., Zhang, Z., Suh, G.E.: Boosting the performance of CNN accelerators with dynamic fine-grained channel gating. In: Proceedings of the 52nd Annual IEEE\/ACM International Symposium on Microarchitecture, ser. MICRO 52, pp. 139\u2013150.\u00a0Association for Computing Machinery, New York (2019). https:\/\/doi.org\/10.1145\/3352460.3358283","DOI":"10.1145\/3352460.3358283"},{"key":"4_CR23","unstructured":"Lin, J., Rao, Y., Lu, J., Zhou, J.: Runtime neural pruning. In: Advances in Neural Information Processing Systems, vol.\u00a030.\u00a0Curran Associates, Inc. (2017). https:\/\/proceedings.neurips.cc\/paper\/2017\/file\/a51fb975227d6640e4fe47854476d133-Paper.pdf"},{"key":"4_CR24","unstructured":"Tschannen, M., Khanna, A., Anandkumar, A.: StrassenNets: deep learning with a multiplication budget. In: Dy, J., Krause, A. (eds.) Proceedings of the 35th International Conference on Machine Learning, ser. Proceedings of Machine Learning Research, vol.\u00a080, pp. 4985\u20134994.\u00a0PMLR, 10\u201315 July 2018. https:\/\/proceedings.mlr.press\/v80\/tschannen18a.html"},{"key":"4_CR25","unstructured":"Kumar, A., Goyal, S., Varma, M.: Resource-efficient machine learning in 2 KB RAM for the internet of things. In: Precup, D., Teh, Y.W. (eds.) Proceedings of the 34th International Conference on Machine Learning, ser. Proceedings of Machine Learning Research, vol.\u00a070, pp. 1935\u20131944.\u00a0PMLR, 06\u201311 August 2017. https:\/\/proceedings.mlr.press\/v70\/kumar17a.html"},{"key":"4_CR26","unstructured":"Warden, P.: Speech commands: a dataset for limited-vocabulary speech recognition. CoRR, arXiv:1804.03209 (2018)"},{"key":"4_CR27","doi-asserted-by":"publisher","unstructured":"Scrugli, M.A., Loi, D., Raffo, L., Meloni, P.: A runtime-adaptive cognitive IoT node for healthcare monitoring. In: Proceedings of the 16th Conference on Computing Frontiers (CF 2019), pp. 350\u2013357, April 2019. https:\/\/doi.org\/10.1145\/3310273.3323160","DOI":"10.1145\/3310273.3323160"}],"container-title":["Lecture Notes in Computer Science","Design and Architecture for Signal and Image Processing"],"original-title":[],"language":"en","link":[{"URL":"https:\/\/link.springer.com\/content\/pdf\/10.1007\/978-3-031-12748-9_4","content-type":"unspecified","content-version":"vor","intended-application":"similarity-checking"}],"deposited":{"date-parts":[[2022,7,29]],"date-time":"2022-07-29T14:31:03Z","timestamp":1659105063000},"score":1,"resource":{"primary":{"URL":"https:\/\/link.springer.com\/10.1007\/978-3-031-12748-9_4"}},"subtitle":[],"short-title":[],"issued":{"date-parts":[[2022]]},"ISBN":["9783031127472","9783031127489"],"references-count":27,"URL":"https:\/\/doi.org\/10.1007\/978-3-031-12748-9_4","relation":{},"ISSN":["0302-9743","1611-3349"],"issn-type":[{"type":"print","value":"0302-9743"},{"type":"electronic","value":"1611-3349"}],"subject":[],"published":{"date-parts":[[2022]]},"assertion":[{"value":"30 July 2022","order":1,"name":"first_online","label":"First Online","group":{"name":"ChapterHistory","label":"Chapter History"}},{"value":"DASIP","order":1,"name":"conference_acronym","label":"Conference Acronym","group":{"name":"ConferenceInfo","label":"Conference Information"}},{"value":"International Workshop on Design and Architecture for Signal and Image Processing","order":2,"name":"conference_name","label":"Conference Name","group":{"name":"ConferenceInfo","label":"Conference Information"}},{"value":"Budapest","order":3,"name":"conference_city","label":"Conference City","group":{"name":"ConferenceInfo","label":"Conference Information"}},{"value":"Hungary","order":4,"name":"conference_country","label":"Conference Country","group":{"name":"ConferenceInfo","label":"Conference Information"}},{"value":"2022","order":5,"name":"conference_year","label":"Conference Year","group":{"name":"ConferenceInfo","label":"Conference Information"}},{"value":"20 June 2022","order":7,"name":"conference_start_date","label":"Conference Start Date","group":{"name":"ConferenceInfo","label":"Conference Information"}},{"value":"22 June 2022","order":8,"name":"conference_end_date","label":"Conference End Date","group":{"name":"ConferenceInfo","label":"Conference Information"}},{"value":"1","order":9,"name":"conference_number","label":"Conference Number","group":{"name":"ConferenceInfo","label":"Conference Information"}},{"value":"dasip2022","order":10,"name":"conference_id","label":"Conference ID","group":{"name":"ConferenceInfo","label":"Conference Information"}},{"value":"https:\/\/dasip2022.agh.edu.pl\/","order":11,"name":"conference_url","label":"Conference URL","group":{"name":"ConferenceInfo","label":"Conference Information"}},{"value":"Single-blind","order":1,"name":"type","label":"Type","group":{"name":"ConfEventPeerReviewInformation","label":"Peer Review Information (provided by the conference organizers)"}},{"value":"EasyChair","order":2,"name":"conference_management_system","label":"Conference Management System","group":{"name":"ConfEventPeerReviewInformation","label":"Peer Review Information (provided by the conference organizers)"}},{"value":"32","order":3,"name":"number_of_submissions_sent_for_review","label":"Number of Submissions Sent for Review","group":{"name":"ConfEventPeerReviewInformation","label":"Peer Review Information (provided by the conference organizers)"}},{"value":"13","order":4,"name":"number_of_full_papers_accepted","label":"Number of Full Papers Accepted","group":{"name":"ConfEventPeerReviewInformation","label":"Peer Review Information (provided by the conference organizers)"}},{"value":"0","order":5,"name":"number_of_short_papers_accepted","label":"Number of Short Papers Accepted","group":{"name":"ConfEventPeerReviewInformation","label":"Peer Review Information (provided by the conference organizers)"}},{"value":"41% - The value is computed by the equation \"Number of Full Papers Accepted \/ Number of Submissions Sent for Review * 100\" and then rounded to a whole number.","order":6,"name":"acceptance_rate_of_full_papers","label":"Acceptance Rate of Full Papers","group":{"name":"ConfEventPeerReviewInformation","label":"Peer Review Information (provided by the conference organizers)"}},{"value":"3,4","order":7,"name":"average_number_of_reviews_per_paper","label":"Average Number of Reviews per Paper","group":{"name":"ConfEventPeerReviewInformation","label":"Peer Review Information (provided by the conference organizers)"}},{"value":"2","order":8,"name":"average_number_of_papers_per_reviewer","label":"Average Number of Papers per Reviewer","group":{"name":"ConfEventPeerReviewInformation","label":"Peer Review Information (provided by the conference organizers)"}},{"value":"Yes","order":9,"name":"external_reviewers_involved","label":"External Reviewers Involved","group":{"name":"ConfEventPeerReviewInformation","label":"Peer Review Information (provided by the conference organizers)"}}]}}