{"status":"ok","message-type":"work","message-version":"1.0.0","message":{"indexed":{"date-parts":[[2026,2,24]],"date-time":"2026-02-24T18:12:27Z","timestamp":1771956747640,"version":"3.50.1"},"reference-count":25,"publisher":"Springer Science and Business Media LLC","issue":"6","license":[{"start":{"date-parts":[[2022,1,17]],"date-time":"2022-01-17T00:00:00Z","timestamp":1642377600000},"content-version":"tdm","delay-in-days":0,"URL":"https:\/\/www.springer.com\/tdm"},{"start":{"date-parts":[[2022,1,17]],"date-time":"2022-01-17T00:00:00Z","timestamp":1642377600000},"content-version":"vor","delay-in-days":0,"URL":"https:\/\/www.springer.com\/tdm"}],"funder":[{"DOI":"10.13039\/501100004663","name":"Ministry of Science and Technology, Taiwan","doi-asserted-by":"publisher","award":["MOST 109-2221-E-011-142"],"award-info":[{"award-number":["MOST 109-2221-E-011-142"]}],"id":[{"id":"10.13039\/501100004663","id-type":"DOI","asserted-by":"publisher"}]},{"DOI":"10.13039\/501100004663","name":"Ministry of Science and Technology, Taiwan","doi-asserted-by":"publisher","award":["110-2221-E-011-155"],"award-info":[{"award-number":["110-2221-E-011-155"]}],"id":[{"id":"10.13039\/501100004663","id-type":"DOI","asserted-by":"publisher"}]}],"content-domain":{"domain":["link.springer.com"],"crossmark-restriction":false},"short-container-title":["Circuits Syst Signal Process"],"published-print":{"date-parts":[[2022,6]]},"DOI":"10.1007\/s00034-022-01952-5","type":"journal-article","created":{"date-parts":[[2022,1,17]],"date-time":"2022-01-17T19:02:36Z","timestamp":1642446156000},"page":"3547-3569","update-policy":"https:\/\/doi.org\/10.1007\/springer_crossmark_policy","source":"Crossref","is-referenced-by-count":6,"title":["The Data Flow and Architectural Optimizations for a Highly Efficient CNN Accelerator Based on the Depthwise Separable Convolution"],"prefix":"10.1007","volume":"41","author":[{"given":"Hung-Ju","family":"Lin","sequence":"first","affiliation":[],"role":[{"role":"author","vocabulary":"crossref"}]},{"ORCID":"https:\/\/orcid.org\/0000-0002-0628-5129","authenticated-orcid":false,"given":"Chung-An","family":"Shen","sequence":"additional","affiliation":[],"role":[{"role":"author","vocabulary":"crossref"}]}],"member":"297","published-online":{"date-parts":[[2022,1,17]]},"reference":[{"issue":"4","key":"1952_CR1","doi-asserted-by":"publisher","first-page":"1349","DOI":"10.1109\/TCSI.2017.2757036","volume":"65","author":"A Ardakani","year":"2018","unstructured":"A. Ardakani, C. Condo, M. Ahmadi, W.J. Gross, An architecture to accelerate convolution in deep neural networks. IEEE Trans. Circuits Syst. I Regul. Pap. 65(4), 1349\u20131362 (2018)","journal-title":"IEEE Trans. Circuits Syst. I Regul. Pap."},{"issue":"10","key":"1952_CR2","doi-asserted-by":"publisher","first-page":"1415","DOI":"10.1109\/TCSII.2018.2865896","volume":"65","author":"L Bai","year":"2018","unstructured":"L. Bai, Y. Zhao, X. Huang, A CNN accelerator on FPGA using depthwise separable convolution. IEEE Trans. Circuits Syst. II Express Briefs 65(10), 1415\u20131419 (2018)","journal-title":"IEEE Trans. Circuits Syst. II Express Briefs"},{"issue":"2","key":"1952_CR3","doi-asserted-by":"publisher","first-page":"55","DOI":"10.1109\/MCE.2017.2775245","volume":"7","author":"S Bazrafkan","year":"2018","unstructured":"S. Bazrafkan, P.M. Corcoran, Pushing the AI envelope: merging deep networks to accelerate edge artificial intelligence in consumer electronics devices and systems. IEEE Consum. Electron. Mag. 7(2), 55\u201361 (2018)","journal-title":"IEEE Consum. Electron. Mag."},{"key":"1952_CR4","doi-asserted-by":"crossref","unstructured":"W. Chen, Z. Wang, S. Li, Z. Yu, H. Li, Accelerating compact convolutional neural networks with multi-threaded data streaming. in 2019 IEEE Computer Society Annual Symposium on VLSI (ISVLSI), pp. 519\u2013522 (2019)","DOI":"10.1109\/ISVLSI.2019.00099"},{"issue":"3","key":"1952_CR5","doi-asserted-by":"publisher","first-page":"12","DOI":"10.1109\/MM.2017.54","volume":"37","author":"Y Chen","year":"2017","unstructured":"Y. Chen, J. Emer, V. Sze, Using dataflow to optimize energy efficiency of deep neural network accelerators. IEEE Micro 37(3), 12\u201321 (2017)","journal-title":"IEEE Micro"},{"issue":"1","key":"1952_CR6","doi-asserted-by":"publisher","first-page":"127","DOI":"10.1109\/JSSC.2016.2616357","volume":"52","author":"Y Chen","year":"2017","unstructured":"Y. Chen, T. Krishna, J.S. Emer, V. Sze, Eyeriss: an energy-efficient reconfigurable accelerator for deep convolutional neural networks. IEEE J. Solid-State Circuits 52(1), 127\u2013138 (2017)","journal-title":"IEEE J. Solid-State Circuits"},{"issue":"2","key":"1952_CR7","doi-asserted-by":"publisher","first-page":"292","DOI":"10.1109\/JETCAS.2019.2910232","volume":"9","author":"Y Chen","year":"2019","unstructured":"Y. Chen, T. Yang, J. Emer, V. Sze, Eyeriss v2: a flexible accelerator for emerging deep neural networks on mobile devices. IEEE J. Emerg. Sel. Top. Circuits Syst. 9(2), 292\u2013308 (2019)","journal-title":"IEEE J. Emerg. Sel. Top. Circuits Syst."},{"key":"1952_CR8","doi-asserted-by":"crossref","unstructured":"G. Desoli et al., 14.1 A 2.9TOPS\/W deep convolutional neural network SoC in FD-SOI 28nm for intelligent embedded systems, in IEEE International Solid-State Circuits Conference (ISSCC), pp. 238\u2013239 (2017)","DOI":"10.1109\/ISSCC.2017.7870349"},{"key":"1952_CR9","doi-asserted-by":"crossref","unstructured":"Z. Du\u00a0et al., ShiDianNao: Shifting vision processing closer to the sensor, in 2015 ACM\/IEEE Annual International Symposium on Computer Architecture, pp. 92\u2013104 (2015)","DOI":"10.1145\/2872887.2750389"},{"issue":"3","key":"1952_CR10","doi-asserted-by":"publisher","first-page":"81","DOI":"10.1109\/MCE.2019.2892286","volume":"8","author":"L Jian","year":"2019","unstructured":"L. Jian, Z. Li, X. Yang, W. Wu, A. Ahmad, G. Jeon, Combining unmanned aerial vehicles with artificial-intelligence technology for traffic-congestion recognition: electronic eyes in the skies to spot clogged roads. IEEE Consumer Electron. Mag. 8(3), 81\u201386 (2019)","journal-title":"IEEE Consumer Electron. Mag."},{"issue":"6","key":"1952_CR11","doi-asserted-by":"publisher","first-page":"84","DOI":"10.1145\/3065386","volume":"60","author":"A Krizhevsky","year":"2017","unstructured":"A. Krizhevsky, S. Ilya, E.H. Geoffrey, Imagenet classification with deep convolutional neural networks. Commun. ACM 60(6), 84\u201390 (2017)","journal-title":"Commun. ACM"},{"issue":"4","key":"1952_CR12","first-page":"985","volume":"20","author":"J Li","year":"2017","unstructured":"J. Li, X. Liang, S. Shen, T. Xu, J. Feng, S. Yan, Scale-aware fast R-CNN for pedestrian detection. IEEE Trans. Multimedia 20(4), 985\u2013996 (2017)","journal-title":"IEEE Trans. Multimedia"},{"key":"1952_CR13","doi-asserted-by":"crossref","unstructured":"K.T. Malladi, F.A. Nothaft, K. Periyathambi, B.C. Lee, C. Kozyrakis and M. Horowitz, Towards energy-proportional datacenter memory with mobile DRAM, in 2012 39th Annual International Symposium on Computer Architecture (ISCA), pp. 37\u201348 (2012)","DOI":"10.1109\/ISCA.2012.6237004"},{"key":"1952_CR14","doi-asserted-by":"crossref","unstructured":"B. Moons, R. Uytterhoeven, W. Dehaene, M. Verhelst, 14.5 Envision: A 0.26-to-10TOPS\/W subword-parallel dynamic-voltage-accuracy-frequency-scalable Convolutional Neural Network processor in 28nm FDSOI, in 2017 IEEE International Solid-State Circuits Conference (ISSCC), pp. 246\u2013247 (2017)","DOI":"10.1109\/ISSCC.2017.7870353"},{"issue":"8","key":"1952_CR15","doi-asserted-by":"publisher","first-page":"3406","DOI":"10.1007\/s00034-019-01157-3","volume":"38","author":"T Ogunfunmi","year":"2019","unstructured":"T. Ogunfunmi, R.P. Ramachandran, R. Togneri, Y. Zhao, X. Xia, A primer on deep learning architectures and applications in speech processing. Circuits Syst. Signal Process 38(8), 3406\u20133432 (2019)","journal-title":"Circuits Syst. Signal Process"},{"key":"1952_CR16","doi-asserted-by":"publisher","first-page":"77661","DOI":"10.1109\/ACCESS.2021.3079337","volume":"9","author":"B Qiang","year":"2021","unstructured":"B. Qiang et al., SqueezeNet and fusion network-based accurate fast fully convolutional network for hand detection and gesture recognition. IEEE Access 9, 77661\u201377674 (2021)","journal-title":"IEEE Access"},{"key":"1952_CR17","doi-asserted-by":"crossref","unstructured":"D. Sinha, M. El-Sharkawy, Thin MobileNet: an enhanced MobileNet architecture, in IEEE Annual Ubiquitous Computing, Electronics & Mobile Communication Conference (UEMCON), pp. 0280\u20130285 (2019)","DOI":"10.1109\/UEMCON47517.2019.8993089"},{"key":"1952_CR18","unstructured":"L. Sifre, Rigid-motion scattering for image classification. PhD Thesis in Ecole Polytechnique, CMAP (2014)"},{"key":"1952_CR19","doi-asserted-by":"crossref","unstructured":"J. Su et al., Redundancy-reduced mobilenet acceleration on reconfigurable logic for ImageNet classification, in Applied Reconfigurable Computing. Architectures, Tools, and Applications, pp. 16\u201328 (2018)","DOI":"10.1007\/978-3-319-78890-6_2"},{"issue":"12","key":"1952_CR20","doi-asserted-by":"publisher","first-page":"2295","DOI":"10.1109\/JPROC.2017.2761740","volume":"105","author":"V Sze","year":"2017","unstructured":"V. Sze, Y. Chen, T. Yang, J.S. Emer, Efficient processing of deep neural networks: a tutorial and survey. Proc. IEEE 105(12), 2295\u20132329 (2017)","journal-title":"Proc. IEEE"},{"key":"1952_CR21","doi-asserted-by":"crossref","unstructured":"C. Szegedy\u00a0et al., Going deeper with convolutions, in IEEE Conference on Computer Vision and Pattern Recognition (CVPR), pp. 1\u20139 (2015)","DOI":"10.1109\/CVPR.2015.7298594"},{"issue":"8","key":"1952_CR22","doi-asserted-by":"publisher","first-page":"3521","DOI":"10.1007\/s00034-019-01141-x","volume":"38","author":"X Wang","year":"2019","unstructured":"X. Wang, M. Tang, S. Yang, H. Yin, H. Huang, L. He, Automatic hypernasality detection in cleft palate speech using CNN. Circuits Syst. Signal Process. 38(8), 3521\u20133547 (2019)","journal-title":"Circuits Syst. Signal Process."},{"issue":"7","key":"1952_CR23","doi-asserted-by":"publisher","first-page":"2022","DOI":"10.1109\/TITS.2015.2482461","volume":"17","author":"Y Yang","year":"2016","unstructured":"Y. Yang, H. Luo, H. Xu, F. Wu, Towards real-time traffic sign detection and classification. IEEE Trans. Intell. Transp. Syst. 17(7), 2022\u20132031 (2016)","journal-title":"IEEE Trans. Intell. Transp. Syst."},{"key":"1952_CR24","doi-asserted-by":"crossref","unstructured":"X. Zhang, X. Zhou, M. Lin, J. Sun, ShuffleNet: an extremely efficient convolutional neural network for mobile devices, in 2018 IEEE\/CVF Conference on Computer Vision and Pattern Recognition, pp. 6848\u20136856 (2018)","DOI":"10.1109\/CVPR.2018.00716"},{"key":"1952_CR25","doi-asserted-by":"crossref","unstructured":"R. Zhao, X. Niu, W. Luk, Automatic optimising CNN with depthwise separable convolution on FPGA: (Abstact only), in Proceedings of the 2018 ACM\/SIGDA International Symposium on Field-Programmable Gate Array, p. 285 (2018)","DOI":"10.1145\/3174243.3174959"}],"container-title":["Circuits, Systems, and Signal Processing"],"original-title":[],"language":"en","link":[{"URL":"https:\/\/link.springer.com\/content\/pdf\/10.1007\/s00034-022-01952-5.pdf","content-type":"application\/pdf","content-version":"vor","intended-application":"text-mining"},{"URL":"https:\/\/link.springer.com\/article\/10.1007\/s00034-022-01952-5\/fulltext.html","content-type":"text\/html","content-version":"vor","intended-application":"text-mining"},{"URL":"https:\/\/link.springer.com\/content\/pdf\/10.1007\/s00034-022-01952-5.pdf","content-type":"application\/pdf","content-version":"vor","intended-application":"similarity-checking"}],"deposited":{"date-parts":[[2022,4,25]],"date-time":"2022-04-25T18:18:17Z","timestamp":1650910697000},"score":1,"resource":{"primary":{"URL":"https:\/\/link.springer.com\/10.1007\/s00034-022-01952-5"}},"subtitle":[],"short-title":[],"issued":{"date-parts":[[2022,1,17]]},"references-count":25,"journal-issue":{"issue":"6","published-print":{"date-parts":[[2022,6]]}},"alternative-id":["1952"],"URL":"https:\/\/doi.org\/10.1007\/s00034-022-01952-5","relation":{},"ISSN":["0278-081X","1531-5878"],"issn-type":[{"value":"0278-081X","type":"print"},{"value":"1531-5878","type":"electronic"}],"subject":[],"published":{"date-parts":[[2022,1,17]]},"assertion":[{"value":"20 February 2021","order":1,"name":"received","label":"Received","group":{"name":"ArticleHistory","label":"Article History"}},{"value":"19 December 2021","order":2,"name":"revised","label":"Revised","group":{"name":"ArticleHistory","label":"Article History"}},{"value":"23 December 2021","order":3,"name":"accepted","label":"Accepted","group":{"name":"ArticleHistory","label":"Article History"}},{"value":"17 January 2022","order":4,"name":"first_online","label":"First Online","group":{"name":"ArticleHistory","label":"Article History"}}]}}