{"status":"ok","message-type":"work","message-version":"1.0.0","message":{"indexed":{"date-parts":[[2024,1,7]],"date-time":"2024-01-07T00:15:21Z","timestamp":1704586521001},"reference-count":24,"publisher":"Institute of Electronics, Information and Communications Engineers (IEICE)","issue":"1","content-domain":{"domain":[],"crossmark-restriction":false},"short-container-title":["IEICE Trans. Inf. &amp; Syst."],"published-print":{"date-parts":[[2024,1,1]]},"DOI":"10.1587\/transinf.2023edp7107","type":"journal-article","created":{"date-parts":[[2023,12,31]],"date-time":"2023-12-31T22:39:18Z","timestamp":1704062358000},"page":"83-92","source":"Crossref","is-referenced-by-count":0,"title":["Research on Lightweight Acoustic Scene Perception Method Based on Drunkard Methodology"],"prefix":"10.1587","volume":"E107.D","author":[{"given":"Wenkai","family":"LIU","sequence":"first","affiliation":[{"name":"North China University of Technology"}],"role":[{"role":"author","vocabulary":"crossref"}]},{"given":"Lin","family":"ZHANG","sequence":"additional","affiliation":[{"name":"North China University of Technology"}],"role":[{"role":"author","vocabulary":"crossref"}]},{"given":"Menglong","family":"WU","sequence":"additional","affiliation":[{"name":"North China University of Technology"}],"role":[{"role":"author","vocabulary":"crossref"}]},{"given":"Xichang","family":"CAI","sequence":"additional","affiliation":[{"name":"North China University of Technology"}],"role":[{"role":"author","vocabulary":"crossref"}]},{"given":"Hongxia","family":"DONG","sequence":"additional","affiliation":[{"name":"North China University of Technology"}],"role":[{"role":"author","vocabulary":"crossref"}]}],"member":"532","reference":[{"key":"1","unstructured":"[1] I. Mart\u00edn-Morat\u00f3, F. Paissan, A. Ancilotto, et al., \u201cLow-complexity acoustic scene classification in dcase 2022 challenge,\u201d arXiv preprint arXiv:2206.03835, 2022."},{"key":"2","doi-asserted-by":"publisher","unstructured":"[2] W. Xie, Q. He, Z. Yu, and Y. Li, \u201cDeep mutual attention network for acoustic scene classification,\u201d Digital Signal Processing, vol.123, p.103450, 2022. 10.1016\/j.dsp.2022.103450","DOI":"10.1016\/j.dsp.2022.103450"},{"key":"3","doi-asserted-by":"publisher","unstructured":"[3] T. Choudhary, V. Mishra, A. Goswami, and J. Sarangapani, \u201cA comprehensive survey on model compression and acceleration,\u201d Artificial Intelligence Review, vol.53, no.7, pp.5113-5155, 2020. 10.1007\/s10462-020-09816-7","DOI":"10.1007\/s10462-020-09816-7"},{"key":"4","doi-asserted-by":"publisher","unstructured":"[4] M. Agarwal, S.K. Gupta, M. Biswas, and D. Garg, \u201cCompression and acceleration of convolution neural network: a genetic algorithm based approach,\u201d Journal of Ambient Intelligence and Humanized Computing, vol.14, no.10, pp.13387-13397, 2022. 10.1007\/s12652-022-03793-1","DOI":"10.1007\/s12652-022-03793-1"},{"key":"5","unstructured":"[5] B. Kim, S. Yang, J. Kim, et al., \u201cQTI submission to DCASE 2021: Residual normalization for device-imbalanced acoustic scene classification with efficient design,\u201d arXiv preprint arXiv:2206.13909, 2022."},{"key":"6","unstructured":"[6] J.H. Lee, J.H. Choi, P.M. Byun, et al., \u201cHYU submission for the DCASE 2022: fine-tuning method using device-aware data-random-drop for device-imbalanced acoustic scene classification,\u201d 2022."},{"key":"7","doi-asserted-by":"publisher","unstructured":"[7] S.-H. Gao, M.-M. Cheng, K. Zhao, X.-Y. Zhang, M.-H. Yang, and P. Torr, \u201cRes2net: A new multi-scale backbone architecture,\u201d IEEE transactions on pattern analysis and machine intelligence, vol.43, no.2, pp.652-662, 2021. 10.1109\/tpami.2019.2938758","DOI":"10.1109\/TPAMI.2019.2938758"},{"key":"8","doi-asserted-by":"crossref","unstructured":"[8] A. Howard, M. Sandler, B. Chen, W. Wang, L.-C. Chen, M. Tan, G. Chu, V. Vasudevan, Y. Zhu, R. Pang, H. Adam, and Q. Le, \u201cSearching for mobilenetv3,\u201d Proceedings of the IEEE\/CVF international conference on computer vision. 1314-1324, 2019. 10.1109\/iccv.2019.00140","DOI":"10.1109\/ICCV.2019.00140"},{"key":"9","doi-asserted-by":"crossref","unstructured":"[9] N. Ma, X. Zhang, H.-T. Zheng, and J. Sun, \u201cShufflenet v2: Practical guidelines for efficient CNN architecture design,\u201d Proceedings of the European conference on computer vision (ECCV), pp.122-138, 2018. 10.1007\/978-3-030-01264-9_8","DOI":"10.1007\/978-3-030-01264-9_8"},{"key":"10","doi-asserted-by":"publisher","unstructured":"[10] Y. Qu, X. Li, Z. Qin, and Q. Lu, \u201cAcoustic scene classification based on three-dimensional multi-channel feature-correlated deep learning networks,\u201d Scientific Reports, vol.12, no.1, 2022. 10.1038\/s41598-022-17863-z","DOI":"10.1038\/s41598-022-17863-z"},{"key":"11","doi-asserted-by":"publisher","unstructured":"[11] Y. Ding, Z. Zhang, X. Zhao, D. Hong, W. Cai, C. Yu, N. Yang, and W. Cai, \u201cMulti-feature fusion: Graph neural network and CNN combining for hyperspectral image classification,\u201d Neurocomputing, vol.501, pp.246-257, 2022. 10.1016\/j.neucom.2022.06.031","DOI":"10.1016\/j.neucom.2022.06.031"},{"key":"12","doi-asserted-by":"publisher","unstructured":"[12] W. Zou, D. Zhang, and D.-J. Lee, \u201cA new multi-feature fusion based convolutional neural network for facial expression recognition,\u201d Applied Intelligence, vol.52, no.3, pp.2918-2929, 2022. 10.1007\/s10489-021-02575-0","DOI":"10.1007\/s10489-021-02575-0"},{"key":"13","doi-asserted-by":"crossref","unstructured":"[13] J. Hu, L. Shen, and G. Sun, \u201cSqueeze-and-excitation networks,\u201d Proceedings of the IEEE conference on computer vision and pattern recognition, pp.7132-7141, 2018. 10.1109\/cvpr.2018.00745","DOI":"10.1109\/CVPR.2018.00745"},{"key":"14","unstructured":"[14] G. Hinton, O. Vinyals and J. Dean, \u201cDistilling the knowledge in a neural network,\u201d arXiv preprint arXiv:1503.02531, 2015."},{"key":"15","doi-asserted-by":"crossref","unstructured":"[15] R. He, S. Sun, J. Yang, S. Bai, and X. Qi, \u201cKnowledge distillation as efficient pre-training: Faster convergence, higher data-efficiency, and better transferability,\u201d Proceedings of the IEEE\/CVF Conference on Computer Vision and Pattern Recognition, pp.9161-9171, 2022. 10.1109\/cvpr52688.2022.00895","DOI":"10.1109\/CVPR52688.2022.00895"},{"key":"16","doi-asserted-by":"crossref","unstructured":"[16] G. Chen, J. Chen, F. Feng, S. Zhou, and X. He, \u201cUnbiased Knowledge Distillation for Recommendation,\u201d Proceedings of the Sixteenth ACM International Conference on Web Search and Data Mining, 2023. 10.1145\/3539597.3570477","DOI":"10.1145\/3539597.3570477"},{"key":"17","doi-asserted-by":"crossref","unstructured":"[17] K. Han, Y. Wang, Q. Tian, J. Guo, C. Xu, and C. Xu, \u201cGhostnet: More features from cheap operations,\u201d Proceedings of the IEEE\/CVF conference on computer vision and pattern recognition, pp.1580-1589, 2020. 10.1109\/cvpr42600.2020.00165","DOI":"10.1109\/CVPR42600.2020.00165"},{"key":"18","doi-asserted-by":"crossref","unstructured":"[18] K. He, X. Zhang, S. Ren, and J. Sun, \u201cDeep residual learning for image recognition,\u201d Proceedings of the IEEE conference on computer vision and pattern recognition, pp.770-778, 2016. 10.1109\/cvpr.2016.90","DOI":"10.1109\/CVPR.2016.90"},{"key":"19","unstructured":"[19] A. Mesaros, T. Heittola, and T. Virtanen, \u201cA multi-device dataset for urban acoustic scene classification,\u201d arXiv preprint arXiv:1807.09840, 2018."},{"key":"20","doi-asserted-by":"crossref","unstructured":"[20] Y. Li, W. Cao, W. Xie, Q. Huang, W. Pang, and Q. He, \u201cLow-Complexity Acoustic Scene Classification Using Data Augmentation and Lightweight ResNet,\u201d 2022 16th IEEE International Conference on Signal Processing (ICSP). IEEE, pp.41-45, 2022. 10.1109\/icsp56322.2022.9965347","DOI":"10.1109\/ICSP56322.2022.9965347"},{"key":"21","unstructured":"[21] H. Zhang, M. Cisse, Y.N. Dauphin, et al., \u201cMixup: Beyond empirical risk minimization,\u201d arXiv preprint arXiv:1710.09412, 2017."},{"key":"22","doi-asserted-by":"crossref","unstructured":"[22] D.S. Park, W. Chan, Y. Zhang, C.-C. Chiu, B. Zoph, E.D. Cubuk, and Q.V. Le, \u201cSpecaugment: A simple data augmentation method for automatic speech recognition,\u201d arXiv preprint arXiv:1904.08779, 2019.","DOI":"10.21437\/Interspeech.2019-2680"},{"key":"23","doi-asserted-by":"crossref","unstructured":"[23] Q. Hou, D. Zhou, and J. Feng, \u201cCoordinate attention for efficient mobile network design,\u201d Proceedings of the IEEE\/CVF conference on computer vision and pattern recognition, pp.13713-13722, 2021. 10.1109\/cvpr46437.2021.01350","DOI":"10.1109\/CVPR46437.2021.01350"},{"key":"24","doi-asserted-by":"crossref","unstructured":"[24] M. Sandler, A. Howard, M. Zhu, A. Zhmoginov, and L.-C. Chen, \u201cMobileNetV2: Inverted Residuals and Linear Bottlenecks,\u201d 2018 IEEE\/CVF Conference on Computer Vision and Pattern Recognition, 2018. 10.1109\/cvpr.2018.00474","DOI":"10.1109\/CVPR.2018.00474"}],"container-title":["IEICE Transactions on Information and Systems"],"original-title":[],"language":"en","link":[{"URL":"https:\/\/www.jstage.jst.go.jp\/article\/transinf\/E107.D\/1\/E107.D_2023EDP7107\/_pdf","content-type":"unspecified","content-version":"vor","intended-application":"similarity-checking"}],"deposited":{"date-parts":[[2024,1,6]],"date-time":"2024-01-06T04:14:48Z","timestamp":1704514488000},"score":1,"resource":{"primary":{"URL":"https:\/\/www.jstage.jst.go.jp\/article\/transinf\/E107.D\/1\/E107.D_2023EDP7107\/_article"}},"subtitle":[],"short-title":[],"issued":{"date-parts":[[2024,1,1]]},"references-count":24,"journal-issue":{"issue":"1","published-print":{"date-parts":[[2024]]}},"URL":"https:\/\/doi.org\/10.1587\/transinf.2023edp7107","relation":{},"ISSN":["0916-8532","1745-1361"],"issn-type":[{"value":"0916-8532","type":"print"},{"value":"1745-1361","type":"electronic"}],"subject":[],"published":{"date-parts":[[2024,1,1]]},"article-number":"2023EDP7107"}}