{"status":"ok","message-type":"work","message-version":"1.0.0","message":{"indexed":{"date-parts":[[2026,5,6]],"date-time":"2026-05-06T15:48:48Z","timestamp":1778082528270,"version":"3.51.4"},"reference-count":34,"publisher":"Springer Science and Business Media LLC","issue":"5","license":[{"start":{"date-parts":[[2023,1,21]],"date-time":"2023-01-21T00:00:00Z","timestamp":1674259200000},"content-version":"tdm","delay-in-days":0,"URL":"https:\/\/www.springernature.com\/gp\/researchers\/text-and-data-mining"},{"start":{"date-parts":[[2023,1,21]],"date-time":"2023-01-21T00:00:00Z","timestamp":1674259200000},"content-version":"vor","delay-in-days":0,"URL":"https:\/\/www.springernature.com\/gp\/researchers\/text-and-data-mining"}],"funder":[{"DOI":"10.13039\/501100001809","name":"National Natural Science Foundation of China","doi-asserted-by":"crossref","award":["51821093"],"award-info":[{"award-number":["51821093"]}],"id":[{"id":"10.13039\/501100001809","id-type":"DOI","asserted-by":"crossref"}]},{"name":"High-level Talent Special Support Plan of Zhejiang Province","award":["2020R52004"],"award-info":[{"award-number":["2020R52004"]}]}],"content-domain":{"domain":["link.springer.com"],"crossmark-restriction":false},"short-container-title":["SIViP"],"published-print":{"date-parts":[[2023,7]]},"DOI":"10.1007\/s11760-022-02469-9","type":"journal-article","created":{"date-parts":[[2023,1,21]],"date-time":"2023-01-21T10:02:18Z","timestamp":1674295338000},"page":"2521-2529","update-policy":"https:\/\/doi.org\/10.1007\/springer_crossmark_policy","source":"Crossref","is-referenced-by-count":7,"title":["MVHANet: multi-view hierarchical aggregation network for skeleton-based hand gesture recognition"],"prefix":"10.1007","volume":"17","author":[{"given":"Shaochen","family":"Li","sequence":"first","affiliation":[],"role":[{"role":"author","vocabulary":"crossref"}]},{"given":"Zhenyu","family":"Liu","sequence":"additional","affiliation":[],"role":[{"role":"author","vocabulary":"crossref"}]},{"given":"Guifang","family":"Duan","sequence":"additional","affiliation":[],"role":[{"role":"author","vocabulary":"crossref"}]},{"given":"Jianrong","family":"Tan","sequence":"additional","affiliation":[],"role":[{"role":"author","vocabulary":"crossref"}]}],"member":"297","published-online":{"date-parts":[[2023,1,21]]},"reference":[{"key":"2469_CR1","doi-asserted-by":"publisher","DOI":"10.1016\/j.rcim.2020.102085","volume":"68","author":"C Nuzzi","year":"2021","unstructured":"Nuzzi, C., Pasinetti, S., Pagani, R., Ghidini, S., Beschi, M., Coffetti, G., Sansoni, G.: MEGURU: a gesture-based robot program builder for Meta-Collaborative workstations. Robot. Comput.-Integr. Manuf. 68, 102085 (2021)","journal-title":"Robot. Comput.-Integr. Manuf."},{"key":"2469_CR2","doi-asserted-by":"publisher","first-page":"2055","DOI":"10.1007\/s11760-022-02167-6","volume":"16","author":"A Boukdir","year":"2022","unstructured":"Boukdir, A., Benaddy, M., Ellahyani, A., Meslouhi, O.E., Kardouchi, M.: 3D gesture segmentation for word-level Arabic sign language using large-scale RGB video sequences and autoencoder convolutional networks. SIViP 16, 2055\u20132062 (2022)","journal-title":"SIViP"},{"key":"2469_CR3","doi-asserted-by":"publisher","first-page":"31059","DOI":"10.1007\/s11042-020-09731-7","volume":"80","author":"P Wang","year":"2021","unstructured":"Wang, P., Bai, X., Billinghurst, M., Zhang, S., Wei, S., Xu, G., He, W., Zhang, X., Zhang, J.: 3DGAM: using 3D gesture and CAD models for training on mixed reality remote collaboration. Multimed. Tools Appl 80, 31059\u201331084 (2021)","journal-title":"Multimed. Tools Appl"},{"key":"2469_CR4","doi-asserted-by":"crossref","unstructured":"Zhang, P., Lan, C., Xing, J., Zeng, W., Xue, J., Zheng, N.: View adaptive recurrent neural networks for high performance human action recognition from skeleton data. In: 2017 IEEE International Conference on Computer Vision (ICCV), pp. 2136\u20132145 (2017)","DOI":"10.1109\/ICCV.2017.233"},{"key":"2469_CR5","doi-asserted-by":"crossref","unstructured":"Molchanov, P., Gupta, S., Kim, K., Kautz, J.: Hand gesture recognition with 3D convolutional neural networks. In: 2015 IEEE Conference on Computer Vision and Pattern Recognition Workshops (CVPRW), pp. 1\u20137 (2015)","DOI":"10.1109\/CVPRW.2015.7301342"},{"key":"2469_CR6","doi-asserted-by":"crossref","unstructured":"De Smedt, Q., Wannous, H., Vandeborre, J.-P.: Skeleton-based dynamic hand gesture recognition. In: 2016 IEEE Conference on Computer Vision and Pattern Recognition Workshops (CVPRW), pp. 1206\u20131214 (2016)","DOI":"10.1109\/CVPRW.2016.153"},{"key":"2469_CR7","unstructured":"Smedt, Q.D., Wannous, H., Vandeborre, J.-P., Guerry, J., Saux, B.L., Filliat, D.: SHREC'17 track: 3D hand gesture recognition using a depth and skeletal dataset. In: 3DOR-10th Eurographics Workshop on 3D Object Retrieval, pp. 1\u20136 (2017)"},{"key":"2469_CR8","doi-asserted-by":"publisher","first-page":"130","DOI":"10.1016\/j.patcog.2015.11.019","volume":"53","author":"L Lo Presti","year":"2016","unstructured":"Lo Presti, L., La Cascia, M.: 3D skeleton-based human action classification: a survey. Pattern Recogn. 53, 130\u2013147 (2016)","journal-title":"Pattern Recogn."},{"key":"2469_CR9","doi-asserted-by":"publisher","first-page":"18258","DOI":"10.1109\/ACCESS.2020.2968361","volume":"8","author":"F Guo","year":"2020","unstructured":"Guo, F., He, Z., Zhang, S., Zhao, X., Tan, J.: Attention-based pose sequence machine for 3D hand pose estimation. IEEE Access 8, 18258\u201318269 (2020)","journal-title":"IEEE Access"},{"key":"2469_CR10","doi-asserted-by":"publisher","first-page":"234","DOI":"10.1109\/TMM.2018.2856094","volume":"21","author":"D Avola","year":"2019","unstructured":"Avola, D., Bernardi, M., Cinque, L., Foresti, G.L., Massaroni, C.: Exploiting recurrent neural networks and leap motion controller for the recognition of sign language and semaphoric hand gestures. IEEE Trans. Multimed. 21, 234\u2013245 (2019)","journal-title":"IEEE Trans. Multimed."},{"key":"2469_CR11","doi-asserted-by":"publisher","first-page":"239","DOI":"10.3390\/s19020239","volume":"19","author":"X Chen","year":"2019","unstructured":"Chen, X., Wang, G., Guo, H., Zhang, C., Wang, H., Zhang, L.: MFA-Net: motion feature augmented network for dynamic hand gesture recognition from skeletal data. Sensors. 19, 239 (2019)","journal-title":"Sensors."},{"key":"2469_CR12","doi-asserted-by":"crossref","unstructured":"Li, C., Zhong, Q., Xie, D., Pu, S.: Co-occurrence feature learning from skeleton data for action recognition and detection with hierarchical aggregation. In: Proceedings of the Twenty-Seventh International Joint Conference on Artificial Intelligence, pp. 786\u2013792 (2018)","DOI":"10.24963\/ijcai.2018\/109"},{"key":"2469_CR13","doi-asserted-by":"publisher","first-page":"80","DOI":"10.1016\/j.patcog.2017.10.033","volume":"76","author":"JC N\u00fa\u00f1ez","year":"2018","unstructured":"N\u00fa\u00f1ez, J.C., Cabido, R., Pantrigo, J.J., Montemayor, A.S., V\u00e9lez, J.F.: Convolutional Neural Networks and Long Short-Term Memory for skeleton-based human activity and hand gesture recognition. Pattern Recogn. 76, 80\u201394 (2018)","journal-title":"Pattern Recogn."},{"key":"2469_CR14","doi-asserted-by":"crossref","unstructured":"Hou, J., Wang, G., Chen, X., Xue, J.-H., Zhu, R., Yang, H.: Spatial-temporal attention Res-TCN for skeleton-based dynamic hand gesture recognition. In: Leal-Taix\u00e9, L., Roth, S. (eds.) Proceedings of the European Conference on Computer Vision (ECCV), pp. 273\u2013286 (2019)","DOI":"10.1007\/978-3-030-11024-6_18"},{"key":"2469_CR15","doi-asserted-by":"publisher","first-page":"363","DOI":"10.1109\/TMM.2018.2859620","volume":"21","author":"Z Fan","year":"2019","unstructured":"Fan, Z., Zhao, X., Lin, T., Su, H.: Attention-based multiview re-observation fusion network for skeletal action recognition. IEEE Trans. Multimed. 21, 363\u2013374 (2019)","journal-title":"IEEE Trans. Multimed."},{"key":"2469_CR16","doi-asserted-by":"crossref","unstructured":"Feng, Y., Zhang, Z., Zhao, X., Ji, R., Gao, Y.: GVCNN: group-view convolutional neural networks for 3D shape recognition. In: 2018 IEEE Conference on Computer Vision and Pattern Recognition (CVPR), pp. 264\u2013272 (2018)","DOI":"10.1109\/CVPR.2018.00035"},{"key":"2469_CR17","doi-asserted-by":"crossref","unstructured":"Su, H., Maji, S., Kalogerakis, E., Learned-Miller, E.: Multi-view convolutional neural networks for 3D shape recognition. arXiv:1505.00880 [cs] (2015)","DOI":"10.1109\/ICCV.2015.114"},{"key":"2469_CR18","unstructured":"Wang, C., Pelillo, M., Siddiqi, K.: Dominant set clustering and pooling for multi-view 3D object recognition. arXiv:1906.01592 [cs] (2019)"},{"key":"2469_CR19","doi-asserted-by":"crossref","unstructured":"Garcia-Hernando, G., Yuan, S., Baek, S., Kim, T.-K.: First-person hand action benchmark with RGB-D videos and 3D hand pose annotations. In: 2018 IEEE Conference on Computer Vision and Pattern Recognition (CVPR), pp. 409\u2013419 (2018)","DOI":"10.1109\/CVPR.2018.00050"},{"key":"2469_CR20","doi-asserted-by":"publisher","first-page":"1369","DOI":"10.1109\/TMM.2014.2314073","volume":"16","author":"K Ding","year":"2014","unstructured":"Ding, K., Liu, Y.-H.: Sphere image for 3-D model retrieval. IEEE Trans. Multimed. 16, 1369\u20131376 (2014)","journal-title":"IEEE Trans. Multimed."},{"key":"2469_CR21","doi-asserted-by":"crossref","unstructured":"Biermann, H., Levin, A., Zorin, D.: Piecewise smooth subdivision surfaces with normal control. In: Proceedings of the 27th Annual Conference on Computer Graphics and Interactive Techniques, pp. 113\u2013120 (2000)","DOI":"10.1145\/344779.344841"},{"key":"2469_CR22","doi-asserted-by":"publisher","first-page":"92","DOI":"10.2307\/2346308","volume":"22","author":"HR Neave","year":"1973","unstructured":"Neave, H.R.: On using the Box\u2013Muller transformation with multiplicative congruential pseudo-random number generators. Appl. Stat. 22, 92 (1973)","journal-title":"Appl. Stat."},{"key":"2469_CR23","doi-asserted-by":"publisher","first-page":"5560","DOI":"10.1109\/TIP.2017.2740122","volume":"26","author":"B Liang","year":"2017","unstructured":"Liang, B., Li, H.: Specificity and latent correlation learning for action recognition using synthetic multi-view data from depth maps. IEEE Trans. Image Process. 26, 5560\u20135574 (2017)","journal-title":"IEEE Trans. Image Process."},{"key":"2469_CR24","doi-asserted-by":"crossref","unstructured":"Woo, S., Park, J., Lee, J.-Y., Kweon, I.S.: CBAM: Convolutional block attention module. In: Ferrari, V., Hebert, M., Sminchisescu, C., Weiss, Y. (eds.) Proceedings of the European Conference on Computer Vision (ECCV), pp. 3\u201319 (2018)","DOI":"10.1007\/978-3-030-01234-2_1"},{"key":"2469_CR25","unstructured":"Kingma, D.P., Ba, J.: Adam: a method for stochastic optimization. arXiv:1412.6980 [cs]. (2017)"},{"key":"2469_CR26","doi-asserted-by":"crossref","unstructured":"Boulahia, S.Y., Anquetil, E., Multon, F., Kulpa, R.: Dynamic hand gesture recognition based on 3D pattern assembled trajectories. In: 2017 Seventh International Conference on Image Processing Theory, Tools and Applications (IPTA), pp. 1\u20136 (2017)","DOI":"10.1109\/IPTA.2017.8310146"},{"key":"2469_CR27","doi-asserted-by":"crossref","unstructured":"Tu, J., Liu, M., Liu, H.: Skeleton-based human action recognition using spatial temporal 3D convolutional neural networks. In: 2018 IEEE International Conference on Multimedia and Expo (ICME), pp. 1\u20136 (2018)","DOI":"10.1109\/ICME.2018.8486566"},{"key":"2469_CR28","doi-asserted-by":"crossref","unstructured":"Yan, S., Xiong, Y., Lin, D.: Spatial temporal graph convolutional networks for skeleton-based action recognition. In: AAAI Conference on Artificial Intelligence, pp 7444\u20137452 (2018)","DOI":"10.1609\/aaai.v32i1.12328"},{"key":"2469_CR29","unstructured":"Chen, Y.: Construct dynamic graphs for hand gesture recognition via spatial-temporal attention. arXiv:1907.08871 [cs] (2019)"},{"key":"2469_CR30","doi-asserted-by":"crossref","unstructured":"Nguyen, X.S., Brun, L., L\u00e9zoray, O., Bougleux, S.: A neural network based on SPD manifold learning for skeleton-based hand gesture recognition. arXiv:1904.12970 [cs] (2019)","DOI":"10.1109\/CVPR.2019.01231"},{"key":"2469_CR31","doi-asserted-by":"crossref","unstructured":"Vemulapalli, R., Arrate, F., Chellappa, R.: Human action recognition by representing 3D skeletons as points in a Lie group. In: 2014 IEEE Conference on Computer Vision and Pattern Recognition (CVPR), pp. 588\u2013595 (2014)","DOI":"10.1109\/CVPR.2014.82"},{"key":"2469_CR32","doi-asserted-by":"crossref","unstructured":"Garcia-Hernando, G., Kim, T.-K.: Transition forests: learning discriminative temporal transitions for action recognition and detection. In: 2017 IEEE Conference on Computer Vision and Pattern Recognition (CVPR), pp. 407\u2013415 (2017)","DOI":"10.1109\/CVPR.2017.51"},{"key":"2469_CR33","doi-asserted-by":"crossref","unstructured":"Huang, Z., Van Gool, L.: A Riemannian network for SPD matrix learning. arXiv:1608.04233 [cs] (2016)","DOI":"10.1609\/aaai.v31i1.10866"},{"key":"2469_CR34","doi-asserted-by":"crossref","unstructured":"Zhang, X., Wang, Y., Gou, M., Sznaier, M., Camps, O.: Efficient temporal sequence comparison and classification using gram matrix embeddings on a Riemannian manifold. In: 2016 IEEE Conference on Computer Vision and Pattern Recognition (CVPR), pp. 4498\u20134507 (2016)","DOI":"10.1109\/CVPR.2016.487"}],"container-title":["Signal, Image and Video Processing"],"original-title":[],"language":"en","link":[{"URL":"https:\/\/link.springer.com\/content\/pdf\/10.1007\/s11760-022-02469-9.pdf","content-type":"application\/pdf","content-version":"vor","intended-application":"text-mining"},{"URL":"https:\/\/link.springer.com\/article\/10.1007\/s11760-022-02469-9\/fulltext.html","content-type":"text\/html","content-version":"vor","intended-application":"text-mining"},{"URL":"https:\/\/link.springer.com\/content\/pdf\/10.1007\/s11760-022-02469-9.pdf","content-type":"application\/pdf","content-version":"vor","intended-application":"similarity-checking"}],"deposited":{"date-parts":[[2023,5,18]],"date-time":"2023-05-18T00:30:24Z","timestamp":1684369824000},"score":1,"resource":{"primary":{"URL":"https:\/\/link.springer.com\/10.1007\/s11760-022-02469-9"}},"subtitle":[],"short-title":[],"issued":{"date-parts":[[2023,1,21]]},"references-count":34,"journal-issue":{"issue":"5","published-print":{"date-parts":[[2023,7]]}},"alternative-id":["2469"],"URL":"https:\/\/doi.org\/10.1007\/s11760-022-02469-9","relation":{"has-preprint":[{"id-type":"doi","id":"10.21203\/rs.3.rs-2285220\/v1","asserted-by":"object"}]},"ISSN":["1863-1703","1863-1711"],"issn-type":[{"value":"1863-1703","type":"print"},{"value":"1863-1711","type":"electronic"}],"subject":[],"published":{"date-parts":[[2023,1,21]]},"assertion":[{"value":"17 November 2022","order":1,"name":"received","label":"Received","group":{"name":"ArticleHistory","label":"Article History"}},{"value":"20 December 2022","order":2,"name":"revised","label":"Revised","group":{"name":"ArticleHistory","label":"Article History"}},{"value":"22 December 2022","order":3,"name":"accepted","label":"Accepted","group":{"name":"ArticleHistory","label":"Article History"}},{"value":"21 January 2023","order":4,"name":"first_online","label":"First Online","group":{"name":"ArticleHistory","label":"Article History"}},{"order":1,"name":"Ethics","group":{"name":"EthicsHeading","label":"Declarations"}},{"value":"The authors declare no competing interests.","order":2,"name":"Ethics","group":{"name":"EthicsHeading","label":"Conflict of interest"}}]}}