{"status":"ok","message-type":"work","message-version":"1.0.0","message":{"indexed":{"date-parts":[[2026,4,26]],"date-time":"2026-04-26T00:49:50Z","timestamp":1777164590928,"version":"3.51.4"},"reference-count":50,"publisher":"Springer Science and Business Media LLC","issue":"3","license":[{"start":{"date-parts":[[2022,7,29]],"date-time":"2022-07-29T00:00:00Z","timestamp":1659052800000},"content-version":"tdm","delay-in-days":0,"URL":"https:\/\/www.springernature.com\/gp\/researchers\/text-and-data-mining"},{"start":{"date-parts":[[2022,7,29]],"date-time":"2022-07-29T00:00:00Z","timestamp":1659052800000},"content-version":"vor","delay-in-days":0,"URL":"https:\/\/www.springernature.com\/gp\/researchers\/text-and-data-mining"}],"content-domain":{"domain":["link.springer.com"],"crossmark-restriction":false},"short-container-title":["Multimed Tools Appl"],"published-print":{"date-parts":[[2023,1]]},"DOI":"10.1007\/s11042-022-13441-7","type":"journal-article","created":{"date-parts":[[2022,7,29]],"date-time":"2022-07-29T08:08:03Z","timestamp":1659082083000},"page":"4533-4550","update-policy":"https:\/\/doi.org\/10.1007\/springer_crossmark_policy","source":"Crossref","is-referenced-by-count":8,"title":["Motion saliency based hierarchical attention network for action recognition"],"prefix":"10.1007","volume":"82","author":[{"ORCID":"https:\/\/orcid.org\/0000-0001-8917-1102","authenticated-orcid":false,"given":"Zihui","family":"Guo","sequence":"first","affiliation":[]},{"given":"Yonghong","family":"Hou","sequence":"additional","affiliation":[]},{"given":"Renyi","family":"Xiao","sequence":"additional","affiliation":[]},{"given":"Chuankun","family":"Li","sequence":"additional","affiliation":[]},{"given":"Wanqing","family":"Li","sequence":"additional","affiliation":[]}],"member":"297","published-online":{"date-parts":[[2022,7,29]]},"reference":[{"key":"13441_CR1","doi-asserted-by":"crossref","unstructured":"Cao C, Lan C, Zhang Y, Zeng W, Lu H, Zhang Y (2018) Skeleton-based action recognition with gated convolutional neural networks. IEEE Trans Circ Syst Video Technol","DOI":"10.1109\/TCSVT.2018.2879913"},{"key":"13441_CR2","doi-asserted-by":"crossref","unstructured":"Chen C, Jafari R, Kehtarnavaz N (2015) Utd-mhad: a multimodal dataset for human action recognition utilizing a depth camera and a wearable inertial sensor. In: 2015 IEEE International conference on image processing (ICIP), pp 168\u2013172. IEEE","DOI":"10.1109\/ICIP.2015.7350781"},{"issue":"3","key":"13441_CR3","doi-asserted-by":"publisher","first-page":"1707","DOI":"10.1007\/s11042-019-08261-1","volume":"79","author":"Y Chen","year":"2020","unstructured":"Chen Y, Wang L, Li C, Hou Y, Li W (2020) Convnets-based action recognition from skeleton motion maps. Multimed Tools Appl 79 (3):1707\u20131725","journal-title":"Multimed Tools Appl"},{"issue":"2","key":"13441_CR4","doi-asserted-by":"publisher","first-page":"363","DOI":"10.1109\/TMM.2018.2859620","volume":"21","author":"Z Fan","year":"2018","unstructured":"Fan Z, Zhao X, Lin T, Su H (2018) Attention-based multiview re-observation fusion network for skeletal action recognition. IEEE Trans Multimed 21 (2):363\u2013374","journal-title":"IEEE Trans Multimed"},{"issue":"1","key":"13441_CR5","doi-asserted-by":"publisher","first-page":"591","DOI":"10.1007\/s11042-017-5290-9","volume":"78","author":"J Feng","year":"2019","unstructured":"Feng J, Zhang S, Xiao J (2019) Explorations of skeleton features for lstm-based action recognition. Multimed Tools Appl 78(1):591\u2013603","journal-title":"Multimed Tools Appl"},{"key":"13441_CR6","doi-asserted-by":"crossref","unstructured":"Gao X, Hu W, Tang J, Liu J, Guo Z (2019) Optimized skeleton-based action recognition via sparsified graph regression. In: Proceedings of the 27th ACM international conference on multimedia, pp 601\u2013610. ACM","DOI":"10.1145\/3343031.3351170"},{"key":"13441_CR7","doi-asserted-by":"crossref","unstructured":"Han Y, Chung SL, Ambikapathi A, Chan JS, Lin WY, Su SF (2018) Robust human action recognition using global spatial-temporal attention for human skeleton data. In: 2018 International joint conference on neural networks (IJCNN), pp 1\u20138. IEEE","DOI":"10.1109\/IJCNN.2018.8489386"},{"key":"13441_CR8","doi-asserted-by":"publisher","first-page":"88604","DOI":"10.1109\/ACCESS.2020.2992740","volume":"8","author":"Y Han","year":"2020","unstructured":"Han Y, Chung SL, Xiao Q, Lin WY, Su SF (2020) Global spatio-temporal attention for action recognition based on 3d human skeleton data. IEEE Access 8:88604\u201388616","journal-title":"IEEE Access"},{"issue":"3","key":"13441_CR9","doi-asserted-by":"publisher","first-page":"807","DOI":"10.1109\/TCSVT.2016.2628339","volume":"28","author":"Y Hou","year":"2016","unstructured":"Hou Y, Li Z, Wang P, Li W (2016) Skeleton optical spectra-based action recognition using convolutional neural networks. IEEE Trans Circ Syst Video Technol 28(3):807\u2013811","journal-title":"IEEE Trans Circ Syst Video Technol"},{"key":"13441_CR10","doi-asserted-by":"crossref","unstructured":"Hu G, Cui B, Yu S (2019) Skeleton-based action recognition with synchronous local and non-local spatio-temporal learning and frequency attention. In: 2019 IEEE International conference on multimedia and expo (ICME), pp 1216\u20131221. IEEE","DOI":"10.1109\/ICME.2019.00212"},{"key":"13441_CR11","doi-asserted-by":"crossref","unstructured":"Hu J, Shen L, Sun G (2018) Squeeze-and-excitation networks. In: Proceedings of the IEEE conference on computer vision and pattern recognition, pp 7132\u20137141","DOI":"10.1109\/CVPR.2018.00745"},{"key":"13441_CR12","doi-asserted-by":"crossref","unstructured":"Hu JF, Zheng WS, Lai J, Zhang J (2015) Jointly learning heterogeneous features for rgb-d activity recognition. In: Proceedings of the IEEE conference on computer vision and pattern recognition, pp 5344\u20135352","DOI":"10.1109\/CVPR.2015.7299172"},{"key":"13441_CR13","doi-asserted-by":"crossref","unstructured":"Huang G, Liu Z, Van Der Maaten L, Weinberger KQ (2017) Densely connected convolutional networks. In: Proceedings of the IEEE conference on computer vision and pattern recognition, pp 4700\u20134708","DOI":"10.1109\/CVPR.2017.243"},{"key":"13441_CR14","doi-asserted-by":"crossref","unstructured":"Ji Y, Xu F, Yang Y, Xie N, Shen HT, Harada T (2019) Attention transfer (ant) network for view-invariant action recognition. In: Proceedings of the 27th ACM International Conference on Multimedia, pp 574\u2013582. ACM","DOI":"10.1145\/3343031.3350959"},{"key":"13441_CR15","doi-asserted-by":"crossref","unstructured":"Kamel A, Sheng B, Yang P, Li P, Shen R, Feng DD (2018) Deep convolutional neural networks for human action recognition using depth maps and postures. IEEE Trans Syst Man Cybern Syst","DOI":"10.1109\/TSMC.2018.2850149"},{"issue":"6","key":"13441_CR16","doi-asserted-by":"publisher","first-page":"2842","DOI":"10.1109\/TIP.2018.2812099","volume":"27","author":"Q Ke","year":"2018","unstructured":"Ke Q, Bennamoun M, An S, Sohel F, Boussaid F (2018) Learning clip representations for skeleton-based 3d action recognition. IEEE Trans Image Process 27(6):2842\u20132855","journal-title":"IEEE Trans Image Process"},{"issue":"17","key":"13441_CR17","doi-asserted-by":"publisher","first-page":"22901","DOI":"10.1007\/s11042-018-5642-0","volume":"77","author":"B Li","year":"2018","unstructured":"Li B, He M, Dai Y, Cheng X, Chen Y (2018) 3d skeleton based action recognition by video-domain translation-scale invariant mapping and multi-scale dilated cnn. Multimed Tools Appl 77(17):22901\u201322921","journal-title":"Multimed Tools Appl"},{"key":"13441_CR18","doi-asserted-by":"crossref","unstructured":"Li B, Li X, Zhang Z, Wu F (2019) Spatio-temporal graph routing for skeleton-based action recognition, 33 8561\u20138568","DOI":"10.1609\/aaai.v33i01.33018561"},{"key":"13441_CR19","doi-asserted-by":"crossref","unstructured":"Li C, Wang P, Wang S, Hou Y, Li W (2017) Skeleton-based action recognition using lstm and cnn. In: 2017 IEEE International conference on multimedia & expo workshops (ICMEW), pp 585\u2013590. IEEE","DOI":"10.1109\/ICMEW.2017.8026287"},{"key":"13441_CR20","unstructured":"Li C, Zhong Q, Xie D, Pu S (2017) Skeleton-based action recognition with convolutional neural networks. In: 2017 IEEE International conference on multimedia & expo workshops (ICMEW), pp 597\u2013600. IEEE"},{"key":"13441_CR21","doi-asserted-by":"crossref","unstructured":"Li C, Zhong Q, Xie D, Pu S (2018) Co-occurrence feature learning from skeleton data for action recognition and detection with hierarchical aggregation. arXiv:http:\/\/arxiv.org\/aba\/1804.06055","DOI":"10.24963\/ijcai.2018\/109"},{"key":"13441_CR22","doi-asserted-by":"crossref","unstructured":"Li M, Chen S, Chen X, Zhang Y, Wang Y, Tian Q (2019) Actional-structural graph convolutional networks for skeleton-based action recognition. In: Proceedings of the IEEE conference on computer vision and pattern recognition, pp 3595\u20133603","DOI":"10.1109\/CVPR.2019.00371"},{"key":"13441_CR23","unstructured":"Liu J, Akhtar N, Mian A (2017) Skepxels: Spatio-temporal image representation of human skeleton joints for action recognition. arXiv:http:\/\/arxiv.org\/aba\/1711.05941"},{"issue":"12","key":"13441_CR24","doi-asserted-by":"publisher","first-page":"3007","DOI":"10.1109\/TPAMI.2017.2771306","volume":"40","author":"J Liu","year":"2017","unstructured":"Liu J, Shahroudy A, Xu D, Kot AC, Wang G (2017) Skeleton-based action recognition using spatio-temporal lstm network with trust gates. IEEE Trans Pattern Anal Mach Intell 40(12):3007\u20133021","journal-title":"IEEE Trans Pattern Anal Mach Intell"},{"key":"13441_CR25","doi-asserted-by":"crossref","unstructured":"Liu J, Wang G, Hu P, Duan LY, Kot AC (2017) Global context-aware attention lstm networks for 3d action recognition. In: Proceedings of the IEEE conference on computer vision and pattern recognition, pp 1647\u20131656","DOI":"10.1109\/CVPR.2017.391"},{"key":"13441_CR26","doi-asserted-by":"crossref","unstructured":"Meng F, Liu H, Liang Y, Tu J, Liua M (2019) Sample fusion network: an end-to-end data augmentation network for skeleton-based human action recognition. IEEE Trans Image Process","DOI":"10.1109\/TIP.2019.2913544"},{"key":"13441_CR27","doi-asserted-by":"crossref","unstructured":"Nie Q, Wang J, Wang X, Liu Y (2019) View-invariant human action recognition based on a 3d bio-constrained skeleton model. IEEE Trans Image Process","DOI":"10.1109\/TIP.2019.2907048"},{"key":"13441_CR28","doi-asserted-by":"crossref","unstructured":"Shahroudy A, Liu J, Ng TT, Wang G (2016) Ntu rgb+ d: a large scale dataset for 3d human activity analysis. In: Proceedings of the IEEE conference on computer vision and pattern recognition, pp 1010\u20131019","DOI":"10.1109\/CVPR.2016.115"},{"key":"13441_CR29","doi-asserted-by":"crossref","unstructured":"Shi L, Zhang Y, Cheng J, Lu H (2019) Skeleton-based action recognition with directed graph neural networks. In: Proceedings of the IEEE Conference on Computer Vision and Pattern Recognition, pp 7912\u20137921","DOI":"10.1109\/CVPR.2019.00810"},{"key":"13441_CR30","doi-asserted-by":"crossref","unstructured":"Shi L, Zhang Y, Cheng J, Lu H (2019) Two-stream adaptive graph convolutional networks for skeleton-based action recognition. In: Proceedings of the IEEE conference on computer vision and pattern recognition, pp 12026\u201312035","DOI":"10.1109\/CVPR.2019.01230"},{"key":"13441_CR31","doi-asserted-by":"crossref","unstructured":"Si C, Jing Y, Wang W, Wang L, Tan T (2018) Skeleton-based action recognition with spatial reasoning and temporal stack learning. In: Proceedings of the European Conference on Computer Vision (ECCV), pp 103\u2013118","DOI":"10.1007\/978-3-030-01246-5_7"},{"key":"13441_CR32","doi-asserted-by":"crossref","unstructured":"Song S, Lan C, Xing J, Zeng W, Liu J (2017) An end-to-end spatio-temporal attention model for human action recognition from skeleton data Thirty-first AAAI conference on artificial intelligence, pp 4263\u20134270","DOI":"10.1609\/aaai.v31i1.11212"},{"key":"13441_CR33","doi-asserted-by":"crossref","unstructured":"Tang Y, Tian Y, Lu J, Li P, Zhou J (2018) Deep progressive reinforcement learning for skeleton-based action recognition. In: Proceedings of the IEEE Conference on Computer Vision and Pattern Recognition, pp 5323\u20135332","DOI":"10.1109\/CVPR.2018.00558"},{"key":"13441_CR34","doi-asserted-by":"crossref","unstructured":"Tu J, Liu M, Liu H (2018) Skeleton-based human action recognition using spatial temporal 3d convolutional neural networks. In: 2018 IEEE International conference on multimedia and expo (ICME), pp 1\u20136. IEEE","DOI":"10.1109\/ICME.2018.8486566"},{"issue":"9","key":"13441_CR35","doi-asserted-by":"publisher","first-page":"4382","DOI":"10.1109\/TIP.2018.2837386","volume":"27","author":"H Wang","year":"2018","unstructured":"Wang H, Wang L (2018) Beyond joints: learning representations from primitive geometries for skeleton-based action recognition and detection. IEEE Trans Image Process 27(9):4382\u20134394","journal-title":"IEEE Trans Image Process"},{"key":"13441_CR36","doi-asserted-by":"publisher","first-page":"43","DOI":"10.1016\/j.knosys.2018.05.029","volume":"158","author":"P Wang","year":"2018","unstructured":"Wang P, Li W, Li C, Hou Y (2018) Action recognition based on joint trajectory maps with convolutional neural networks. Knowl-Based Syst 158:43\u201353","journal-title":"Knowl-Based Syst"},{"key":"13441_CR37","doi-asserted-by":"crossref","unstructured":"Wang X, Girshick R, Gupta A, He K (2018) Non-local neural networks. In: Proceedings of the IEEE conference on computer vision and pattern recognition, pp 7794\u20137803","DOI":"10.1109\/CVPR.2018.00813"},{"key":"13441_CR38","doi-asserted-by":"crossref","unstructured":"Wen YH, Gao L, Fu H, Zhang FL, Xia S (2019) Graph cnns with motif and variable temporal block for skeleton-based action recognition. In: Proceedings of the AAAI conference on artificial intelligence, vol 33, pp 8989\u20138996","DOI":"10.1609\/aaai.v33i01.33018989"},{"key":"13441_CR39","doi-asserted-by":"crossref","unstructured":"Xiao R, Hou Y, Guo Z, Li C, Wang P, Li W (2019) Self-attention guided deep features for action recognition. In: 2019 IEEE International conference on multimedia and expo (ICME), pp 1060\u20131065. IEEE","DOI":"10.1109\/ICME.2019.00186"},{"key":"13441_CR40","doi-asserted-by":"crossref","unstructured":"Xie C, Li C, Zhang B, Chen C, Han J, Zou C, Liu J (2018) Memory attention networks for skeleton-based action recognition. arXiv:1804.08254","DOI":"10.24963\/ijcai.2018\/227"},{"key":"13441_CR41","doi-asserted-by":"crossref","unstructured":"Yan S, Xiong Y, Lin D (2018) Spatial temporal graph convolutional networks for skeleton-based action recognition. In: Thirty-second AAAI conference on artificial intelligence, pp 7444\u20137452","DOI":"10.1609\/aaai.v32i1.12328"},{"key":"13441_CR42","doi-asserted-by":"crossref","unstructured":"Yang Z, Li Y, Yang J, Luo J (2018) Action recognition with spatio-temporal visual attention on skeleton image sequences. IEEE Trans Circ Syst Video Technol","DOI":"10.1109\/ICPR.2018.8546012"},{"key":"13441_CR43","doi-asserted-by":"crossref","unstructured":"Yang Z, Li Y, Yang J, Luo J (2018) Action recognition with visual attention on skeleton images. In: 2018 24th international conference on pattern recognition (ICPR), pp 3309\u20133314. IEEE","DOI":"10.1109\/ICPR.2018.8546012"},{"key":"13441_CR44","doi-asserted-by":"crossref","unstructured":"Zhang H, Song Y, Zhang Y (2019) Graph convolutional lstm model for skeleton-based action recognition. In: 2019 IEEE International conference on multimedia and expo (ICME), pp 412\u2013417. IEEE","DOI":"10.1109\/ICME.2019.00078"},{"issue":"9","key":"13441_CR45","doi-asserted-by":"publisher","first-page":"2330","DOI":"10.1109\/TMM.2018.2802648","volume":"20","author":"S Zhang","year":"2018","unstructured":"Zhang S, Yang Y, Xiao J, Liu X, Yang Y, Xie D, Zhuang Y (2018) Fusing geometric features for skeleton-based action recognition using multilayer lstm networks. IEEE Trans Multimed 20(9):2330\u20132343","journal-title":"IEEE Trans Multimed"},{"key":"13441_CR46","doi-asserted-by":"crossref","unstructured":"Zhao R, Wang K, Su H, Ji Q (2019) Bayesian graph convolution lstm for skeleton based action recognition. In: Proceedings of the IEEE international conference on computer vision, pp 6882\u20136892","DOI":"10.1109\/ICCV.2019.00698"},{"key":"13441_CR47","doi-asserted-by":"crossref","unstructured":"Zhao R, Xu W, Su H, Ji Q (2019) Bayesian hierarchical dynamic model for human action recognition. In: Proceedings of the IEEE conference on computer vision and pattern recognition, pp 7733\u20137742","DOI":"10.1109\/CVPR.2019.00792"},{"key":"13441_CR48","doi-asserted-by":"crossref","unstructured":"Zheng W, Li L, Zhang Z, Huang Y, Wang L (2019) Relational network for skeleton-based action recognition. In: 2019 IEEE International conference on multimedia and expo (ICME), pp 826\u2013831. IEEE","DOI":"10.1109\/ICME.2019.00147"},{"key":"13441_CR49","doi-asserted-by":"publisher","first-page":"109","DOI":"10.1016\/j.neucom.2019.08.043","volume":"370","author":"J Zhu","year":"2019","unstructured":"Zhu J, Zou W, Zhu Z, Hu Y (2019) Convolutional relation network for skeleton-based action recognition. Neurocomputing 370:109\u2013117","journal-title":"Neurocomputing"},{"key":"13441_CR50","doi-asserted-by":"crossref","unstructured":"Zhu K, Wang R, Zhao Q, Cheng J, Tao D (2019) A cuboid cnn model with an attention mechanism for skeleton-based action recognition. IEEE Trans Multimed","DOI":"10.1109\/TMM.2019.2962304"}],"container-title":["Multimedia Tools and Applications"],"original-title":[],"language":"en","link":[{"URL":"https:\/\/link.springer.com\/content\/pdf\/10.1007\/s11042-022-13441-7.pdf","content-type":"application\/pdf","content-version":"vor","intended-application":"text-mining"},{"URL":"https:\/\/link.springer.com\/article\/10.1007\/s11042-022-13441-7\/fulltext.html","content-type":"text\/html","content-version":"vor","intended-application":"text-mining"},{"URL":"https:\/\/link.springer.com\/content\/pdf\/10.1007\/s11042-022-13441-7.pdf","content-type":"application\/pdf","content-version":"vor","intended-application":"similarity-checking"}],"deposited":{"date-parts":[[2024,9,30]],"date-time":"2024-09-30T04:50:36Z","timestamp":1727671836000},"score":1,"resource":{"primary":{"URL":"https:\/\/link.springer.com\/10.1007\/s11042-022-13441-7"}},"subtitle":[],"short-title":[],"issued":{"date-parts":[[2022,7,29]]},"references-count":50,"journal-issue":{"issue":"3","published-print":{"date-parts":[[2023,1]]}},"alternative-id":["13441"],"URL":"https:\/\/doi.org\/10.1007\/s11042-022-13441-7","relation":{},"ISSN":["1380-7501","1573-7721"],"issn-type":[{"value":"1380-7501","type":"print"},{"value":"1573-7721","type":"electronic"}],"subject":[],"published":{"date-parts":[[2022,7,29]]},"assertion":[{"value":"11 January 2021","order":1,"name":"received","label":"Received","group":{"name":"ArticleHistory","label":"Article History"}},{"value":"27 May 2021","order":2,"name":"revised","label":"Revised","group":{"name":"ArticleHistory","label":"Article History"}},{"value":"2 July 2022","order":3,"name":"accepted","label":"Accepted","group":{"name":"ArticleHistory","label":"Article History"}},{"value":"29 July 2022","order":4,"name":"first_online","label":"First Online","group":{"name":"ArticleHistory","label":"Article History"}}]}}