{"status":"ok","message-type":"work","message-version":"1.0.0","message":{"indexed":{"date-parts":[[2026,6,2]],"date-time":"2026-06-02T09:24:56Z","timestamp":1780392296991,"version":"3.54.1"},"reference-count":90,"publisher":"Institute of Electrical and Electronics Engineers (IEEE)","license":[{"start":{"date-parts":[[2021,1,1]],"date-time":"2021-01-01T00:00:00Z","timestamp":1609459200000},"content-version":"vor","delay-in-days":0,"URL":"https:\/\/creativecommons.org\/licenses\/by\/4.0\/legalcode"},{"start":{"date-parts":[[2021,1,1]],"date-time":"2021-01-01T00:00:00Z","timestamp":1609459200000},"content-version":"am","delay-in-days":0,"URL":"https:\/\/creativecommons.org\/licenses\/by\/4.0\/legalcode"}],"funder":[{"DOI":"10.13039\/501100002341","name":"Academy of Finland for project MiGA","doi-asserted-by":"publisher","award":["316765"],"award-info":[{"award-number":["316765"]}],"id":[{"id":"10.13039\/501100002341","id-type":"DOI","asserted-by":"publisher"}]},{"name":"ICT 2023 Project","award":["328115"],"award-info":[{"award-number":["328115"]}]},{"DOI":"10.13039\/501100018948","name":"Infotech Oulu","doi-asserted-by":"publisher","id":[{"id":"10.13039\/501100018948","id-type":"DOI","asserted-by":"publisher"}]},{"DOI":"10.13039\/501100001809","name":"Chinese National Natural Science Foundation","doi-asserted-by":"publisher","award":["61961160704"],"award-info":[{"award-number":["61961160704"]}],"id":[{"id":"10.13039\/501100001809","id-type":"DOI","asserted-by":"publisher"}]},{"DOI":"10.13039\/501100001809","name":"Chinese National Natural Science Foundation","doi-asserted-by":"publisher","award":["61876179"],"award-info":[{"award-number":["61876179"]}],"id":[{"id":"10.13039\/501100001809","id-type":"DOI","asserted-by":"publisher"}]},{"name":"Science and Technology Development Fund of Macau","award":["0010\/2019\/AFJ"],"award-info":[{"award-number":["0010\/2019\/AFJ"]}]},{"name":"Science and Technology Development Fund of Macau","award":["0025\/2019\/AKP"],"award-info":[{"award-number":["0025\/2019\/AKP"]}]},{"DOI":"10.13039\/501100002367","name":"External Cooperation Key Project of Chinese Academy Sciences","doi-asserted-by":"publisher","award":["173211KYSB20200002"],"award-info":[{"award-number":["173211KYSB20200002"]}],"id":[{"id":"10.13039\/501100002367","id-type":"DOI","asserted-by":"publisher"}]}],"content-domain":{"domain":[],"crossmark-restriction":false},"short-container-title":["IEEE Trans. on Image Process."],"published-print":{"date-parts":[[2021]]},"DOI":"10.1109\/tip.2021.3087348","type":"journal-article","created":{"date-parts":[[2021,6,14]],"date-time":"2021-06-14T20:09:25Z","timestamp":1623701365000},"page":"5626-5640","source":"Crossref","is-referenced-by-count":111,"title":["Searching Multi-Rate and Multi-Modal Temporal Enhanced Networks for Gesture Recognition"],"prefix":"10.1109","volume":"30","author":[{"ORCID":"https:\/\/orcid.org\/0000-0001-6505-3304","authenticated-orcid":false,"given":"Zitong","family":"Yu","sequence":"first","affiliation":[],"role":[{"vocabulary":"crossref","role":"author"}]},{"ORCID":"https:\/\/orcid.org\/0000-0003-4883-5552","authenticated-orcid":false,"given":"Benjia","family":"Zhou","sequence":"additional","affiliation":[],"role":[{"vocabulary":"crossref","role":"author"}]},{"ORCID":"https:\/\/orcid.org\/0000-0002-4735-2885","authenticated-orcid":false,"given":"Jun","family":"Wan","sequence":"additional","affiliation":[],"role":[{"vocabulary":"crossref","role":"author"}]},{"ORCID":"https:\/\/orcid.org\/0000-0002-1430-0237","authenticated-orcid":false,"given":"Pichao","family":"Wang","sequence":"additional","affiliation":[],"role":[{"vocabulary":"crossref","role":"author"}]},{"ORCID":"https:\/\/orcid.org\/0000-0003-3267-2664","authenticated-orcid":false,"given":"Haoyu","family":"Chen","sequence":"additional","affiliation":[],"role":[{"vocabulary":"crossref","role":"author"}]},{"ORCID":"https:\/\/orcid.org\/0000-0002-2242-6139","authenticated-orcid":false,"given":"Xin","family":"Liu","sequence":"additional","affiliation":[],"role":[{"vocabulary":"crossref","role":"author"}]},{"given":"Stan Z.","family":"Li","sequence":"additional","affiliation":[],"role":[{"vocabulary":"crossref","role":"author"}]},{"ORCID":"https:\/\/orcid.org\/0000-0003-3694-206X","authenticated-orcid":false,"given":"Guoying","family":"Zhao","sequence":"additional","affiliation":[],"role":[{"vocabulary":"crossref","role":"author"}]}],"member":"263","reference":[{"key":"ref73","first-page":"1","article-title":"Learning adaptive hidden layers for mobile gesture recognition","author":"hu","year":"2018","journal-title":"Proc AAAI"},{"key":"ref72","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR.2017.638"},{"key":"ref71","doi-asserted-by":"publisher","DOI":"10.1007\/978-3-540-24673-2_3"},{"key":"ref70","doi-asserted-by":"publisher","DOI":"10.1109\/ICCV.2019.00140"},{"key":"ref76","doi-asserted-by":"publisher","DOI":"10.1016\/j.eswa.2019.112829"},{"key":"ref77","doi-asserted-by":"publisher","DOI":"10.1007\/978-3-030-58565-5_39"},{"key":"ref74","doi-asserted-by":"publisher","DOI":"10.1109\/ACCESS.2017.2684186"},{"key":"ref39","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR.2019.00504"},{"key":"ref75","doi-asserted-by":"publisher","DOI":"10.3390\/s20113305"},{"key":"ref38","doi-asserted-by":"publisher","DOI":"10.1007\/978-3-030-01225-0_18"},{"key":"ref78","doi-asserted-by":"publisher","DOI":"10.1109\/ICCVW.2019.00349"},{"key":"ref79","first-page":"1","article-title":"Real-time hand gesture detection and classification using convolutional neural networks","author":"k\u00f6p\u00fckl\u00fc","year":"2019","journal-title":"Proc FG"},{"key":"ref33","first-page":"1","article-title":"Cooperative training of deep aggregation networks for RGB-D action recognition","author":"wang","year":"2018","journal-title":"Proc AAAI"},{"key":"ref32","first-page":"568","article-title":"Two-stream convolutional networks for action recognition in videos","author":"simonyan","year":"2014","journal-title":"Proc NeurIPS"},{"key":"ref31","doi-asserted-by":"publisher","DOI":"10.1109\/ICCVW.2017.361"},{"key":"ref30","doi-asserted-by":"publisher","DOI":"10.1016\/j.knosys.2017.01.035"},{"key":"ref37","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR.2018.00677"},{"key":"ref36","doi-asserted-by":"publisher","DOI":"10.1109\/TNNLS.2019.2919764"},{"key":"ref35","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR.2018.00685"},{"key":"ref34","doi-asserted-by":"publisher","DOI":"10.1109\/ICCV.2015.510"},{"key":"ref60","article-title":"NAS-FAS: Static-dynamic central difference network search for face anti-spoofing","author":"yu","year":"2020","journal-title":"IEEE Trans Pattern Anal Mach Intell"},{"key":"ref62","first-page":"2902","article-title":"Large-scale evolution of image classifiers","author":"real","year":"2017","journal-title":"Proc ICML"},{"key":"ref61","doi-asserted-by":"publisher","DOI":"10.1609\/aaai.v33i01.33014780"},{"key":"ref63","first-page":"1","article-title":"ProxylessNAS: Direct neural architecture search on target task and hardware","author":"cai","year":"2019","journal-title":"Proc ICLR"},{"key":"ref28","doi-asserted-by":"publisher","DOI":"10.1109\/CVPRW.2012.6239185"},{"key":"ref64","doi-asserted-by":"publisher","DOI":"10.1109\/ICIP.2019.8802919"},{"key":"ref27","first-page":"2549","article-title":"One-shot learning gesture recognition from RGB-D data using bag of features","volume":"14","author":"wan","year":"2013","journal-title":"J Mach Learn Res"},{"key":"ref65","article-title":"Scheduled differentiable architecture search for visual recognition","author":"qiu","year":"2019","journal-title":"arXiv 1909 10236"},{"key":"ref66","doi-asserted-by":"publisher","DOI":"10.1007\/978-3-030-58598-3_27"},{"key":"ref29","doi-asserted-by":"publisher","DOI":"10.1109\/TPAMI.2015.2513479"},{"key":"ref67","doi-asserted-by":"publisher","DOI":"10.1016\/j.jvcir.2020.102942"},{"key":"ref68","doi-asserted-by":"publisher","DOI":"10.1609\/aaai.v34i03.5652"},{"key":"ref69","article-title":"MixConv: Mixed depthwise convolutional kernels","author":"tan","year":"2019","journal-title":"arXiv 1907 09595"},{"key":"ref2","doi-asserted-by":"publisher","DOI":"10.1109\/CVPRW.2016.100"},{"key":"ref1","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR.2016.456"},{"key":"ref20","doi-asserted-by":"publisher","DOI":"10.1109\/CVPRW.2019.00029"},{"key":"ref22","doi-asserted-by":"publisher","DOI":"10.1109\/TIP.2019.2912357"},{"key":"ref21","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR.2017.502"},{"key":"ref24","first-page":"1","article-title":"AssembleNet: Searching for multi-stream neural connectivity in video architectures","author":"ryoo","year":"2020","journal-title":"Proc ICLR"},{"key":"ref23","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR.2019.00713"},{"key":"ref26","doi-asserted-by":"publisher","DOI":"10.1117\/1.JEI.23.2.023017"},{"key":"ref25","article-title":"ChaLearn looking at people: IsoGD and ConGD large-scale RGB-D gesture recognition","author":"wan","year":"2019","journal-title":"arXiv 1907 12193"},{"key":"ref50","doi-asserted-by":"publisher","DOI":"10.1109\/ICPR.2016.7899601"},{"key":"ref51","doi-asserted-by":"publisher","DOI":"10.1109\/ICCVW.2017.369"},{"key":"ref90","doi-asserted-by":"publisher","DOI":"10.1109\/ICCV.2011.6126543"},{"key":"ref59","doi-asserted-by":"publisher","DOI":"10.1109\/LSP.2020.3007086"},{"key":"ref58","doi-asserted-by":"publisher","DOI":"10.1109\/ICASSP40776.2020.9053587"},{"key":"ref57","first-page":"1","article-title":"PC-DARTS: Partial channel connections for memory-efficient architecture search","author":"xu","year":"2019","journal-title":"Proc ICLR"},{"key":"ref56","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR.2018.00907"},{"key":"ref55","first-page":"1","article-title":"Neural architecture search with reinforcement learning","author":"zoph","year":"2017","journal-title":"Proc ICLR"},{"key":"ref54","first-page":"4095","article-title":"Efficient neural architecture search via parameters sharing","author":"pham","year":"2018","journal-title":"Proc ICML"},{"key":"ref53","first-page":"1","article-title":"Darts: Differentiable architecture search","author":"liu","year":"2019","journal-title":"Proc ICLR"},{"key":"ref52","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR.2019.00186"},{"key":"ref10","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR.2019.00126"},{"key":"ref11","first-page":"1953","article-title":"Attention in convolutional LSTM for gesture recognition","author":"zhang","year":"2018","journal-title":"Proc NeurIPS"},{"key":"ref40","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR42600.2020.00534"},{"key":"ref12","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR.2018.00151"},{"key":"ref13","doi-asserted-by":"publisher","DOI":"10.1007\/978-3-030-01249-6_24"},{"key":"ref14","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR.2019.01018"},{"key":"ref15","doi-asserted-by":"publisher","DOI":"10.1109\/ICCV.2019.00630"},{"key":"ref82","doi-asserted-by":"publisher","DOI":"10.1109\/3DV50981.2020.00072"},{"key":"ref16","first-page":"712","article-title":"Dynamic temporal pyramid network: A closer look at multi-scale modeling for activity detection","author":"zhang","year":"2018","journal-title":"Proc Asian Conf Comput Vis"},{"key":"ref81","doi-asserted-by":"publisher","DOI":"10.1109\/3DV.2019.00040"},{"key":"ref17","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR.2017.226"},{"key":"ref84","doi-asserted-by":"publisher","DOI":"10.1109\/TCSVT.2018.2875441"},{"key":"ref18","doi-asserted-by":"publisher","DOI":"10.1109\/TPAMI.2015.2461544"},{"key":"ref83","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR.2014.108"},{"key":"ref19","doi-asserted-by":"publisher","DOI":"10.1007\/978-3-319-57021-1_16"},{"key":"ref80","doi-asserted-by":"publisher","DOI":"10.1007\/s11263-015-0846-5"},{"key":"ref89","article-title":"UCF101: A dataset of 101 human actions classes from videos in the wild","author":"soomro","year":"2012","journal-title":"arXiv 1212 0402"},{"key":"ref4","doi-asserted-by":"publisher","DOI":"10.1109\/TMM.2018.2808769"},{"key":"ref3","doi-asserted-by":"publisher","DOI":"10.1109\/TITS.2014.2337331"},{"key":"ref6","doi-asserted-by":"publisher","DOI":"10.1007\/s10462-012-9356-9"},{"key":"ref5","doi-asserted-by":"publisher","DOI":"10.1109\/IJCNN.1999.832699"},{"key":"ref85","doi-asserted-by":"publisher","DOI":"10.1016\/j.eswa.2020.114499"},{"key":"ref8","first-page":"25","article-title":"Large-scale gesture recognition with a fusion of RGB-D data based on the C3D model","author":"li","year":"2016","journal-title":"Proc ICPR"},{"key":"ref86","doi-asserted-by":"publisher","DOI":"10.5244\/C.23.124"},{"key":"ref7","doi-asserted-by":"publisher","DOI":"10.1109\/ICCVW.2017.360"},{"key":"ref49","doi-asserted-by":"publisher","DOI":"10.1145\/3131343"},{"key":"ref87","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR.2008.4587756"},{"key":"ref88","article-title":"Very deep convolutional networks for large-scale image recognition","author":"simonyan","year":"2014","journal-title":"arXiv 1409 1556"},{"key":"ref9","doi-asserted-by":"publisher","DOI":"10.1109\/ICCVW.2017.371"},{"key":"ref46","doi-asserted-by":"publisher","DOI":"10.1007\/s11042-020-08747-3"},{"key":"ref45","article-title":"3D skeletal gesture recognition via discriminative coding on time-warping invariant Riemannian trajectories","author":"liu","year":"2020","journal-title":"IEEE Trans Multimedia"},{"key":"ref48","doi-asserted-by":"publisher","DOI":"10.1109\/TCSVT.2017.2749509"},{"key":"ref47","doi-asserted-by":"publisher","DOI":"10.1109\/TIP.2017.2718189"},{"key":"ref42","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR.2018.00549"},{"key":"ref41","doi-asserted-by":"publisher","DOI":"10.1109\/CVPRW50498.2020.00333"},{"key":"ref44","doi-asserted-by":"publisher","DOI":"10.1109\/TIP.2020.2974061"},{"key":"ref43","doi-asserted-by":"publisher","DOI":"10.1016\/j.patrec.2017.12.003"}],"container-title":["IEEE Transactions on Image Processing"],"original-title":[],"link":[{"URL":"http:\/\/xplorestaging.ieee.org\/ielx7\/83\/9263394\/09454270.pdf?arnumber=9454270","content-type":"unspecified","content-version":"vor","intended-application":"similarity-checking"}],"deposited":{"date-parts":[[2022,1,17]],"date-time":"2022-01-17T18:38:22Z","timestamp":1642444702000},"score":1,"resource":{"primary":{"URL":"https:\/\/ieeexplore.ieee.org\/document\/9454270\/"}},"subtitle":[],"short-title":[],"issued":{"date-parts":[[2021]]},"references-count":90,"URL":"https:\/\/doi.org\/10.1109\/tip.2021.3087348","relation":{},"ISSN":["1057-7149","1941-0042"],"issn-type":[{"value":"1057-7149","type":"print"},{"value":"1941-0042","type":"electronic"}],"subject":[],"published":{"date-parts":[[2021]]}}}