{"status":"ok","message-type":"work","message-version":"1.0.0","message":{"indexed":{"date-parts":[[2026,6,10]],"date-time":"2026-06-10T15:57:31Z","timestamp":1781107051836,"version":"3.54.1"},"reference-count":34,"publisher":"Elsevier BV","license":[{"start":{"date-parts":[[2026,9,1]],"date-time":"2026-09-01T00:00:00Z","timestamp":1788220800000},"content-version":"tdm","delay-in-days":0,"URL":"https:\/\/www.elsevier.com\/tdm\/userlicense\/1.0\/"},{"start":{"date-parts":[[2026,9,1]],"date-time":"2026-09-01T00:00:00Z","timestamp":1788220800000},"content-version":"tdm","delay-in-days":0,"URL":"https:\/\/www.elsevier.com\/legal\/tdmrep-license"},{"start":{"date-parts":[[2026,9,1]],"date-time":"2026-09-01T00:00:00Z","timestamp":1788220800000},"content-version":"stm-asf","delay-in-days":0,"URL":"https:\/\/doi.org\/10.15223\/policy-017"},{"start":{"date-parts":[[2026,9,1]],"date-time":"2026-09-01T00:00:00Z","timestamp":1788220800000},"content-version":"stm-asf","delay-in-days":0,"URL":"https:\/\/doi.org\/10.15223\/policy-037"},{"start":{"date-parts":[[2026,9,1]],"date-time":"2026-09-01T00:00:00Z","timestamp":1788220800000},"content-version":"stm-asf","delay-in-days":0,"URL":"https:\/\/doi.org\/10.15223\/policy-012"},{"start":{"date-parts":[[2026,9,1]],"date-time":"2026-09-01T00:00:00Z","timestamp":1788220800000},"content-version":"stm-asf","delay-in-days":0,"URL":"https:\/\/doi.org\/10.15223\/policy-029"},{"start":{"date-parts":[[2026,9,1]],"date-time":"2026-09-01T00:00:00Z","timestamp":1788220800000},"content-version":"stm-asf","delay-in-days":0,"URL":"https:\/\/doi.org\/10.15223\/policy-004"}],"funder":[{"DOI":"10.13039\/100018693","name":"Horizon 2020","doi-asserted-by":"publisher","id":[{"id":"10.13039\/100018693","id-type":"DOI","asserted-by":"publisher"}]}],"content-domain":{"domain":["elsevier.com","sciencedirect.com"],"crossmark-restriction":true},"short-container-title":["Robotics and Autonomous Systems"],"published-print":{"date-parts":[[2026,9]]},"DOI":"10.1016\/j.robot.2026.105518","type":"journal-article","created":{"date-parts":[[2026,5,8]],"date-time":"2026-05-08T23:29:27Z","timestamp":1778282967000},"page":"105518","update-policy":"https:\/\/doi.org\/10.1016\/elsevier_cm_policy","source":"Crossref","is-referenced-by-count":0,"special_numbering":"C","title":["A time and object aware transformer-based method for structured hierarchical gesture recognition"],"prefix":"10.1016","volume":"203","author":[{"ORCID":"https:\/\/orcid.org\/0009-0002-0098-0013","authenticated-orcid":false,"given":"Athanasios","family":"Papanikolaou","sequence":"first","affiliation":[],"role":[{"vocabulary":"crossref","role":"author"}]},{"given":"Vladimir","family":"Sivtsov","sequence":"additional","affiliation":[],"role":[{"vocabulary":"crossref","role":"author"}]},{"given":"Muslim","family":"Alaran","sequence":"additional","affiliation":[],"role":[{"vocabulary":"crossref","role":"author"}]},{"given":"Daniil","family":"Shkolnik","sequence":"additional","affiliation":[],"role":[{"vocabulary":"crossref","role":"author"}]},{"given":"Enrica","family":"Zereik","sequence":"additional","affiliation":[],"role":[{"vocabulary":"crossref","role":"author"}]},{"given":"Ivan","family":"Markovic","sequence":"additional","affiliation":[],"role":[{"vocabulary":"crossref","role":"author"}]},{"given":"Ivan","family":"Petrovic","sequence":"additional","affiliation":[],"role":[{"vocabulary":"crossref","role":"author"}]},{"given":"Fabio","family":"Bonsignorio","sequence":"additional","affiliation":[],"role":[{"vocabulary":"crossref","role":"author"}]}],"member":"78","reference":[{"issue":"1","key":"10.1016\/j.robot.2026.105518_b1","doi-asserted-by":"crossref","first-page":"135","DOI":"10.3390\/app12010135","article-title":"Advanced applications of industrial robotics: New trends and possibilities","volume":"12","author":"Dzedzickis","year":"2021","journal-title":"Appl. Sci."},{"key":"10.1016\/j.robot.2026.105518_b2","doi-asserted-by":"crossref","first-page":"162","DOI":"10.1016\/j.robot.2019.03.003","article-title":"Cobot programming for collaborative industrial tasks: An overview","volume":"116","author":"El Zaatari","year":"2019","journal-title":"Robot. Auton. Syst."},{"issue":"3","key":"10.1016\/j.robot.2026.105518_b3","doi-asserted-by":"crossref","first-page":"654","DOI":"10.1177\/0954405419883060","article-title":"A case study in human-robot collaboration in the disassembly of press-fitted components","volume":"234","author":"Huang","year":"2019","journal-title":"Proc. Inst. Mech. Eng. B"},{"key":"10.1016\/j.robot.2026.105518_b4","doi-asserted-by":"crossref","first-page":"323","DOI":"10.1016\/j.resconrec.2017.06.022","article-title":"Ease of disassembly of products to support circular economy strategies","volume":"135","author":"Vanegas","year":"2018","journal-title":"Resour. Conserv. Recycl."},{"key":"10.1016\/j.robot.2026.105518_b5","doi-asserted-by":"crossref","first-page":"1115","DOI":"10.1109\/OJIES.2024.3453900","article-title":"A functional and practical taxonomy for the industrial implementation of highly automated reverse manufacturing cells","volume":"5","author":"Morachioli","year":"2024","journal-title":"IEEE Open J. Ind. Electron. Soc."},{"key":"10.1016\/j.robot.2026.105518_b6","unstructured":"Vladimir Sivtsov, Athanasios Papanikolaou, Annagiulia Morachioli, Ivan Markovic, Ivan Petrovic, Enrica Zereik, Fabio Bonsignorio, Action Primitives for Bimanual Robotic Disassembly Cell of Printer Cartridges, in: Proceedings of the 10th IFAC Symposium on Mechatronic Systems (MECHATRONICS 2025) and the 14th IFAC Symposium on Robotics (ROBOTICS 2025), Paris, France, 2025, pp. 560\u2013562."},{"key":"10.1016\/j.robot.2026.105518_b7","unstructured":"Athanasios Papanikolaou, Vladimir Sivtsov, Annagiulia Morachioli, Ivan Markovic, Ivan Petrovic, Enrica Zereik, Fabio Bonsignorio, Design of a Bimanual Disassembly Cell for the Cartridge Substitution of an Off-the-Shelf Office Printer, in: Proceedings of the 10th IFAC Symposium on Mechatronic Systems (MECHATRONICS 2025) and the 14th IFAC Symposium on Robotics (ROBOTICS 2025), Paris, France, 2025, pp. 563\u2013566."},{"key":"10.1016\/j.robot.2026.105518_b8","doi-asserted-by":"crossref","DOI":"10.3389\/fnbot.2023.1320251","article-title":"Peg-in-hole assembly skill imitation learning method based on ProMPs under task geometric representation","volume":"17","author":"Zang","year":"2023","journal-title":"Front. Neurorobotics"},{"issue":"3","key":"10.1016\/j.robot.2026.105518_b9","doi-asserted-by":"crossref","first-page":"331","DOI":"10.1007\/s41095-022-0271-y","article-title":"Attention mechanisms in computer vision: A survey","volume":"8","author":"Guo","year":"2022","journal-title":"Comput. Vis. Media"},{"issue":"2","key":"10.1016\/j.robot.2026.105518_b10","doi-asserted-by":"crossref","first-page":"1","DOI":"10.1145\/3054912","article-title":"Imitation learning: A survey of learning methods","volume":"50","author":"Hussein","year":"2017","journal-title":"ACM Comput. Surv."},{"issue":"1","key":"10.1016\/j.robot.2026.105518_b11","doi-asserted-by":"crossref","first-page":"13","DOI":"10.1007\/s41315-022-00262-y","article-title":"An imitation learning approach for the control of a low-cost low-accuracy robotic arm for unstructured environments","volume":"7","author":"Bonsignorio","year":"2023","journal-title":"Int. J. Intell. Robot. Appl."},{"issue":"12","key":"10.1016\/j.robot.2026.105518_b12","doi-asserted-by":"crossref","first-page":"4027","DOI":"10.1080\/00207543.2019.1578906","article-title":"Human-robot collaboration in disassembly for sustainable manufacturing","volume":"57","author":"Liu","year":"2019","journal-title":"Int. J. Prod. Res."},{"key":"10.1016\/j.robot.2026.105518_b13","series-title":"2021 IEEE 7th International Conference on Virtual Reality","first-page":"246","article-title":"Research on gesture recognition and interaction of virtual collaborative disassembly training","author":"Hu","year":"2021"},{"key":"10.1016\/j.robot.2026.105518_b14","series-title":"Therbligs in action: Video understanding through motion primitives","author":"Dessalene","year":"2023"},{"issue":"1","key":"10.1016\/j.robot.2026.105518_b15","doi-asserted-by":"crossref","first-page":"49","DOI":"10.47982\/spool.2024.1.03","article-title":"Therblig to robot: Action packages, robot motion and Human-Robot collaboration in domestic environments","volume":"11","author":"Reinhardt","year":"2024","journal-title":"Spool"},{"key":"10.1016\/j.robot.2026.105518_b16","series-title":"Proceedings of the 38th International Conference on Machine Learning, ICML 2021, 18-24 July 2021, Virtual Event","first-page":"813","article-title":"Is Space-Time attention all you need for video understanding?","volume":"Vol. 139","author":"Bertasius","year":"2021"},{"key":"10.1016\/j.robot.2026.105518_b17","doi-asserted-by":"crossref","unstructured":"Anurag Arnab, Mostafa Dehghani, Georg Heigold, Chen Sun, Mario Lu\u010di\u0107, Cordelia Schmid, ViViT: A Video Vision Transformer, in: 2021 IEEE\/CVF International Conference on Computer Vision, ICCV, 2021, pp. 6816\u20136826.","DOI":"10.1109\/ICCV48922.2021.00676"},{"key":"10.1016\/j.robot.2026.105518_b18","doi-asserted-by":"crossref","unstructured":"Jo\u00e3o Carreira, Andrew Zisserman, Quo Vadis, Action Recognition? A New Model and the Kinetics Dataset, in: 2017 IEEE Conference on Computer Vision and Pattern Recognition, CVPR, 2017, pp. 4724\u20134733.","DOI":"10.1109\/CVPR.2017.502"},{"key":"10.1016\/j.robot.2026.105518_b19","doi-asserted-by":"crossref","unstructured":"Dian Shao, Yue Zhao, Bo Dai, Dahua Lin, FineGym: A Hierarchical Video Dataset for Fine-Grained Action Understanding, in: 2020 IEEE\/CVF Conference on Computer Vision and Pattern Recognition, CVPR, 2020, pp. 2613\u20132622.","DOI":"10.1109\/CVPR42600.2020.00269"},{"key":"10.1016\/j.robot.2026.105518_b20","article-title":"Hierarchical motion understanding via motion programs","author":"Kulal","year":"2021","journal-title":"Comput. Vis. Pattern Recognit."},{"key":"10.1016\/j.robot.2026.105518_b21","doi-asserted-by":"crossref","unstructured":"Dan Kondratyuk, Liangzhe Yuan, Yandong Li, Li Zhang, Mingxing Tan, Matthew Brown, Boqing Gong, MoViNets: Mobile Video Networks for Efficient Video Recognition, in: 2021 IEEE\/CVF Conference on Computer Vision and Pattern Recognition, CVPR, 2021, pp. 16015\u201316025.","DOI":"10.1109\/CVPR46437.2021.01576"},{"issue":"2","key":"10.1016\/j.robot.2026.105518_b22","doi-asserted-by":"crossref","DOI":"10.1007\/s10462-023-10650-w","article-title":"Overview of temporal action detection based on deep learning","volume":"57","author":"Hu","year":"2024","journal-title":"Artif. Intell. Rev."},{"issue":"5","key":"10.1016\/j.robot.2026.105518_b23","doi-asserted-by":"crossref","first-page":"1694","DOI":"10.3390\/s22051694","article-title":"Real-Time analysis of hand gesture recognition with temporal convolutional networks","volume":"22","author":"Tsinganos","year":"2022","journal-title":"Sensors"},{"issue":"2","key":"10.1016\/j.robot.2026.105518_b24","first-page":"1451","article-title":"SMART frame selection for action recognition","volume":"35","author":"Gowda","year":"2021","journal-title":"Proc. AAAI Conf. Artif. Intell."},{"key":"10.1016\/j.robot.2026.105518_b25","series-title":"MediaPipe hands: On-device Real-time hand tracking","author":"Zhang","year":"2020"},{"issue":"1","key":"10.1016\/j.robot.2026.105518_b26","doi-asserted-by":"crossref","DOI":"10.1186\/1687-6180-2012-36","article-title":"3D hand tracking using Kalman filter in depth space","volume":"2012","author":"Park","year":"2012","journal-title":"EURASIP J. Adv. Signal Process."},{"key":"10.1016\/j.robot.2026.105518_b27","doi-asserted-by":"crossref","unstructured":"Qiushi Fu, Marco Santello, Tracking whole hand kinematics using extended Kalman filter, in: 2010 Annual International Conference of the IEEE Engineering in Medicine and Biology, 2010, pp. 4606\u20134609.","DOI":"10.1109\/IEMBS.2010.5626513"},{"key":"10.1016\/j.robot.2026.105518_b28","series-title":"Ultralytics YOLOv5","author":"Jocher","year":"2020"},{"key":"10.1016\/j.robot.2026.105518_b29","unstructured":"Athanasios Papanikolaou, Vladimir Sivtsov, Daniil Shkolnik, Enrica Zereik, Ivan Markovic, Ivan Petrovic, Fabio Bonsignorio, A Transformer-Based Pipeline for Efficient Hand Gesture Recognition, in: Proceedings of the Intelligent Autonomous Systems 19 Conference, 2025."},{"issue":"3","key":"10.1016\/j.robot.2026.105518_b30","doi-asserted-by":"crossref","first-page":"674","DOI":"10.3390\/s25030674","article-title":"A posture training system based on therblig analysis and YOLO Model-Taking erhu bowing as an example","volume":"25","author":"Lu","year":"2025","journal-title":"Sensors"},{"key":"10.1016\/j.robot.2026.105518_b31","series-title":"AugMix: A simple data processing method to improve robustness and uncertainty","author":"Hendrycks","year":"2020"},{"key":"10.1016\/j.robot.2026.105518_b32","series-title":"Pattern Recognition and Machine Learning","author":"Bishop","year":"2006"},{"key":"10.1016\/j.robot.2026.105518_b33","series-title":"Probabilistic Graphical Models: Principles and Techniques","author":"Koller","year":"2009"},{"issue":"6","key":"10.1016\/j.robot.2026.105518_b34","doi-asserted-by":"crossref","first-page":"6647","DOI":"10.1109\/TPAMI.2020.3021756","article-title":"MS-TCN++: Multi-Stage temporal convolutional network for action segmentation","volume":"45","author":"Li","year":"2023","journal-title":"IEEE Trans. Pattern Anal. Mach. Intell."}],"container-title":["Robotics and Autonomous Systems"],"original-title":[],"language":"en","link":[{"URL":"https:\/\/api.elsevier.com\/content\/article\/PII:S0921889026001910?httpAccept=text\/xml","content-type":"text\/xml","content-version":"vor","intended-application":"text-mining"},{"URL":"https:\/\/api.elsevier.com\/content\/article\/PII:S0921889026001910?httpAccept=text\/plain","content-type":"text\/plain","content-version":"vor","intended-application":"text-mining"}],"deposited":{"date-parts":[[2026,6,10]],"date-time":"2026-06-10T15:02:38Z","timestamp":1781103758000},"score":1,"resource":{"primary":{"URL":"https:\/\/linkinghub.elsevier.com\/retrieve\/pii\/S0921889026001910"}},"subtitle":[],"short-title":[],"issued":{"date-parts":[[2026,9]]},"references-count":34,"alternative-id":["S0921889026001910"],"URL":"https:\/\/doi.org\/10.1016\/j.robot.2026.105518","relation":{},"ISSN":["0921-8890"],"issn-type":[{"value":"0921-8890","type":"print"}],"subject":[],"published":{"date-parts":[[2026,9]]},"assertion":[{"value":"Elsevier","name":"publisher","label":"This article is maintained by"},{"value":"A time and object aware transformer-based method for structured hierarchical gesture recognition","name":"articletitle","label":"Article Title"},{"value":"Robotics and Autonomous Systems","name":"journaltitle","label":"Journal Title"},{"value":"https:\/\/doi.org\/10.1016\/j.robot.2026.105518","name":"articlelink","label":"CrossRef DOI link to publisher maintained version"},{"value":"article","name":"content_type","label":"Content Type"},{"value":"\u00a9 2026 Elsevier B.V. All rights are reserved, including those for text and data mining, AI training, and similar technologies.","name":"copyright","label":"Copyright"}],"article-number":"105518"}}