{"status":"ok","message-type":"work","message-version":"1.0.0","message":{"indexed":{"date-parts":[[2025,11,22]],"date-time":"2025-11-22T11:22:56Z","timestamp":1763810576093,"version":"build-2065373602"},"reference-count":46,"publisher":"IEEE","license":[{"start":{"date-parts":[[2021,1,10]],"date-time":"2021-01-10T00:00:00Z","timestamp":1610236800000},"content-version":"vor","delay-in-days":0,"URL":"https:\/\/ieeexplore.ieee.org\/Xplorehelp\/downloads\/license-information\/IEEE.html"},{"start":{"date-parts":[[2021,1,10]],"date-time":"2021-01-10T00:00:00Z","timestamp":1610236800000},"content-version":"stm-asf","delay-in-days":0,"URL":"https:\/\/doi.org\/10.15223\/policy-029"},{"start":{"date-parts":[[2021,1,10]],"date-time":"2021-01-10T00:00:00Z","timestamp":1610236800000},"content-version":"stm-asf","delay-in-days":0,"URL":"https:\/\/doi.org\/10.15223\/policy-037"}],"content-domain":{"domain":[],"crossmark-restriction":false},"short-container-title":[],"published-print":{"date-parts":[[2021,1,10]]},"DOI":"10.1109\/icpr48806.2021.9412742","type":"proceedings-article","created":{"date-parts":[[2021,5,6]],"date-time":"2021-05-06T02:15:54Z","timestamp":1620267354000},"page":"6019-6026","source":"Crossref","is-referenced-by-count":7,"title":["3D attention mechanism for fine-grained classification of table tennis strokes using a Twin Spatio-Temporal Convolutional Neural Networks"],"prefix":"10.1109","author":[{"given":"Pierre-Etienne","family":"Martin","sequence":"first","affiliation":[]},{"given":"Jenny","family":"Benois-Pineau","sequence":"additional","affiliation":[]},{"given":"Renaud","family":"Peteri","sequence":"additional","affiliation":[]},{"given":"Julien","family":"Morlier","sequence":"additional","affiliation":[]}],"member":"263","reference":[{"key":"ref39","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR.2016.213"},{"key":"ref38","first-page":"568","article-title":"Two-stream convolutional networks for action recognition in videos","author":"simonyan","year":"2014","journal-title":"NIPS"},{"key":"ref33","doi-asserted-by":"publisher","DOI":"10.1007\/s11263-015-0816-y"},{"key":"ref32","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR.2016.308"},{"key":"ref31","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR.2018.00817"},{"key":"ref30","article-title":"Multiple moving object detection for fast video content description in compressed domain","volume":"2008","author":"manerba","year":"2008","journal-title":"EURASIP J Adv Sig Proc"},{"key":"ref37","doi-asserted-by":"publisher","DOI":"10.1109\/ICIP.2019.8803780"},{"key":"ref36","doi-asserted-by":"publisher","DOI":"10.1109\/ICCV.2011.6126543"},{"key":"ref35","doi-asserted-by":"publisher","DOI":"10.18653\/v1\/D16-1053"},{"key":"ref34","article-title":"Very deep convolutional networks for large-scale image recognition","volume":"abs 1409 1556","author":"simonyan","year":"2014","journal-title":"CoRR"},{"key":"ref10","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR42600.2020.00269"},{"key":"ref40","doi-asserted-by":"publisher","DOI":"10.1109\/TPAMI.2017.2706685"},{"key":"ref11","first-page":"1","article-title":"Forward-backward visual saliency propagation in deep nns vs internal attentional mechanisms","author":"obeso","year":"0","journal-title":"Ipta"},{"key":"ref12","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR.2017.683"},{"key":"ref13","article-title":"UCF101: A dataset of 101 human actions classes from videos in the wild","volume":"1212 402","author":"soomro","year":"2012","journal-title":"CoRR"},{"key":"ref14","article-title":"The kinetics human action video dataset","volume":"abs 1705 6950","author":"kay","year":"2017","journal-title":"CoRR"},{"key":"ref15","doi-asserted-by":"publisher","DOI":"10.1109\/TVCG.2019.2934630"},{"key":"ref16","doi-asserted-by":"publisher","DOI":"10.3390\/s20020333"},{"key":"ref17","doi-asserted-by":"publisher","DOI":"10.1109\/CVPRW50498.2020.00450"},{"key":"ref18","doi-asserted-by":"publisher","DOI":"10.1109\/CBMI.2018.8516488"},{"key":"ref19","doi-asserted-by":"publisher","DOI":"10.1007\/s11042-020-08917-3"},{"key":"ref28","doi-asserted-by":"publisher","DOI":"10.1007\/978-3-030-01270-0_23"},{"key":"ref4","doi-asserted-by":"publisher","DOI":"10.1109\/TPAMI.2017.2712608"},{"key":"ref27","doi-asserted-by":"publisher","DOI":"10.1109\/ICME.2019.00103"},{"key":"ref3","doi-asserted-by":"publisher","DOI":"10.1109\/ACCESS.2017.2778011"},{"key":"ref6","doi-asserted-by":"publisher","DOI":"10.1109\/TCSVT.2015.2475835"},{"key":"ref29","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR.2019.01017"},{"key":"ref5","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR.2017.502"},{"key":"ref8","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR.2018.00813"},{"key":"ref7","article-title":"Slowfast networks for video recognition","volume":"abs 1812 3982","author":"feichtenhofer","year":"2018","journal-title":"CoRR"},{"key":"ref2","doi-asserted-by":"publisher","DOI":"10.1109\/TPAMI.2017.2691768"},{"key":"ref9","doi-asserted-by":"publisher","DOI":"10.1109\/ICCV.2019.00718"},{"key":"ref1","article-title":"AVA: A video dataset of spatio-temporally localized atomic visual actions","volume":"abs 1705 8421","author":"gu","year":"2017","journal-title":"CoRR"},{"key":"ref46","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR.2015.7298594"},{"key":"ref20","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR.2017.391"},{"key":"ref45","first-page":"448","article-title":"Batch normalization: Accelerating deep network training by reducing internal covariate shift","volume":"37","author":"ioffe","year":"0","journal-title":"ICML"},{"key":"ref22","doi-asserted-by":"publisher","DOI":"10.1109\/TPAMI.2019.2913372"},{"key":"ref21","doi-asserted-by":"publisher","DOI":"10.1007\/s00371-019-01733-3"},{"key":"ref42","first-page":"1139","article-title":"On the importance of initialization and momentum in deep learning","volume":"28","author":"sutskever","year":"2013","journal-title":"Proceedings of the 30th International Conference on Machine Learning ICML 2013"},{"key":"ref24","doi-asserted-by":"publisher","DOI":"10.1109\/3DV.2019.00061"},{"journal-title":"Beyond pixels Exploring new representations and applications for motion analysis","year":"2009","author":"liu","key":"ref41"},{"key":"ref23","first-page":"352","article-title":"A2-Nets: Double Attention Networks","author":"chen","year":"2018","journal-title":"Advances in neural information processing systems"},{"key":"ref44","article-title":"Deep residual learning for image recognition","volume":"abs 1512 3385","author":"he","year":"2015","journal-title":"CoRR"},{"key":"ref26","first-page":"108","article-title":"Multimodal network embedding via attention based multi-view variational autoen-coder","author":"huang","year":"0","journal-title":"ICMR"},{"key":"ref43","doi-asserted-by":"publisher","DOI":"10.1007\/978-3-319-27863-6_74"},{"key":"ref25","article-title":"Paying more attention to attention: Improving the performance of convolutional neural networks via attention transfer","author":"zagoruyko","year":"2017","journal-title":"ICLR (Poster)"}],"event":{"name":"2020 25th International Conference on Pattern Recognition (ICPR)","start":{"date-parts":[[2021,1,10]]},"location":"Milan, Italy","end":{"date-parts":[[2021,1,15]]}},"container-title":["2020 25th International Conference on Pattern Recognition (ICPR)"],"original-title":[],"link":[{"URL":"http:\/\/xplorestaging.ieee.org\/ielx7\/9411940\/9411911\/09412742.pdf?arnumber=9412742","content-type":"unspecified","content-version":"vor","intended-application":"similarity-checking"}],"deposited":{"date-parts":[[2022,5,10]],"date-time":"2022-05-10T15:40:54Z","timestamp":1652197254000},"score":1,"resource":{"primary":{"URL":"https:\/\/ieeexplore.ieee.org\/document\/9412742\/"}},"subtitle":[],"short-title":[],"issued":{"date-parts":[[2021,1,10]]},"references-count":46,"URL":"https:\/\/doi.org\/10.1109\/icpr48806.2021.9412742","relation":{},"subject":[],"published":{"date-parts":[[2021,1,10]]}}}