{"status":"ok","message-type":"work","message-version":"1.0.0","message":{"indexed":{"date-parts":[[2024,10,30]],"date-time":"2024-10-30T00:10:54Z","timestamp":1730247054653,"version":"3.28.0"},"reference-count":26,"publisher":"IEEE","license":[{"start":{"date-parts":[[2020,10,1]],"date-time":"2020-10-01T00:00:00Z","timestamp":1601510400000},"content-version":"vor","delay-in-days":0,"URL":"https:\/\/ieeexplore.ieee.org\/Xplorehelp\/downloads\/license-information\/IEEE.html"},{"start":{"date-parts":[[2020,10,1]],"date-time":"2020-10-01T00:00:00Z","timestamp":1601510400000},"content-version":"stm-asf","delay-in-days":0,"URL":"https:\/\/doi.org\/10.15223\/policy-029"},{"start":{"date-parts":[[2020,10,1]],"date-time":"2020-10-01T00:00:00Z","timestamp":1601510400000},"content-version":"stm-asf","delay-in-days":0,"URL":"https:\/\/doi.org\/10.15223\/policy-037"}],"content-domain":{"domain":[],"crossmark-restriction":false},"short-container-title":[],"published-print":{"date-parts":[[2020,10]]},"DOI":"10.1109\/icip40778.2020.9190996","type":"proceedings-article","created":{"date-parts":[[2020,9,30]],"date-time":"2020-09-30T16:45:18Z","timestamp":1601484318000},"page":"1761-1765","source":"Crossref","is-referenced-by-count":9,"title":["Attention Boosted Deep Networks For Video Classification"],"prefix":"10.1109","author":[{"given":"Junyong","family":"You","sequence":"first","affiliation":[]},{"given":"Jari","family":"Korhonen","sequence":"additional","affiliation":[]}],"member":"263","reference":[{"key":"ref10","doi-asserted-by":"publisher","DOI":"10.1145\/2733373.2806222"},{"key":"ref11","article-title":"Neural Machine Translation by Jointly Learning to Align and Translate","author":"bahdanau","year":"2015","journal-title":"Proc ICLR&#x2019;205"},{"key":"ref12","article-title":"Show, Attend and Tell: Neural Image Caption Generation with Visual Attention","author":"xu","year":"2015","journal-title":"Proc ICML&#x2019;2015"},{"key":"ref13","doi-asserted-by":"publisher","DOI":"10.18653\/v1\/N16-1174"},{"key":"ref14","article-title":"Forward-backward Visual Saliency Propagation in Deep NNs vs Internal Attentional Mechanisms","author":"obeso","year":"2019","journal-title":"Proc IPTA&#x2019;2019"},{"key":"ref15","article-title":"An End-to-End Spatio-Temporal Attention Model for Human Action Recognition from Skeleton Data","author":"song","year":"2017","journal-title":"Proc AAAI&#x2019;2017"},{"key":"ref16","doi-asserted-by":"publisher","DOI":"10.1109\/TIP.2018.2818328"},{"key":"ref17","doi-asserted-by":"publisher","DOI":"10.1016\/j.patrec.2018.07.034"},{"key":"ref18","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR.2009.5206848"},{"key":"ref19","article-title":"Very Deep Convolutional Networks for Large-Scale Image Recognition","author":"simonyan","year":"2015","journal-title":"Proc ICLR&#x2019;2015"},{"key":"ref4","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR.2014.223"},{"key":"ref3","doi-asserted-by":"crossref","first-page":"436","DOI":"10.1038\/nature14539","article-title":"Deep Learning","volume":"521","author":"lecun","year":"2015","journal-title":"Nature"},{"key":"ref6","article-title":"Two-Stream Convolutional Networks for Action Recognition in Videos","author":"simonyan","year":"2014","journal-title":"Proc NIPS&#x2019;2014"},{"key":"ref5","doi-asserted-by":"publisher","DOI":"10.1162\/neco.1997.9.8.1735"},{"key":"ref8","doi-asserted-by":"publisher","DOI":"10.1109\/ICCV.2017.590"},{"key":"ref7","doi-asserted-by":"publisher","DOI":"10.1109\/TPAMI.2012.59"},{"key":"ref2","doi-asserted-by":"publisher","DOI":"10.1016\/j.image.2010.02.001"},{"key":"ref1","doi-asserted-by":"publisher","DOI":"10.1109\/TSMCC.2008.919173"},{"key":"ref9","article-title":"Beyond Short Snippets: Deep Networks for Video Classification","author":"ng","year":"2015","journal-title":"Proc CVPR&#x2019;2015"},{"key":"ref20","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR.2016.308"},{"key":"ref22","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR.2017.195"},{"key":"ref21","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR.2016.90"},{"key":"ref24","article-title":"UCF101: A Dataset of 101 Human Action Classes From Videos in The Wild","author":"soomro","year":"2012","journal-title":"CRCV-TR-12-01"},{"journal-title":"Implementation of the proposed networks available","year":"0","author":"you","key":"ref23"},{"key":"ref26","doi-asserted-by":"publisher","DOI":"10.1037\/0096-3445.133.3.339"},{"journal-title":"Sports-1M dataset","year":"0","key":"ref25"}],"event":{"name":"2020 IEEE International Conference on Image Processing (ICIP)","start":{"date-parts":[[2020,10,25]]},"location":"Abu Dhabi, United Arab Emirates","end":{"date-parts":[[2020,10,28]]}},"container-title":["2020 IEEE International Conference on Image Processing (ICIP)"],"original-title":[],"link":[{"URL":"http:\/\/xplorestaging.ieee.org\/ielx7\/9184803\/9190635\/09190996.pdf?arnumber=9190996","content-type":"unspecified","content-version":"vor","intended-application":"similarity-checking"}],"deposited":{"date-parts":[[2022,6,27]],"date-time":"2022-06-27T20:12:54Z","timestamp":1656360774000},"score":1,"resource":{"primary":{"URL":"https:\/\/ieeexplore.ieee.org\/document\/9190996\/"}},"subtitle":[],"short-title":[],"issued":{"date-parts":[[2020,10]]},"references-count":26,"URL":"https:\/\/doi.org\/10.1109\/icip40778.2020.9190996","relation":{},"subject":[],"published":{"date-parts":[[2020,10]]}}}