{"status":"ok","message-type":"work","message-version":"1.0.0","message":{"indexed":{"date-parts":[[2026,2,25]],"date-time":"2026-02-25T17:30:34Z","timestamp":1772040634998,"version":"3.50.1"},"reference-count":18,"publisher":"IEEE","content-domain":{"domain":[],"crossmark-restriction":false},"short-container-title":[],"published-print":{"date-parts":[[2018,12]]},"DOI":"10.1109\/vcip.2018.8698697","type":"proceedings-article","created":{"date-parts":[[2019,4,25]],"date-time":"2019-04-25T22:47:33Z","timestamp":1556232453000},"page":"1-4","source":"Crossref","is-referenced-by-count":3,"title":["Multi-task CNN Model for Action Detection"],"prefix":"10.1109","author":[{"given":"Xin","family":"Chen","sequence":"first","affiliation":[]},{"given":"Yahong","family":"Han","sequence":"additional","affiliation":[]}],"member":"263","reference":[{"key":"ref10","doi-asserted-by":"publisher","DOI":"10.1109\/ICCV.2015.510"},{"key":"ref11","doi-asserted-by":"publisher","DOI":"10.1109\/ICCV.2015.362"},{"key":"ref12","first-page":"391","article-title":"Edge boxes: Locating object proposals from edges","author":"zitnick","year":"2014","journal-title":"European Conference on Computer Vision"},{"key":"ref13","doi-asserted-by":"publisher","DOI":"10.1109\/ICCV.2017.620"},{"key":"ref14","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR.2017.690"},{"key":"ref15","first-page":"25","article-title":"High accuracy optical flow estimation based on a theory for warping","author":"brox","year":"2004","journal-title":"European Conference on Computer Vision"},{"key":"ref16","article-title":"Ucf101: A dataset of 101 human actions classes from videos in the wild","author":"soomro","year":"2012"},{"key":"ref17","doi-asserted-by":"publisher","DOI":"10.1109\/ICCV.2013.396"},{"key":"ref18","doi-asserted-by":"publisher","DOI":"10.5244\/C.30.58"},{"key":"ref4","first-page":"91","article-title":"Faster r-cnn: Towards real-time object detection with region proposal networks","author":"ren","year":"2015","journal-title":"Advances in neural information processing systems"},{"key":"ref3","first-page":"21","article-title":"Ssd: Single shot multibox detector","author":"liu","year":"2016","journal-title":"European Conference on Computer Vision"},{"key":"ref6","doi-asserted-by":"publisher","DOI":"10.1109\/ICCV.2017.393"},{"key":"ref5","doi-asserted-by":"publisher","DOI":"10.1007\/978-3-319-46493-0_45"},{"key":"ref8","doi-asserted-by":"publisher","DOI":"10.1109\/ICCV.2017.472"},{"key":"ref7","first-page":"568","article-title":"Two-stream convolutional networks for action recognition in videos","author":"simonyan","year":"2014","journal-title":"Advances in neural information processing systems"},{"key":"ref2","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR.2015.7298676"},{"key":"ref1","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR.2013.341"},{"key":"ref9","article-title":"Hyperface: A deep multitask learning framework for face detection, landmark localization, pose estimation, and gender recognition","author":"ranjan","year":"2017","journal-title":"IEEE Transactions on Pattern Analysis and Machine Intelligence"}],"event":{"name":"2018 IEEE Visual Communications and Image Processing (VCIP)","location":"Taichung, Taiwan","start":{"date-parts":[[2018,12,9]]},"end":{"date-parts":[[2018,12,12]]}},"container-title":["2018 IEEE Visual Communications and Image Processing (VCIP)"],"original-title":[],"link":[{"URL":"http:\/\/xplorestaging.ieee.org\/ielx7\/8694905\/8698608\/08698697.pdf?arnumber=8698697","content-type":"unspecified","content-version":"vor","intended-application":"similarity-checking"}],"deposited":{"date-parts":[[2019,5,13]],"date-time":"2019-05-13T19:01:07Z","timestamp":1557774067000},"score":1,"resource":{"primary":{"URL":"https:\/\/ieeexplore.ieee.org\/document\/8698697\/"}},"subtitle":[],"short-title":[],"issued":{"date-parts":[[2018,12]]},"references-count":18,"URL":"https:\/\/doi.org\/10.1109\/vcip.2018.8698697","relation":{},"subject":[],"published":{"date-parts":[[2018,12]]}}}