{"status":"ok","message-type":"work","message-version":"1.0.0","message":{"indexed":{"date-parts":[[2025,10,29]],"date-time":"2025-10-29T03:39:59Z","timestamp":1761709199773},"reference-count":29,"publisher":"IEEE","content-domain":{"domain":[],"crossmark-restriction":false},"short-container-title":[],"published-print":{"date-parts":[[2016,3]]},"DOI":"10.1109\/wacv.2016.7477589","type":"proceedings-article","created":{"date-parts":[[2016,5,26]],"date-time":"2016-05-26T20:27:33Z","timestamp":1464294453000},"source":"Crossref","is-referenced-by-count":110,"title":["Combining multiple sources of knowledge in deep CNNs for action recognition"],"prefix":"10.1109","author":[{"given":"Eunbyung","family":"Park","sequence":"first","affiliation":[]},{"given":"Xufeng","family":"Han","sequence":"additional","affiliation":[]},{"given":"Tamara L.","family":"Berg","sequence":"additional","affiliation":[]},{"given":"Alexander C.","family":"Berg","sequence":"additional","affiliation":[]}],"member":"263","reference":[{"key":"ref10","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR.2014.223"},{"key":"ref11","article-title":"Imagenet classification with deep convolutional neural networks","author":"krizhevsky","year":"2012","journal-title":"NIPS"},{"key":"ref12","doi-asserted-by":"publisher","DOI":"10.1109\/ICCV.2011.6126543"},{"key":"ref13","article-title":"Beyond gaussian pyramid: Multi-skip feature stacking for action recognition","author":"lan","year":"2015","journal-title":"CVPR"},{"key":"ref14","doi-asserted-by":"publisher","DOI":"10.1109\/ICCV.2015.170"},{"key":"ref15","article-title":"Fully convolutional networks for semantic segmentation","author":"long","year":"2015","journal-title":"CVPR"},{"key":"ref16","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR.2015.7298778"},{"key":"ref17","doi-asserted-by":"publisher","DOI":"10.1007\/s11263-015-0816-y"},{"key":"ref18","article-title":"Two-stream convolutional networks for action recognition in videos","author":"simonyan","year":"2014","journal-title":"NIPS"},{"key":"ref19","article-title":"Very deep convolutional networks for large-scale image recognition","author":"simonyan","year":"2015","journal-title":"ICLRE"},{"key":"ref28","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR.2015.7299101"},{"key":"ref4","article-title":"Matchnet: Unifying feature and metric learning for patch-based matching","author":"han","year":"2015","journal-title":"CVPR"},{"key":"ref27","doi-asserted-by":"publisher","DOI":"10.1145\/2733373.2806222"},{"key":"ref3","article-title":"Learning rich features from RGB-D images for object detection and segmentation","author":"gupta","year":"2014","journal-title":"ECCV"},{"key":"ref6","doi-asserted-by":"publisher","DOI":"10.1162\/neco.1997.9.8.1735"},{"key":"ref29","doi-asserted-by":"publisher","DOI":"10.5244\/C.29.60"},{"key":"ref5","article-title":"Improving neural networks by preventing co-adaptation of feature detectors","author":"hinton","year":"2012","journal-title":"arXiv preprint arXiv 1207 0580"},{"key":"ref8","doi-asserted-by":"publisher","DOI":"10.1145\/2647868.2654889"},{"key":"ref7","doi-asserted-by":"publisher","DOI":"10.1109\/TPAMI.2012.59"},{"key":"ref2","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR.2014.81"},{"key":"ref9","article-title":"Exploiting feature and class relationships in video categorization with regularized deep neural networks","author":"jiang","year":"2015","journal-title":"arXiv preprint arXiv 1502 01032"},{"key":"ref1","article-title":"Long-term recurrent convolutional networks for visual recognition and description","author":"donahue","year":"2015","journal-title":"CVPR"},{"key":"ref20","article-title":"Learning and selecting features jointly with point-wise gated boltzmann machines","author":"sohn","year":"2013","journal-title":"ICML"},{"key":"ref22","article-title":"Generating text with recurrent neural networks","author":"sutskever","year":"2011","journal-title":"ICML"},{"key":"ref21","article-title":"UCF101: A dataset of 101 human actions classes from videos in the wild","author":"soomro","year":"2012","journal-title":"arXiv preprint arXiv 1212 0402"},{"key":"ref24","article-title":"C3D: generic features for video analysis","author":"tran","year":"2014","journal-title":"arXiv preprint arXiv 1412 0767"},{"key":"ref23","doi-asserted-by":"publisher","DOI":"10.1162\/089976600300015349"},{"key":"ref26","article-title":"Action recognition with trajectory-pooled deep-convolutional descriptors","author":"wang","year":"2015","journal-title":"CVPR"},{"key":"ref25","doi-asserted-by":"publisher","DOI":"10.1109\/ICCV.2013.441"}],"event":{"name":"2016 IEEE Winter Conference on Applications of Computer Vision (WACV)","location":"Lake Placid, NY, USA","start":{"date-parts":[[2016,3,7]]},"end":{"date-parts":[[2016,3,10]]}},"container-title":["2016 IEEE Winter Conference on Applications of Computer Vision (WACV)"],"original-title":[],"link":[{"URL":"http:\/\/xplorestaging.ieee.org\/ielx7\/7469250\/7477446\/07477589.pdf?arnumber=7477589","content-type":"unspecified","content-version":"vor","intended-application":"similarity-checking"}],"deposited":{"date-parts":[[2016,9,23]],"date-time":"2016-09-23T20:07:42Z","timestamp":1474661262000},"score":1,"resource":{"primary":{"URL":"http:\/\/ieeexplore.ieee.org\/document\/7477589\/"}},"subtitle":[],"short-title":[],"issued":{"date-parts":[[2016,3]]},"references-count":29,"URL":"https:\/\/doi.org\/10.1109\/wacv.2016.7477589","relation":{},"subject":[],"published":{"date-parts":[[2016,3]]}}}