{"status":"ok","message-type":"work","message-version":"1.0.0","message":{"indexed":{"date-parts":[[2025,12,6]],"date-time":"2025-12-06T16:42:02Z","timestamp":1765039322499,"version":"3.28.0"},"reference-count":31,"publisher":"IEEE","content-domain":{"domain":[],"crossmark-restriction":false},"short-container-title":[],"published-print":{"date-parts":[[2016,7]]},"DOI":"10.1109\/ijcnn.2016.7727435","type":"proceedings-article","created":{"date-parts":[[2016,11,8]],"date-time":"2016-11-08T21:15:56Z","timestamp":1478639756000},"page":"1924-1931","source":"Crossref","is-referenced-by-count":13,"title":["Exploring multimodal video representation for action recognition"],"prefix":"10.1109","author":[{"family":"Cheng Wang","sequence":"first","affiliation":[]},{"family":"Haojin Yang","sequence":"additional","affiliation":[]},{"given":"Christoph","family":"Meinel","sequence":"additional","affiliation":[]}],"member":"263","reference":[{"key":"ref31","article-title":"Unsupervised learning of video representations using lstms","author":"srivastava","year":"2015","journal-title":"CoRR vol absI1502 04681"},{"key":"ref30","doi-asserted-by":"publisher","DOI":"10.1145\/2647868.2654889"},{"key":"ref10","doi-asserted-by":"publisher","DOI":"10.1109\/TPAMI.2012.59"},{"key":"ref11","doi-asserted-by":"publisher","DOI":"10.5244\/C.26.124"},{"key":"ref12","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR.2014.223"},{"key":"ref13","first-page":"689","article-title":"Multimodal deep learning","author":"ngiam","year":"2011","journal-title":"Proceedings of the 28th International Conference on Machine Learning (ICML-11)"},{"key":"ref14","first-page":"2222","article-title":"Multimodallearning with deep boltzmann machines","author":"srivastava","year":"2012","journal-title":"Advances in neural information processing systems"},{"key":"ref15","doi-asserted-by":"publisher","DOI":"10.1109\/ICCV.2009.5459154"},{"key":"ref16","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR.2014.83"},{"key":"ref17","doi-asserted-by":"crossref","first-page":"428","DOI":"10.1007\/11744047_33","article-title":"Human detection using oriented histograms of flow and appearance","author":"dalal","year":"2006","journal-title":"Computer Vision-ECCV 2006"},{"key":"ref18","first-page":"1097","article-title":"Imagenet classification with deep convolutional neural networks","author":"krizhevsky","year":"2012","journal-title":"Advances in neural information processing systems"},{"key":"ref19","doi-asserted-by":"crossref","first-page":"818","DOI":"10.1007\/978-3-319-10590-1_53","article-title":"Visualizing and understanding convolutional networks","author":"zeiler","year":"2014","journal-title":"Computer Vision-ECCV 2014"},{"key":"ref28","first-page":"25","article-title":"High accuracy optical flow estimation based on a theory for warping","volume":"3024","author":"brox","year":"2004","journal-title":"Proceedings of ECCV"},{"key":"ref4","doi-asserted-by":"crossref","first-page":"143","DOI":"10.1007\/978-3-642-15561-1_11","article-title":"Improving the fisher kernel for large-scale image classification","author":"perronnin","year":"2010","journal-title":"Computer Vision-ECCV 2010"},{"key":"ref27","article-title":"Ucfl01: A dataset of 101 human actions classes from videos in the wild","author":"soomro","year":"2012","journal-title":"arXiv preprint arXiv 1212 0402"},{"key":"ref3","doi-asserted-by":"publisher","DOI":"10.1109\/ICCV.2013.441"},{"key":"ref6","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR.2008.4587731"},{"key":"ref29","article-title":"Towards good practices for very deep two-stream convnets","author":"wang","year":"2015","journal-title":"arXiv preprint arXiv 1507 02159"},{"key":"ref5","article-title":"Bag of visual words and fusion methods for action recognition: Comprehensive study and good practice","author":"peng","year":"2014","journal-title":"arXiv preprint arXiv 1405 4506"},{"key":"ref8","first-page":"568","article-title":"Two-stream convolutional networks for action recognition in videos","author":"simonyan","year":"2014","journal-title":"Advances in neural information processing systems"},{"key":"ref7","doi-asserted-by":"publisher","DOI":"10.1109\/TPAMI.2011.157"},{"key":"ref2","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR.2011.5995407"},{"key":"ref9","article-title":"Long-term recurrent convolutional networks for visual recognition and description","author":"donahue","year":"2014","journal-title":"arXiv preprint arXiv 1411 4389"},{"key":"ref1","doi-asserted-by":"crossref","first-page":"1","DOI":"10.1109\/CVPR.2008.4587756","article-title":"Learning realistic human actions from movies","author":"laptev","year":"2008","journal-title":"Computer Vision and Pattern Recognition 2008 CVPR 2008 IEEE Conference"},{"key":"ref20","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR.2014.330"},{"key":"ref22","doi-asserted-by":"publisher","DOI":"10.1007\/s00530-010-0182-0"},{"key":"ref21","first-page":"1341","article-title":"Submodular attribute selection for action recognition in video","author":"zheng","year":"2014","journal-title":"Advances in neural information processing systems"},{"key":"ref24","article-title":"Very deep convolutional networks for large-scale image recognition","author":"simonyan","year":"2014","journal-title":"CoRR vol abs\/1409 1556"},{"key":"ref23","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR.2013.109"},{"key":"ref26","doi-asserted-by":"publisher","DOI":"10.1145\/2647868.2654931"},{"key":"ref25","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR.2009.5206848"}],"event":{"name":"2016 International Joint Conference on Neural Networks (IJCNN)","start":{"date-parts":[[2016,7,24]]},"location":"Vancouver, BC, Canada","end":{"date-parts":[[2016,7,29]]}},"container-title":["2016 International Joint Conference on Neural Networks (IJCNN)"],"original-title":[],"link":[{"URL":"http:\/\/xplorestaging.ieee.org\/ielx7\/7593175\/7726591\/07727435.pdf?arnumber=7727435","content-type":"unspecified","content-version":"vor","intended-application":"similarity-checking"}],"deposited":{"date-parts":[[2019,9,15]],"date-time":"2019-09-15T11:20:11Z","timestamp":1568546411000},"score":1,"resource":{"primary":{"URL":"http:\/\/ieeexplore.ieee.org\/document\/7727435\/"}},"subtitle":[],"short-title":[],"issued":{"date-parts":[[2016,7]]},"references-count":31,"URL":"https:\/\/doi.org\/10.1109\/ijcnn.2016.7727435","relation":{},"subject":[],"published":{"date-parts":[[2016,7]]}}}