{"status":"ok","message-type":"work","message-version":"1.0.0","message":{"indexed":{"date-parts":[[2026,5,16]],"date-time":"2026-05-16T00:34:22Z","timestamp":1778891662021,"version":"3.51.4"},"reference-count":21,"publisher":"IEEE","content-domain":{"domain":[],"crossmark-restriction":false},"short-container-title":[],"published-print":{"date-parts":[[2016,9]]},"DOI":"10.1109\/icip.2016.7532925","type":"proceedings-article","created":{"date-parts":[[2016,8,17]],"date-time":"2016-08-17T17:22:06Z","timestamp":1471454526000},"page":"3076-3080","source":"Crossref","is-referenced-by-count":5,"title":["Saliency-context two-stream convnets for action recognition"],"prefix":"10.1109","author":[{"given":"Quan-Qi","family":"Chen","sequence":"first","affiliation":[],"role":[{"role":"author","vocabulary":"crossref"}]},{"given":"Feng","family":"Liu","sequence":"additional","affiliation":[],"role":[{"role":"author","vocabulary":"crossref"}]},{"given":"Xue","family":"Li","sequence":"additional","affiliation":[],"role":[{"role":"author","vocabulary":"crossref"}]},{"given":"Bao-Di","family":"Liu","sequence":"additional","affiliation":[],"role":[{"role":"author","vocabulary":"crossref"}]},{"given":"Yu-Jin","family":"Zhang","sequence":"additional","affiliation":[],"role":[{"role":"author","vocabulary":"crossref"}]}],"member":"263","reference":[{"key":"ref10","doi-asserted-by":"crossref","first-page":"363","DOI":"10.1007\/3-540-45103-X_50","article-title":"Two-frame motion estimation based on polynomial expansion","author":"farneback","year":"2003","journal-title":"Image Analysis"},{"key":"ref11","article-title":"Beyond short snippets: Deep networks for video classification","author":"ng","year":"2015","journal-title":"arXiv preprint arXiv 1503"},{"key":"ref12","doi-asserted-by":"publisher","DOI":"10.1016\/0166-2236(92)90344-8"},{"key":"ref13","article-title":"Very deep convolutional networks for large-scale image recognition","author":"simonyan","year":"2014","journal-title":"arXiv preprint arXiv 1409 1556"},{"key":"ref14","article-title":"Going deeper with convolutions","author":"szegedy","year":"2014","journal-title":"arXiv preprint arXiv 1409 4842"},{"key":"ref15","article-title":"Ucf101: A dataset of 101 human actions classes from videos in the wild","author":"soomro","year":"2012","journal-title":"arXiv preprint arXiv 1212 0402"},{"key":"ref16","first-page":"404","article-title":"Surf: Speeded up robust features","author":"bay","year":"2006","journal-title":"Proc European Conference on Computer Vision"},{"key":"ref17","doi-asserted-by":"publisher","DOI":"10.1145\/358669.358692"},{"key":"ref18","doi-asserted-by":"publisher","DOI":"10.1561\/0600000009"},{"key":"ref19","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR.2014.360"},{"key":"ref4","first-page":"4305","article-title":"Action recognition with trajectory-pooled deep-convolutional descriptors","author":"wang","year":"2015","journal-title":"Proc IEEE Conference on Computer Vision and Pattern Recognition"},{"key":"ref3","first-page":"568","article-title":"Two-stream convolutional networks for action recognition in videos","author":"simonyan","year":"2014","journal-title":"Advances in neural information processing systems"},{"key":"ref6","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR.2011.5995407"},{"key":"ref5","article-title":"Towards Good Practices for Very Deep Two-Stream ConvNets","author":"wang","year":"2015","journal-title":"ArXiv e-prints"},{"key":"ref8","doi-asserted-by":"publisher","DOI":"10.1109\/ICIP.2015.7351168"},{"key":"ref7","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR.2013.330"},{"key":"ref2","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR.2014.223"},{"key":"ref1","doi-asserted-by":"publisher","DOI":"10.1109\/ICCV.2013.441"},{"key":"ref9","doi-asserted-by":"publisher","DOI":"10.1007\/s11263-013-0636-x"},{"key":"ref20","doi-asserted-by":"publisher","DOI":"10.1145\/2647868.2654889"},{"key":"ref21","article-title":"Bag of visual words and fusion methods for action recognition: Comprehensive study and good practice","author":"peng","year":"2014","journal-title":"arXiv preprint arXiv 1405 4506"}],"event":{"name":"2016 IEEE International Conference on Image Processing (ICIP)","location":"Phoenix, AZ, USA","start":{"date-parts":[[2016,9,25]]},"end":{"date-parts":[[2016,9,28]]}},"container-title":["2016 IEEE International Conference on Image Processing (ICIP)"],"original-title":[],"link":[{"URL":"http:\/\/xplorestaging.ieee.org\/ielx7\/7527113\/7532277\/07532925.pdf?arnumber=7532925","content-type":"unspecified","content-version":"vor","intended-application":"similarity-checking"}],"deposited":{"date-parts":[[2017,6,24]],"date-time":"2017-06-24T16:54:05Z","timestamp":1498323245000},"score":1,"resource":{"primary":{"URL":"http:\/\/ieeexplore.ieee.org\/document\/7532925\/"}},"subtitle":[],"short-title":[],"issued":{"date-parts":[[2016,9]]},"references-count":21,"URL":"https:\/\/doi.org\/10.1109\/icip.2016.7532925","relation":{},"subject":[],"published":{"date-parts":[[2016,9]]}}}