{"status":"ok","message-type":"work","message-version":"1.0.0","message":{"indexed":{"date-parts":[[2025,3,26]],"date-time":"2025-03-26T13:14:52Z","timestamp":1742994892708,"version":"3.40.3"},"publisher-location":"Cham","reference-count":13,"publisher":"Springer International Publishing","isbn-type":[{"type":"print","value":"9783319466743"},{"type":"electronic","value":"9783319466750"}],"license":[{"start":{"date-parts":[[2016,1,1]],"date-time":"2016-01-01T00:00:00Z","timestamp":1451606400000},"content-version":"unspecified","delay-in-days":0,"URL":"http:\/\/www.springer.com\/tdm"}],"content-domain":{"domain":[],"crossmark-restriction":false},"short-container-title":[],"published-print":{"date-parts":[[2016]]},"DOI":"10.1007\/978-3-319-46675-0_62","type":"book-chapter","created":{"date-parts":[[2016,9,28]],"date-time":"2016-09-28T09:55:47Z","timestamp":1475056547000},"page":"564-571","source":"Crossref","is-referenced-by-count":4,"title":["Encoding Multi-resolution Two-Stream CNNs for Action Recognition"],"prefix":"10.1007","author":[{"given":"Weichen","family":"Xue","sequence":"first","affiliation":[],"role":[{"role":"author","vocabulary":"crossref"}]},{"given":"Haohua","family":"Zhao","sequence":"additional","affiliation":[],"role":[{"role":"author","vocabulary":"crossref"}]},{"given":"Liqing","family":"Zhang","sequence":"additional","affiliation":[],"role":[{"role":"author","vocabulary":"crossref"}]}],"member":"297","published-online":{"date-parts":[[2016,9,29]]},"reference":[{"key":"62_CR1","doi-asserted-by":"crossref","unstructured":"Arandjelovic, R., Zisserman, A.: All about VLAD. In: CVPR. pp, 1578\u20131585. IEEE (2013)","DOI":"10.1109\/CVPR.2013.207"},{"key":"62_CR2","doi-asserted-by":"crossref","unstructured":"Jain, M., J\u00e9gou, H., Bouthemy, P.: Better exploiting motion for better action recognition. In: CVPR, pp. 2555\u20132562. IEEE (2013)","DOI":"10.1109\/CVPR.2013.330"},{"key":"62_CR3","doi-asserted-by":"crossref","unstructured":"Jain, M., van Gemert, J.C., Snoek, C.G.: What do 15,000 object categories tell us about classifying and localizing actions? In: CVPR, pp. 46\u201355 (2015)","DOI":"10.1109\/CVPR.2015.7298599"},{"key":"62_CR4","series-title":"Lecture Notes in Computer Science","doi-asserted-by":"crossref","first-page":"425","DOI":"10.1007\/978-3-642-33715-4_31","volume-title":"Computer Vision \u2013 ECCV 2012","author":"Y-G Jiang","year":"2012","unstructured":"Jiang, Y.-G., Dai, Q., Xue, X., Liu, W., Ngo, C.-W.: Trajectory-based modeling of human actions with motion reference points. In: Fitzgibbon, A., Lazebnik, S., Perona, P., Sato, Y., Schmid, C. (eds.) ECCV 2012, Part V. LNCS, vol. 7576, pp. 425\u2013438. Springer, Heidelberg (2012)"},{"key":"62_CR5","doi-asserted-by":"crossref","unstructured":"Karpathy, A., Toderici, G., Shetty, S., Leung, T., Sukthankar, R., Fei-Fei, L.: Large-scale video classification with convolutional neural networks. In: CVPR, pp. 1725\u20131732. IEEE (2014)","DOI":"10.1109\/CVPR.2014.223"},{"key":"62_CR6","doi-asserted-by":"crossref","unstructured":"Marszalek, M., Laptev, I., Schmid, C.: Actions in context. In: CVPR, pp. 2929\u20132936. IEEE (2009)","DOI":"10.1109\/CVPR.2009.5206557"},{"key":"62_CR7","series-title":"Lecture Notes in Computer Science","doi-asserted-by":"crossref","first-page":"392","DOI":"10.1007\/978-3-642-15552-9_29","volume-title":"Computer Vision \u2013 ECCV 2010","author":"JC Niebles","year":"2010","unstructured":"Niebles, J.C., Chen, C.-W., Fei-Fei, L.: Modeling temporal structure of decomposable motion segments for activity classification. In: Daniilidis, K., Maragos, P., Paragios, N. (eds.) ECCV 2010, Part II. LNCS, vol. 6312, pp. 392\u2013405. Springer, Heidelberg (2010)"},{"key":"62_CR8","unstructured":"Peng, X., Wang, L., Wang, X., Qiao, Y.: Bag of visual words and fusion methods for action recognition: comprehensive study and good practice. arXiv preprint (2014). arXiv:1405.4506"},{"issue":"3","key":"62_CR9","doi-asserted-by":"crossref","first-page":"222","DOI":"10.1007\/s11263-013-0636-x","volume":"105","author":"J S\u00e1nchez","year":"2013","unstructured":"S\u00e1nchez, J., Perronnin, F., Mensink, T., Verbeek, J.: Image classification with the fisher vector: theory and practice. IJCV 105(3), 222\u2013245 (2013)","journal-title":"IJCV"},{"key":"62_CR10","unstructured":"Simonyan, K., Zisserman, A.: Two-stream convolutional networks for action recognition in videos. In: NIPS, pp. 568\u2013576 (2014)"},{"key":"62_CR11","unstructured":"Soomro, K., Zamir, A.R., Shah, M.: Ucf101: a dataset of 101 human actions classes from videos in the wild. arXiv preprint (2012). arXiv:1212.0402"},{"key":"62_CR12","doi-asserted-by":"crossref","unstructured":"Wang, H., Schmid, C.: Action recognition with improved trajectories. In: ICCV, pp. 3551\u20133558. IEEE (2013)","DOI":"10.1109\/ICCV.2013.441"},{"key":"62_CR13","doi-asserted-by":"crossref","unstructured":"Xu, Z., Yang, Y., Hauptmann, A.G.: A discriminative CNN video representation for event detection. In: CVPR, pp. 1798\u20131807 (2015)","DOI":"10.1109\/CVPR.2015.7298789"}],"container-title":["Lecture Notes in Computer Science","Neural Information Processing"],"original-title":[],"link":[{"URL":"http:\/\/link.springer.com\/content\/pdf\/10.1007\/978-3-319-46675-0_62","content-type":"unspecified","content-version":"vor","intended-application":"similarity-checking"}],"deposited":{"date-parts":[[2019,9,13]],"date-time":"2019-09-13T22:39:35Z","timestamp":1568414375000},"score":1,"resource":{"primary":{"URL":"http:\/\/link.springer.com\/10.1007\/978-3-319-46675-0_62"}},"subtitle":[],"short-title":[],"issued":{"date-parts":[[2016]]},"ISBN":["9783319466743","9783319466750"],"references-count":13,"URL":"https:\/\/doi.org\/10.1007\/978-3-319-46675-0_62","relation":{},"ISSN":["0302-9743","1611-3349"],"issn-type":[{"type":"print","value":"0302-9743"},{"type":"electronic","value":"1611-3349"}],"subject":[],"published":{"date-parts":[[2016]]}}}