{"status":"ok","message-type":"work","message-version":"1.0.0","message":{"indexed":{"date-parts":[[2026,4,7]],"date-time":"2026-04-07T16:34:19Z","timestamp":1775579659371,"version":"3.50.1"},"reference-count":23,"publisher":"Springer Science and Business Media LLC","issue":"5","license":[{"start":{"date-parts":[[2012,11,16]],"date-time":"2012-11-16T00:00:00Z","timestamp":1353024000000},"content-version":"tdm","delay-in-days":0,"URL":"http:\/\/www.springer.com\/tdm"}],"content-domain":{"domain":[],"crossmark-restriction":false},"short-container-title":["Machine Vision and Applications"],"published-print":{"date-parts":[[2013,7]]},"DOI":"10.1007\/s00138-012-0450-4","type":"journal-article","created":{"date-parts":[[2012,11,15]],"date-time":"2012-11-15T08:18:31Z","timestamp":1352967511000},"page":"971-981","source":"Crossref","is-referenced-by-count":498,"title":["Recognizing 50 human action categories of web videos"],"prefix":"10.1007","volume":"24","author":[{"given":"Kishore K.","family":"Reddy","sequence":"first","affiliation":[]},{"given":"Mubarak","family":"Shah","sequence":"additional","affiliation":[]}],"member":"297","published-online":{"date-parts":[[2012,11,16]]},"reference":[{"key":"450_CR1","doi-asserted-by":"crossref","unstructured":"Bobick, A.F., Davis, J.W.: The recognition of human movement using temporal templates. In: IEEE Transactions on Pattern Analysis and Machine Intelligence, vol. 23, 257\u2013267 (2001)","DOI":"10.1109\/34.910878"},{"key":"450_CR2","doi-asserted-by":"crossref","unstructured":"Choi, W., Shahid, K., Savarese, S.: Learning context for collective activity recognition. In: IEEE Conference on Computer Vision and Pattern Recognition, pp. 3273\u20133280 (2011)","DOI":"10.1109\/CVPR.2011.5995707"},{"key":"450_CR3","doi-asserted-by":"crossref","unstructured":"Deng, J., Berg, A.C., Li, K., Fei-Fei, L.: What does classifying more than 10,000 image categories tell us? In: Proceedings of the 11th European Conference on Computer Vision: Part V, pp. 71\u201384 (2010)","DOI":"10.1007\/978-3-642-15555-0_6"},{"key":"450_CR4","doi-asserted-by":"crossref","unstructured":"Dollar, P., Rabaud, V., Cottrell, G., Belongie, S.: Behavior recognition via sparse spatio-temporal features. In: 2nd Joint IEEE International Workshop on Visual Surveillance and Performance Evaluation of Tracking and Surveillance, pp. 65\u201372 (2005)","DOI":"10.1109\/VSPETS.2005.1570899"},{"key":"450_CR5","doi-asserted-by":"crossref","unstructured":"Han, D., Bo, L., Sminchisescu, C.: Selection and context for action recognition. In: IEEE 12th International Conference on Computer Vision, pp. 1933\u20131940 (2009)","DOI":"10.1109\/ICCV.2009.5459427"},{"key":"450_CR6","doi-asserted-by":"crossref","unstructured":"Hong, P., Huang, T.S., Turk, M.: Gesture modeling and recognition using finite state machines. In: Proceedings of the Fourth IEEE International Conference on Automatic Face and Gesture Recognition, pp. 410\u2013415 (2000)","DOI":"10.1109\/AFGR.2000.840667"},{"key":"450_CR7","doi-asserted-by":"crossref","unstructured":"Ikizler-Cinbis, N., Sclaroff, S.: Object, scene and actions: combining multiple features for human action recognition. In: Proceedings of the 11th European Conference on Computer Vision: Part I, pp. 494\u2013507 (2010)","DOI":"10.1007\/978-3-642-15549-9_36"},{"key":"450_CR8","doi-asserted-by":"crossref","unstructured":"Kuehne, H., Jhuang, H., Garrote, E., Poggio, T., Serre, T.: Hmdb: a large video database for human motion recognition. In: Proceedings of the International Conference on Computer Vision, pp. 2556\u20132563 (2011)","DOI":"10.1109\/ICCV.2011.6126543"},{"key":"450_CR9","doi-asserted-by":"crossref","unstructured":"Laptev, I., Marszalek, M., Schmid, C., Rozenfeld, B.: Learning realistic human actions from movies. In: IEEE Conference on Computer Vision and Pattern Recognition, pp. 1\u20138 (2008)","DOI":"10.1109\/CVPR.2008.4587756"},{"key":"450_CR10","doi-asserted-by":"crossref","unstructured":"Liu, J., Luo, J., Shah, M.: Recognizing realistic actions from videos \u201cin the wild\u201d. In: IEEE Conference on Computer Vision and Pattern Recognition, pp. 1996\u20132003 (2009)","DOI":"10.1109\/CVPR.2009.5206744"},{"key":"450_CR11","doi-asserted-by":"crossref","unstructured":"Liu, J., Shah, M.: Learning human actions via information maximization. In: IEEE Conference on Computer Vision and Pattern Recognition, pp. 1\u20138 (2008)","DOI":"10.1109\/CVPR.2008.4587723"},{"key":"450_CR12","unstructured":"Lucas, B.D., Kanade, T.: An iterative image registration technique with an application to stereo vision. In: Proceedings of the 7th International Joint Conference on Artificial Intelligence, vol. 2, pp. 674\u2013679 (1981)"},{"key":"450_CR13","doi-asserted-by":"crossref","unstructured":"Marszalek, M., Laptev, I., Schmid, C.: Actions in context. In: IEEE Conference on Computer Vision and Pattern Recognition, pp. 2929\u20132936 (2009)","DOI":"10.1109\/CVPRW.2009.5206557"},{"key":"450_CR14","doi-asserted-by":"crossref","unstructured":"van de Sande, K., Gevers, T., Snoek, C.: Evaluating color descriptors for object and scene recognition. In: IEEE Transactions on Pattern Analysis and Machine Intelligence, vol. 32, pp. 1582\u20131596 (2010)","DOI":"10.1109\/TPAMI.2009.154"},{"key":"450_CR15","doi-asserted-by":"crossref","unstructured":"Scovanner, P., Ali, S., Shah, M.: A 3-dimensional sift descriptor and its application to action recognition. In: Proceedings of the 15th International Conference on Multimedia, pp. 357\u2013360 (2007)","DOI":"10.1145\/1291233.1291311"},{"key":"450_CR16","doi-asserted-by":"crossref","unstructured":"Snoek, C.G.M., Worring, M., Smeulders, A.W.M.: Early versus late fusion in semantic video analysis. In: Proceedings of the 13th Annual ACM International Conference on Multimedia, pp. 399\u2013402 (2005)","DOI":"10.1145\/1101149.1101236"},{"key":"450_CR17","doi-asserted-by":"crossref","unstructured":"Song, Y., Zhao, M., Yagnik, J., Wu, X.: Taxonomic classification for web-based videos. In: IEEE Conference on Computer Vision and Pattern Recognition, pp. 871\u2013878 (2010)","DOI":"10.1109\/CVPR.2010.5540124"},{"key":"450_CR18","doi-asserted-by":"crossref","unstructured":"Wang., H., Klaser., A., Liu., C.L.: Action recognition by dense trajectories. In: IEEE Conference on Computer Vision and Pattern Recognition, pp. 3169\u20133176 (2011)","DOI":"10.1109\/CVPR.2011.5995407"},{"key":"450_CR19","doi-asserted-by":"crossref","unstructured":"Wang, Z., Zhao, M., Song, Y., Kumar, S., Li, B.: Youtubecat: learning to categorize wild web videos. In: IEEE Conference on Computer Vision and Pattern Recognition, pp. 879\u2013886 (2010)","DOI":"10.1109\/CVPR.2010.5540125"},{"key":"450_CR20","doi-asserted-by":"crossref","unstructured":"Weinland, D., Ronfard, R., Boyer, E.: A survey of vision-based methods for action representation, segmentation and recognition. In: Computer Vision and Image Understanding, vol. 115, pp. 224\u2013241 (2011)","DOI":"10.1016\/j.cviu.2010.10.002"},{"key":"450_CR21","doi-asserted-by":"crossref","unstructured":"Wilson, A., Bobick, A.: Parametric hidden markov models for gesture recognition. In: IEEE Transactions on Pattern Analysis and Machine Intelligence, vol. 21, pp. 884\u2013900 (1999)","DOI":"10.1109\/34.790429"},{"key":"450_CR22","doi-asserted-by":"crossref","unstructured":"Wong, S.F., Kim, T.K., Cipolla, R.: Learning motion categories using both semantic and structural information. In: IEEE Conference on Computer Vision and Pattern Recognition, pp. 1\u20136 (2007)","DOI":"10.1109\/CVPR.2007.383332"},{"key":"450_CR23","doi-asserted-by":"crossref","unstructured":"Zheng, Y.T., Neo, S.Y., Chua, T.S., Tian, Q.: Probabilistic optimized ranking for multimedia semantic concept detection via rvm. In: Proceedings of International Conference on Content-Based Image and Video Retrieval, pp. 161\u2013168 (2008)","DOI":"10.1145\/1386352.1386378"}],"container-title":["Machine Vision and Applications"],"original-title":[],"language":"en","link":[{"URL":"http:\/\/link.springer.com\/content\/pdf\/10.1007\/s00138-012-0450-4.pdf","content-type":"application\/pdf","content-version":"vor","intended-application":"text-mining"},{"URL":"http:\/\/link.springer.com\/article\/10.1007\/s00138-012-0450-4\/fulltext.html","content-type":"text\/html","content-version":"vor","intended-application":"text-mining"},{"URL":"http:\/\/link.springer.com\/content\/pdf\/10.1007\/s00138-012-0450-4","content-type":"unspecified","content-version":"vor","intended-application":"similarity-checking"}],"deposited":{"date-parts":[[2025,4,20]],"date-time":"2025-04-20T22:27:09Z","timestamp":1745188029000},"score":1,"resource":{"primary":{"URL":"http:\/\/link.springer.com\/10.1007\/s00138-012-0450-4"}},"subtitle":[],"short-title":[],"issued":{"date-parts":[[2012,11,16]]},"references-count":23,"journal-issue":{"issue":"5","published-print":{"date-parts":[[2013,7]]}},"alternative-id":["450"],"URL":"https:\/\/doi.org\/10.1007\/s00138-012-0450-4","relation":{},"ISSN":["0932-8092","1432-1769"],"issn-type":[{"value":"0932-8092","type":"print"},{"value":"1432-1769","type":"electronic"}],"subject":[],"published":{"date-parts":[[2012,11,16]]}}}