{"status":"ok","message-type":"work","message-version":"1.0.0","message":{"indexed":{"date-parts":[[2022,3,31]],"date-time":"2022-03-31T15:44:55Z","timestamp":1648741495280},"reference-count":45,"publisher":"Springer Science and Business Media LLC","issue":"5","license":[{"start":{"date-parts":[[2015,9,17]],"date-time":"2015-09-17T00:00:00Z","timestamp":1442448000000},"content-version":"tdm","delay-in-days":0,"URL":"http:\/\/www.springer.com\/tdm"}],"content-domain":{"domain":["link.springer.com"],"crossmark-restriction":false},"short-container-title":["Multimed Tools Appl"],"published-print":{"date-parts":[[2016,3]]},"DOI":"10.1007\/s11042-015-2876-y","type":"journal-article","created":{"date-parts":[[2015,9,17]],"date-time":"2015-09-17T08:56:43Z","timestamp":1442480203000},"page":"2453-2472","update-policy":"http:\/\/dx.doi.org\/10.1007\/springer_crossmark_policy","source":"Crossref","is-referenced-by-count":1,"title":["A bag-of-regions representation for video classification"],"prefix":"10.1007","volume":"75","author":[{"given":"Min-Kook","family":"Choi","sequence":"first","affiliation":[]},{"given":"Ziyu","family":"Wang","sequence":"additional","affiliation":[]},{"given":"Hyun-Gyu","family":"Lee","sequence":"additional","affiliation":[]},{"given":"Sang-Chul","family":"Lee","sequence":"additional","affiliation":[]}],"member":"297","published-online":{"date-parts":[[2015,9,17]]},"reference":[{"key":"2876_CR1","doi-asserted-by":"crossref","unstructured":"Abd-Almageed W (2008) Online, simultaneous shot boundary detection and key frame extraction for sports videos using rank tracing. In: Proceedings of International Conference on Image Processing","DOI":"10.1109\/ICIP.2008.4712476"},{"key":"2876_CR2","doi-asserted-by":"crossref","unstructured":"Bandla S, Grauman K (2013) Active learning of an action detector from untrimmed videos. In: Proceedings of International Conference on Computer Vision","DOI":"10.1109\/ICCV.2013.230"},{"key":"2876_CR3","doi-asserted-by":"crossref","unstructured":"Banerjee P, Sengupta S (2008) Model generation for robust object tracking based on temporally stable regions. In: IEEE Workshop on Motion and Video Computing","DOI":"10.1109\/WMVC.2008.4544045"},{"issue":"3","key":"2876_CR4","doi-asserted-by":"crossref","first-page":"346","DOI":"10.1016\/j.cviu.2007.09.014","volume":"110","author":"H Bay","year":"2008","unstructured":"Bay H, Ess A, Tuytelaars T, Gool LV (2008) Surf: Speeded up robust features. Comp Vision Image Underst 110(3):346\u2013359","journal-title":"Comp Vision Image Underst"},{"key":"2876_CR5","doi-asserted-by":"crossref","unstructured":"Black M, Gorelick L, Shechtman E, Irani M, Basri R (2005) Actions as space-time shape. In: Proceedings of International Conference on Computer Vision","DOI":"10.1109\/ICCV.2005.28"},{"key":"2876_CR6","doi-asserted-by":"crossref","unstructured":"Blilen H, Gool LV (2011) Action recognition: A region based approach. In: IEEE Workshop on Applications of Computer Vision","DOI":"10.1109\/WACV.2011.5711517"},{"key":"2876_CR7","doi-asserted-by":"crossref","unstructured":"Bojanowski P, Bach F, Laptev I, Ponce J, Schmid C, Sivic J (2013) Finding actors and actions in movies. In: Proceedings of Computer Vision and Pattern Recognition","DOI":"10.1109\/ICCV.2013.283"},{"key":"2876_CR8","doi-asserted-by":"crossref","unstructured":"Brendal W, Todorovic S (2009) Video object segmentation by tracking regions. In: Proceedings of International Conference on Computer Vision","DOI":"10.1109\/ICCV.2009.5459242"},{"key":"2876_CR9","doi-asserted-by":"crossref","first-page":"396","DOI":"10.1016\/j.cviu.2011.09.010","volume":"116","author":"B Chakraborty","year":"2012","unstructured":"Chakraborty B, Holtre MB, Moesl TB, Gonzalez J (2012) Selective space-time interest points. Comput Vis Image Underst 116:396\u2013410","journal-title":"Comput Vis Image Underst"},{"issue":"27","key":"2876_CR10","first-page":"1","volume":"2","author":"CC Chang","year":"2011","unstructured":"Chang CC, Lin CJ (2011) Libsvm: A library for support vector machine. ACM Transactions on IST 2(27):1\u201327. Software available at http:\/\/www.scie.ntu.edu.tw\/cjlin\/libsvm","journal-title":"ACM Transactions on IST"},{"key":"2876_CR11","doi-asserted-by":"crossref","first-page":"660","DOI":"10.1016\/j.cviu.2013.02.003","volume":"117","author":"J Choi","year":"2013","unstructured":"Choi J, Wang Z, Lee SC, Jeon WJ (2013) A spatio-temporal pyramid matching for video retrieval. Comp Vision Image Underst 117:660\u2013669","journal-title":"Comp Vision Image Underst"},{"key":"2876_CR12","doi-asserted-by":"crossref","unstructured":"Dalal N, Triggs B (2005) Histograms of oriented gradients for human detection. In: Proceedings of Computer Vision and Pattern Recognition","DOI":"10.1109\/CVPR.2005.177"},{"key":"2876_CR13","doi-asserted-by":"crossref","unstructured":"Dalal N, Triggs B, Schmid C (2006) Human detection using oriented histograms of flow and appearance. In: Proceedings of Computer Vision and Pattern Recognition","DOI":"10.1007\/11744047_33"},{"key":"2876_CR14","unstructured":"Demir G, Selim A (2007) Scene classification using bag-of-regions representations. In: Proceedings of Computer Vision and Pattern Recognition"},{"issue":"8","key":"2876_CR15","doi-asserted-by":"crossref","first-page":"800","DOI":"10.1109\/34.946985","volume":"23","author":"Y Deng","year":"2011","unstructured":"Deng Y, Manjunath BS (2011) Unsupervised segmentation of color-texture regions in images and video. IEEE Transactions on Pattern Analysis and Machine Intelligence 23(8):800\u2013810","journal-title":"IEEE Transactions on Pattern Analysis and Machine Intelligence"},{"key":"2876_CR16","unstructured":"Gonzalez RC, Woods RE Digital image processing. Pearson Prentice Hall"},{"key":"2876_CR17","doi-asserted-by":"crossref","unstructured":"Jhuang H, Gall J, Zuffi S, Schmid C, Black MJ (2013) Towards understanding action recognition. In: Proceedings of International Conference on Computer Vision","DOI":"10.1109\/ICCV.2013.396"},{"issue":"1","key":"2876_CR18","doi-asserted-by":"crossref","first-page":"172","DOI":"10.1109\/TPAMI.2010.68","volume":"33","author":"IN Junejo","year":"2010","unstructured":"Junejo IN, Dexter E, Laptev I, Perez P (2010) View-independent action recognition from temporal self-similarities. IEEE Transactions on Pattern Analysis and Machine Intelligence 33(1):172\u2013185","journal-title":"IEEE Transactions on Pattern Analysis and Machine Intelligence"},{"key":"2876_CR19","unstructured":"Ke Y, Sukthankar R (2004) Pca-sift: A more distinctive representation for local image descriptors. In: Proceedings of Computer Vision and Pattern Recognition"},{"key":"2876_CR20","doi-asserted-by":"crossref","unstructured":"Kovashka A, Grauman K (2010) Learning a hierarchy of discriminative space-time neighborhood features for human action recognition. In: Proceedings of Computer Vision and Pattern Recognition, pp 2046\u20132053","DOI":"10.1109\/CVPR.2010.5539881"},{"key":"2876_CR21","doi-asserted-by":"crossref","unstructured":"Kuehne H, Jhuang H, Garrote E, Poggio T, Serre T (2011) Hmdb: A large video database for human motion recognition. In: Proceedings of International Conference on Computer Vision","DOI":"10.1109\/ICCV.2011.6126543"},{"key":"2876_CR22","first-page":"207","volume":"108","author":"I Laptev","year":"2005","unstructured":"Laptev I (2005) On space-time interest points. Int J Comput Vis 108:207\u2013229","journal-title":"Int J Comput Vis"},{"key":"2876_CR23","unstructured":"Lazebnik S, Schmid C, Ponce J (2006) Finding actors and actions in movies. In: Proceedings of Computer Vision and Pattern Recognition"},{"key":"2876_CR24","doi-asserted-by":"crossref","unstructured":"Leutenegger S, Chli M, Siegwart RY (2011) Brisk: Binary robust invariant scalable keypoints. In: Proceedings of International Conference on Computer Vision","DOI":"10.1109\/ICCV.2011.6126542"},{"key":"2876_CR25","doi-asserted-by":"crossref","unstructured":"Li LJ, Fei LF (2007) What, where and who? classifying events by scene and object recognition. In: Proceedings of International Conference on Computer Vision","DOI":"10.1109\/ICCV.2007.4408872"},{"key":"2876_CR26","doi-asserted-by":"crossref","unstructured":"Liu J, Luo J, Shah M (2009) Recognizing realistic actions from videos \u201cin the wild\u201d. In: Proceedings of Computer Vision and Pattern Recognition","DOI":"10.1109\/CVPR.2009.5206744"},{"key":"2876_CR27","unstructured":"Lowe DG (2005) Object recognition from local scale-invariant features. In: Proceedings of International Conference on Computer Vision"},{"key":"2876_CR28","unstructured":"Makadia A (2010) Feature tracking for wide-baseline image. In: Proceedings of European Conference on Computer Vision, pp 310\u2013323"},{"key":"2876_CR29","doi-asserted-by":"crossref","unstructured":"Marszalek M, Latev I, Schmid C (2009) Action in context. In: Proceedings of Computer Vision and Pattern Recognition","DOI":"10.1109\/CVPR.2009.5206557"},{"issue":"5","key":"2876_CR30","doi-asserted-by":"crossref","first-page":"1267","DOI":"10.1109\/25.950328","volume":"50","author":"O Masoud","year":"2001","unstructured":"Masoud O, Papanikolopoulos NP (2001) A novel method for tracking and counting pedestrians in real-time using a single camera. Veh Technol 50(5):1267\u20131278","journal-title":"Veh Technol"},{"key":"2876_CR31","doi-asserted-by":"crossref","unstructured":"McCandless T, Grauman K (2013) Object-centric spatio-temporal pyramids for egocentric activity recognition. In: Proceedings of British Machine Vision Conference","DOI":"10.5244\/C.27.30"},{"key":"2876_CR32","doi-asserted-by":"crossref","unstructured":"Niebles J, Chen C, Fei LF (2010) Modeling temporal structure of decomposable motion segments for activity classification. In: Proceedings of European Conference on Computer Vision","DOI":"10.1007\/978-3-642-15552-9_29"},{"key":"2876_CR33","doi-asserted-by":"crossref","unstructured":"Pirsiavash H, Ramanan D (2012) Detecting activities of daily living in first-person camera view. In: Proceedings of Computer Vision and Pattern Recognition","DOI":"10.1109\/CVPR.2012.6248010"},{"key":"2876_CR34","doi-asserted-by":"crossref","unstructured":"Raptis M, Sigal K (2013) Poselet key-framing: A model for human activity recognition. In: Proceedings of Computer Vision and Pattern Recognition","DOI":"10.1109\/CVPR.2013.342"},{"key":"2876_CR35","doi-asserted-by":"crossref","unstructured":"Schuldt C, Laptev I, Caputo B (2004) Recognizing human action: A local svm approach. In: Proceedings of International Conference on Pattern Recognition","DOI":"10.1109\/ICPR.2004.1334462"},{"issue":"2","key":"2876_CR36","doi-asserted-by":"crossref","first-page":"189","DOI":"10.1007\/s11263-005-4264-y","volume":"67","author":"J Sivic","year":"2006","unstructured":"Sivic J, Schaffalitzky F (2006) Object level grouping for video shots. Int J Comput Vis 67(2):189\u2013210","journal-title":"Int J Comput Vis"},{"key":"2876_CR37","doi-asserted-by":"crossref","unstructured":"Sivic J, Zisserman A (2003) Video google: A text retrieval approach to object matching in videos. In: Proceedings of International Conference on Computer Vision","DOI":"10.1109\/ICCV.2003.1238663"},{"key":"2876_CR38","doi-asserted-by":"crossref","unstructured":"Turcot P, Lowe DG (2009) Better matching with fewer features: The selection of useful features in large database recognition problems. In: International Conference of Computer Vision Workshops, pp 2109\u20132116","DOI":"10.1109\/ICCVW.2009.5457541"},{"key":"2876_CR39","doi-asserted-by":"crossref","unstructured":"Ullah MM, Laptev I (2012) Actlets: A novel local representation for human action recognition in video. In: Proceedings of International Conference on Image Processing, pp 777\u2013780","DOI":"10.1109\/ICIP.2012.6466975"},{"issue":"10","key":"2876_CR40","doi-asserted-by":"crossref","first-page":"818","DOI":"10.3844\/jcssp.2007.818.822","volume":"3","author":"A Umamakeswari","year":"2007","unstructured":"Umamakeswari A, Rajaraman A (2007) Object based video analysis, interpretation and tracking. J Comput Sci 3(10):818\u2013822","journal-title":"J Comput Sci"},{"key":"2876_CR41","volume-title":"Statistical learning theory","author":"V Vapnik","year":"1998","unstructured":"Vapnik V (1998) Statistical learning theory. Wiley, Hoboken"},{"key":"2876_CR42","doi-asserted-by":"crossref","unstructured":"Wang H, Ullah MM, Klaser A, Laptev I, Schmid C (2009) Evaluation of local spatio-temporal features for action recognition. In: Proceedings of British Machine Vision Conference","DOI":"10.5244\/C.23.124"},{"key":"2876_CR43","doi-asserted-by":"crossref","unstructured":"Weinland D, Boyer E, Ronfard R (2007) Action recognition from arbitrary views using 3d exemplars. In: Proceedings of International Conference on Computer Vision","DOI":"10.1109\/ICCV.2007.4408849"},{"key":"2876_CR44","doi-asserted-by":"crossref","unstructured":"Yao B, Jiang X, Khosla A, Lin AL, Guibas L, Fei LF (2011) Human action recognition by learning bases of action attributes and parts. In: Proceedings of International Conference on Computer Vision","DOI":"10.1109\/ICCV.2011.6126386"},{"key":"2876_CR45","doi-asserted-by":"crossref","first-page":"196","DOI":"10.1016\/j.cviu.2003.08.001","volume":"92","author":"L Ying","year":"2003","unstructured":"Ying L, Der WT, Neng HJ (2003) Object-based analysis and interpretation of human motion in sports video sequences by dynamic bayesian networks. Comp Vision Image Underst 92:196\u2013216","journal-title":"Comp Vision Image Underst"}],"container-title":["Multimedia Tools and Applications"],"original-title":[],"language":"en","link":[{"URL":"http:\/\/link.springer.com\/content\/pdf\/10.1007\/s11042-015-2876-y.pdf","content-type":"application\/pdf","content-version":"vor","intended-application":"text-mining"},{"URL":"http:\/\/link.springer.com\/article\/10.1007\/s11042-015-2876-y\/fulltext.html","content-type":"text\/html","content-version":"vor","intended-application":"text-mining"},{"URL":"http:\/\/link.springer.com\/content\/pdf\/10.1007\/s11042-015-2876-y","content-type":"unspecified","content-version":"vor","intended-application":"similarity-checking"}],"deposited":{"date-parts":[[2019,8,30]],"date-time":"2019-08-30T17:31:37Z","timestamp":1567186297000},"score":1,"resource":{"primary":{"URL":"http:\/\/link.springer.com\/10.1007\/s11042-015-2876-y"}},"subtitle":[],"short-title":[],"issued":{"date-parts":[[2015,9,17]]},"references-count":45,"journal-issue":{"issue":"5","published-print":{"date-parts":[[2016,3]]}},"alternative-id":["2876"],"URL":"https:\/\/doi.org\/10.1007\/s11042-015-2876-y","relation":{},"ISSN":["1380-7501","1573-7721"],"issn-type":[{"value":"1380-7501","type":"print"},{"value":"1573-7721","type":"electronic"}],"subject":[],"published":{"date-parts":[[2015,9,17]]}}}