{"status":"ok","message-type":"work","message-version":"1.0.0","message":{"indexed":{"date-parts":[[2025,4,9]],"date-time":"2025-04-09T12:33:44Z","timestamp":1744202024765},"reference-count":38,"publisher":"Springer Science and Business Media LLC","issue":"1","license":[{"start":{"date-parts":[[2014,9,28]],"date-time":"2014-09-28T00:00:00Z","timestamp":1411862400000},"content-version":"tdm","delay-in-days":0,"URL":"http:\/\/www.springer.com\/tdm"}],"content-domain":{"domain":["link.springer.com"],"crossmark-restriction":false},"short-container-title":["Int J Multimed Info Retr"],"published-print":{"date-parts":[[2015,3]]},"DOI":"10.1007\/s13735-014-0068-6","type":"journal-article","created":{"date-parts":[[2014,9,29]],"date-time":"2014-09-29T15:46:48Z","timestamp":1412005608000},"page":"17-32","update-policy":"http:\/\/dx.doi.org\/10.1007\/springer_crossmark_policy","source":"Crossref","is-referenced-by-count":2,"title":["Weakly supervised detection of video events using hidden conditional random fields"],"prefix":"10.1007","volume":"4","author":[{"given":"Kimiaki","family":"Shirahama","sequence":"first","affiliation":[]},{"given":"Marcin","family":"Grzegorzek","sequence":"additional","affiliation":[]},{"given":"Kuniaki","family":"Uehara","sequence":"additional","affiliation":[]}],"member":"297","published-online":{"date-parts":[[2014,9,28]]},"reference":[{"key":"68_CR1","unstructured":"Aly R et al (2012) AXES at TRECVid 2012: KIS, INS, and MED. In: Proceedings of TRECVID 2012. http:\/\/www-nlpir.nist.gov\/projects\/tvpubs\/tv12.papers\/axes.pdf"},{"key":"68_CR2","doi-asserted-by":"crossref","unstructured":"Ando R, Shinoda K, Furui S, Mochizuki T (2006) Robust scene recognition using language models for scene contexts. In: Proceedings of MIR 2006, pp 99\u2013106","DOI":"10.1145\/1178677.1178693"},{"key":"68_CR3","unstructured":"Arijon, D (1976) Grammar of the film language. Silman-James Press, Los Angeles"},{"key":"68_CR4","doi-asserted-by":"crossref","unstructured":"Ayache S, Qu\u00e9not G (2008) Video corpus annotation using active learning. In: Proceedings of ECIR 2008, pp 187\u2013198","DOI":"10.1007\/978-3-540-78646-7_19"},{"key":"68_CR5","doi-asserted-by":"crossref","unstructured":"Barnard M, Odobez J (2005) Sports event recognition using layered HMMs. In: Proceedings of ICME 2005, pp 1150\u20131153","DOI":"10.1109\/ICME.2005.1521630"},{"issue":"2","key":"68_CR6","first-page":"123","volume":"24","author":"L Breiman","year":"1996","unstructured":"Breiman L (1996) Bagging predictors. Mach Learn 24(2):123\u2013140","journal-title":"Mach Learn"},{"key":"68_CR7","unstructured":"Cheng H et al. (2012) SRI-Sarnoff AURORA system at TRECVID 2012: Multimedia event detection and recounting. In: Proceedings of TRECVID 2012. http:\/\/www-nlpir.nist.gov\/projects\/tvpubs\/tv12.papers\/aurora.pdf"},{"issue":"4","key":"68_CR8","doi-asserted-by":"crossref","first-page":"67","DOI":"10.1109\/38.126883","volume":"11","author":"G Davenport","year":"1991","unstructured":"Davenport G, Smith TA, Pincever N (1991) Cinematic primitives for multimedia. IEEE Comput Graph Appl 11(4):67\u201374","journal-title":"IEEE Comput Graph Appl"},{"key":"68_CR9","unstructured":"Fujisawa M (2012) Bayon\u2014a simple and fast clustering tool. http:\/\/code.google.com\/p\/bayon\/"},{"issue":"5","key":"68_CR10","doi-asserted-by":"crossref","first-page":"40","DOI":"10.1109\/2.384117","volume":"28","author":"DJ Gemmell","year":"1995","unstructured":"Gemmell DJ, Vin HM, Kandlur DD, Rangan PV, Rowe LA (1995) Multimedia storage servers: a tutorial. IEEE Comput 28(5):40\u201349","journal-title":"IEEE Comput"},{"key":"68_CR11","doi-asserted-by":"crossref","unstructured":"Gunawardana A, Mahajan M, Acero A, Platt JC (2005) Hidden conditional random fields for phone classification. In: Proceedings of INTERSPEECH 2005, pp 1117\u20131120","DOI":"10.21437\/Interspeech.2005-126"},{"issue":"9","key":"68_CR12","doi-asserted-by":"crossref","first-page":"1263","DOI":"10.1109\/TKDE.2008.239","volume":"21","author":"H He","year":"2009","unstructured":"He H, Garcia EA (2009) Learning from imbalanced data. IEEE Trans Knowl Data Eng 21(9):1263\u20131284","journal-title":"IEEE Trans Knowl Data Eng"},{"key":"68_CR13","unstructured":"Inoue N, Wada T, Kamishima Y, Shinoda K, Sato S (2011) TokyoTech+Canon at TRECVID 2011. In: Proceedings of TRECVID 2011. http:\/\/www-nlpir.nist.gov\/projects\/tvpubs\/tv11.papers\/tokyotechcanon.pdf"},{"issue":"2","key":"68_CR14","doi-asserted-by":"crossref","first-page":"73","DOI":"10.1007\/s13735-012-0024-2","volume":"2","author":"YG Jiang","year":"2013","unstructured":"Jiang YG, Bhattacharya S, Chang SF, Shah M (2013) High-level event recognition in unconstrained videos. Int J Multimed Inf Retr 2(2):73\u2013101","journal-title":"Int J Multimed Inf Retr"},{"key":"68_CR15","unstructured":"Lafferty JD, McCallum A, Pereira FCN (2001) Conditional random fields: probabilistic models for segmenting and labeling sequence data. In: Proceedings of ICML 2001, pp 282\u2013289"},{"key":"68_CR16","doi-asserted-by":"crossref","unstructured":"Li W, Yu Q, Divakaran A, Vasconcelos N (2013) Dynamic pooling for complex event recognition. In: Proceedings of ICCV 2013, pp 2728\u20132735","DOI":"10.1109\/ICCV.2013.339"},{"key":"68_CR17","doi-asserted-by":"crossref","unstructured":"Li X, Snoek CGM (2009) Visual categorization with negative examples for free. In: Proceedings of MM 2009, pp 661\u2013664","DOI":"10.1145\/1631272.1631382"},{"key":"68_CR18","doi-asserted-by":"crossref","unstructured":"Liu J, McCloskey S, Liu Y (2012) Local expert forest of score fusion for video event classification. In: Proceedings of ECCV 2012, pp 397\u2013410","DOI":"10.1007\/978-3-642-33715-4_29"},{"key":"68_CR19","unstructured":"Mann TP (2006) Numerically stable hidden Markov model implementation. http:\/\/bozeman.genome.washington.edu\/compbio\/mbt599_2006\/hmm_scaling_revised.pdf , HMM Scaling Tutorial"},{"issue":"3","key":"68_CR20","doi-asserted-by":"crossref","first-page":"86","DOI":"10.1109\/MMUL.2006.63","volume":"13","author":"M Naphade","year":"2006","unstructured":"Naphade M et al (2006) Large-scale concept ontology for multimedia. IEEE Multimed 13(3):86\u201391","journal-title":"IEEE Multimed"},{"issue":"10","key":"68_CR21","doi-asserted-by":"crossref","first-page":"1848","DOI":"10.1109\/TPAMI.2007.1124","volume":"29","author":"A Quattoni","year":"2007","unstructured":"Quattoni A, Wang S, Morency L, Collins M, Darrell T (2007) Hidden conditional random fields. IEEE Trans Pattern Anal Mach Intell 29(10):1848\u20131852","journal-title":"IEEE Trans Pattern Anal Mach Intell"},{"issue":"5","key":"68_CR22","doi-asserted-by":"crossref","first-page":"359","DOI":"10.1007\/s005300050138","volume":"7","author":"Y Rui","year":"1999","unstructured":"Rui Y, Huang TS, Mehrotra S (1999) Constructing table-of-content for videos. Multimed Syst 7(5):359\u2013368","journal-title":"Multimed Syst"},{"issue":"3","key":"68_CR23","first-page":"21","volume":"1","author":"K Shirahama","year":"2008","unstructured":"Shirahama K, Uehara K (2008) A novel topic extraction method based on bursts in video streams. Int J Hybrid Inf Technol 1(3):21\u201332","journal-title":"Int J Hybrid Inf Technol"},{"key":"68_CR24","unstructured":"Shirahama K, Uehara K (2012) Kobe university and Muroran institute of technology at TRECVID 2012 semantic indexing task. In: Proceedings of TRECVID 2012. http:\/\/www-nlpir.nist.gov\/projects\/tvpubs\/tv12.papers\/kobe-muroran.pdf"},{"key":"68_CR25","doi-asserted-by":"crossref","unstructured":"Smeaton AF, Over P, Kraaij W (2006) Evaluation campaigns and TRECVid. In: Proceedings of MIR 2006, pp 321\u2013330","DOI":"10.1145\/1178677.1178722"},{"key":"68_CR26","doi-asserted-by":"crossref","unstructured":"Smucker MD, Allan J, Carterette B (2007) A comparison of statistical significance tests for information retrieval evaluation. In: Proceedings of CIKM 2007, pp 623\u2013632","DOI":"10.1145\/1321440.1321528"},{"issue":"4","key":"68_CR27","doi-asserted-by":"crossref","first-page":"215","DOI":"10.1561\/1500000014","volume":"2","author":"CGM Snoek","year":"2009","unstructured":"Snoek CGM, Worring M (2009) Concept-based video retrieval. Found Trends Inf Retr 2(4):215\u2013322","journal-title":"Found Trends Inf Retr"},{"key":"68_CR28","unstructured":"Strassel, S et al. (2012) Creating HAVIC: heterogeneous audio visual internet collection. In: Proceedings of LREC 2012, pp 2573\u20132577"},{"key":"68_CR29","doi-asserted-by":"crossref","unstructured":"Sun C, Nevatia R (2013) ACTIVE: activity concept transitions in video event classification. In: Proceedings of ICCV 2013, pp 913\u2013920","DOI":"10.1109\/ICCV.2013.453"},{"issue":"1","key":"68_CR30","first-page":"34","volume":"82","author":"K Tanaka","year":"1999","unstructured":"Tanaka K, Ariki Y, Uehara K (1999) Organization and retrieval of video data. IEICE Trans Inf Syst 82(1):34\u201344","journal-title":"IEICE Trans Inf Syst"},{"key":"68_CR31","doi-asserted-by":"crossref","unstructured":"Vahdat A, Cannons K, Mori G, Oh S, Kim I (2013) Compositional models for video event detection: a multiple kernel learning latent variable approach. In: Proceedings of ICCV 2013, pp 1185\u2013 1192","DOI":"10.1109\/ICCV.2013.463"},{"key":"68_CR32","unstructured":"Wang SB, Quattoni A, Morency L, Demirdjian D, Darrell T (2006a) Hidden conditional random fields for gesture recognition. In: Proceedings of CVPR 2006, pp 1521\u20131527"},{"key":"68_CR33","unstructured":"Wang T, Li J, Diao Q, Hu W, Zhang Y, Dulong C (2006b) Semantic event detection using conditional random fields. In: Proceedings of CVPRW 2006"},{"key":"68_CR34","unstructured":"Yin J, Hu DH, Yang Q (2009) Spatio-temporal event detection using dynamic conditional random fields. In: Proceedings of IJCAI 2009, pp 1321\u20131326"},{"key":"68_CR35","unstructured":"Young S et al (2009) The HTK Book (for HTK Version 3.4). Cambridge University Engineering Department. http:\/\/htk.eng.cam.ac.uk\/"},{"issue":"1","key":"68_CR36","doi-asserted-by":"crossref","first-page":"70","DOI":"10.1109\/TKDE.2004.1264823","volume":"16","author":"H Yu","year":"2004","unstructured":"Yu H, Han J, Chang KC (2004) PEBL: Web page classification without negative examples. IEEE Trans Knowl Data Eng 16(1):70\u201381","journal-title":"IEEE Trans Knowl Data Eng"},{"key":"68_CR37","doi-asserted-by":"crossref","unstructured":"Zhai Y, Rasheed Z, Shah M (2004) A framework for semantic classification of scenes using finite state machines. In: Proceedings of CIVR 2004, pp 279\u2013288","DOI":"10.1007\/978-3-540-27814-6_35"},{"issue":"1","key":"68_CR38","doi-asserted-by":"crossref","first-page":"197","DOI":"10.1016\/j.patcog.2009.05.015","volume":"43","author":"J Zhang","year":"2010","unstructured":"Zhang J, Gong S (2010) Action categorization with modified hidden conditional random field. Pattern Recognit 43(1):197\u2013203","journal-title":"Pattern Recognit"}],"container-title":["International Journal of Multimedia Information Retrieval"],"original-title":[],"language":"en","link":[{"URL":"http:\/\/link.springer.com\/content\/pdf\/10.1007\/s13735-014-0068-6.pdf","content-type":"application\/pdf","content-version":"vor","intended-application":"text-mining"},{"URL":"http:\/\/link.springer.com\/article\/10.1007\/s13735-014-0068-6\/fulltext.html","content-type":"text\/html","content-version":"vor","intended-application":"text-mining"},{"URL":"http:\/\/link.springer.com\/content\/pdf\/10.1007\/s13735-014-0068-6","content-type":"unspecified","content-version":"vor","intended-application":"similarity-checking"}],"deposited":{"date-parts":[[2022,4,18]],"date-time":"2022-04-18T05:36:51Z","timestamp":1650260211000},"score":1,"resource":{"primary":{"URL":"http:\/\/link.springer.com\/10.1007\/s13735-014-0068-6"}},"subtitle":[],"short-title":[],"issued":{"date-parts":[[2014,9,28]]},"references-count":38,"journal-issue":{"issue":"1","published-print":{"date-parts":[[2015,3]]}},"alternative-id":["68"],"URL":"https:\/\/doi.org\/10.1007\/s13735-014-0068-6","relation":{},"ISSN":["2192-6611","2192-662X"],"issn-type":[{"value":"2192-6611","type":"print"},{"value":"2192-662X","type":"electronic"}],"subject":[],"published":{"date-parts":[[2014,9,28]]}}}