{"status":"ok","message-type":"work","message-version":"1.0.0","message":{"indexed":{"date-parts":[[2025,10,28]],"date-time":"2025-10-28T15:02:44Z","timestamp":1761663764836},"reference-count":54,"publisher":"Springer Science and Business Media LLC","issue":"20","license":[{"start":{"date-parts":[[2018,3,28]],"date-time":"2018-03-28T00:00:00Z","timestamp":1522195200000},"content-version":"tdm","delay-in-days":0,"URL":"http:\/\/www.springer.com\/tdm"}],"content-domain":{"domain":["link.springer.com"],"crossmark-restriction":false},"short-container-title":["Multimed Tools Appl"],"published-print":{"date-parts":[[2018,10]]},"DOI":"10.1007\/s11042-018-5882-z","type":"journal-article","created":{"date-parts":[[2018,3,28]],"date-time":"2018-03-28T14:39:54Z","timestamp":1522247994000},"page":"26635-26655","update-policy":"http:\/\/dx.doi.org\/10.1007\/springer_crossmark_policy","source":"Crossref","is-referenced-by-count":60,"title":["Deep Event Learning boosT-up Approach: DELTA"],"prefix":"10.1007","volume":"77","author":[{"given":"Krishan","family":"Kumar","sequence":"first","affiliation":[]},{"given":"Deepti D.","family":"Shrimankar","sequence":"additional","affiliation":[]}],"member":"297","published-online":{"date-parts":[[2018,3,28]]},"reference":[{"key":"5882_CR1","doi-asserted-by":"crossref","unstructured":"Alfaro et al (2016) Action recognition in video using sparse coding and relative features. CVPR, 2688\u20132697","DOI":"10.1109\/CVPR.2016.294"},{"issue":"6","key":"5882_CR2","first-page":"729","volume":"24","author":"J Almeida","year":"2013","unstructured":"Almeida J et al (2013) Online video summarization on compressed domain. JVCIR 24(6):729\u2013738","journal-title":"JVCIR"},{"key":"5882_CR3","unstructured":"Anurag K et al (2017) A novel superpixel based color spatial feature for salient object detection. IEEE CICT\u201917"},{"issue":"2","key":"5882_CR4","first-page":"78","volume":"10","author":"R Brunelli","year":"1999","unstructured":"Brunelli R et al (1999) A survey on the automatic indexing of video data. JVCIR 10(2):78\u2013112","journal-title":"JVCIR"},{"key":"5882_CR5","first-page":"I","volume":"1","author":"P Chang","year":"2002","unstructured":"Chang P et al (2002) Extract highlights from baseball game video with hidden markov models. IEEE ICIP 1:I-609","journal-title":"IEEE ICIP"},{"key":"5882_CR6","doi-asserted-by":"crossref","unstructured":"Chang et al (2016) They are not equally reliable: semantic event search using differentiated concept classifiers. CVPR, 1884\u20131893","DOI":"10.1109\/CVPR.2016.208"},{"issue":"7","key":"5882_CR7","first-page":"717","volume":"12","author":"Y Fu","year":"2010","unstructured":"Fu Y et al (2010) Multi view video summmarization. IEEE TMM 12(7):717\u2013729","journal-title":"IEEE TMM"},{"key":"5882_CR8","unstructured":"Fu Y et al (2014) Multi-view metric learning for multi-video video summarization, CoRR, vol. abs\/1405.6434, [Online]. Available: 1405.6434"},{"key":"5882_CR9","unstructured":"Gagandeep S et al (2017) PICS: a novel technique for video summarization. Springer MISP\u201917"},{"key":"5882_CR10","doi-asserted-by":"crossref","unstructured":"Gan et al (2015) Devnet: adeep event network for multimedia event detection and evidence recounting. CVPR, 2568\u20132577","DOI":"10.1109\/CVPR.2015.7298872"},{"key":"5882_CR11","doi-asserted-by":"crossref","unstructured":"Gygli et al (2015) Video summarization by learning submodular mixtures of objectives. CVPR, 3090\u20133098","DOI":"10.1109\/CVPR.2015.7298928"},{"key":"5882_CR12","unstructured":"Hao W et al (2006) Generalized multiclass adaboost and its applications to multimedia classification. CVPR\u201906 Workshop, 113\u2013113"},{"issue":"9","key":"5882_CR13","first-page":"1652","volume":"10","author":"H Jasim","year":"2016","unstructured":"Jasim H et al (2016) Surveillance video summarization based on histogram differencing and sum conditional variance. WASET Inter J Comp Elect Automat Control Inform Engg 10(9):1652\u20131657","journal-title":"WASET Inter J Comp Elect Automat Control Inform Engg"},{"issue":"8","key":"5882_CR14","first-page":"1174","volume":"17","author":"G Jiang","year":"2015","unstructured":"Jiang G et al (2015) Super fast event recognition in internet videos. IEEE TMM 17(8):1174\u20131186","journal-title":"IEEE TMM"},{"key":"5882_CR15","unstructured":"Jones et al (2006) Method and system for object detection in digital images. U.S. Patent No. 7,099,510.29"},{"key":"5882_CR16","unstructured":"Krishan K et al (2017) F-DES: fast and deep event summarization. IEEE TMM"},{"key":"5882_CR17","unstructured":"Krishan K et al (2017) SOMES: an efficient SOM technique for event summarization in multi-view surveillance videos. Springer ICACNI\u201917"},{"key":"5882_CR18","unstructured":"Krishan K et al (2017) V-LESS: a video from linear event summarieS. Springer CVIP\u201917"},{"key":"5882_CR19","unstructured":"Krishan K et al (2017) D-CAD: deep and crowded anomaly detection. ACM ICCCT\u201917"},{"key":"5882_CR20","unstructured":"Krizhevsky A et al (2012) Imagenet classification with deep convolutional neural networks. ANIPS, 1097\u20131105"},{"key":"5882_CR21","first-page":"231","volume":"7","author":"A Krogh","year":"1995","unstructured":"Krogh A et al (1995) Neural network ensembles, cross validation, and active learning. ANIPS 7:231\u2013238","journal-title":"ANIPS"},{"issue":"8","key":"5882_CR22","first-page":"1166","volume":"17","author":"S Kuanar","year":"2015","unstructured":"Kuanar S et al (2015) Multi-view video summarization using bipartite matching constrained optimum-path forest clustering. IEEE TMM 17(8):1166\u20131173","journal-title":"IEEE TMM"},{"key":"5882_CR23","doi-asserted-by":"crossref","unstructured":"Kumar K et al (2016) Equal partition based clustering approach for event summarization in videos. SITIS, 119\u2013126","DOI":"10.1109\/SITIS.2016.27"},{"key":"5882_CR24","unstructured":"Kumar K et al (2017) Key-lectures: keyframes extraction in video lectures. Springer MISP\u201917"},{"key":"5882_CR25","unstructured":"Kumar K et al (2017) Eratosthenes sieve based key-frame extraction technique for event summarization in videos. MTAP, 1\u201322"},{"key":"5882_CR26","doi-asserted-by":"crossref","unstructured":"Kumar K et al (2017) Event BAGGING: a novel event summarization approach in multi-view surveillance videos IEEE IESC\u201917","DOI":"10.1109\/IESPC.2017.8071874"},{"issue":"6","key":"5882_CR27","first-page":"1497","volume":"16","author":"S Lu","year":"2014","unstructured":"Lu S et al (2014) A bag-of-importance model with locality-constrained coding based feature learning for video summarization. IEEE TMM 16(6):1497\u20131509","journal-title":"IEEE TMM"},{"issue":"5","key":"5882_CR28","first-page":"907","volume":"7","author":"F Ma","year":"2005","unstructured":"Ma F et al. (2005) A generic framework of user attention model and its application in video summarization. IEEE TMM 7(5):907\u2013919","journal-title":"IEEE TMM"},{"issue":"8","key":"5882_CR29","first-page":"2214","volume":"16","author":"M Mazloom","year":"2014","unstructured":"Mazloom M et al (2014) Conceptlets: selective semantics for classifying video events. IEEE TMM 16(8):2214\u20132228","journal-title":"IEEE TMM"},{"issue":"7","key":"5882_CR30","first-page":"1378","volume":"18","author":"M Mazloom","year":"2016","unstructured":"Mazloom M et al (2016) TagBook: a semantic video representation without supervision for event detection. IEEE TMM 18(7):1378\u20131388","journal-title":"IEEE TMM"},{"issue":"1","key":"5882_CR31","first-page":"88","volume":"14","author":"M Merler","year":"2012","unstructured":"Merler M et al (2012) Semantic model vectors for complex video event recognition. IEEE TMM 14(1):88\u2013101","journal-title":"IEEE TMM"},{"issue":"2","key":"5882_CR32","first-page":"219","volume":"6","author":"P Mundur","year":"2006","unstructured":"Mundur P et al (2006) Keyframe-based video summarization using Delaunay clustering. IJDL 6(2):219\u2013232","journal-title":"IJDL"},{"key":"5882_CR33","unstructured":"Musfequs S et al (2016) Video summarization using geometric primitives. IEEE DICTA\u201916"},{"key":"5882_CR34","unstructured":"Nagasaka A (1991) Automatic video indexing and full-video search for object appearances. In: Conf. on visual database system, pp 119\u2013133"},{"issue":"1","key":"5882_CR35","doi-asserted-by":"publisher","first-page":"165","DOI":"10.1109\/JSTSP.2014.2331916","volume":"9","author":"H Ou","year":"2015","unstructured":"Ou H et al (2015) On-line multi-view video summarization for wireless video sensor network. IEEE J S T Sig Process 9(1):165\u2013179","journal-title":"IEEE J S T Sig Process"},{"issue":"3","key":"5882_CR36","first-page":"447","volume":"19","author":"C Panagiotakis","year":"2009","unstructured":"Panagiotakis C et al (2009) Equivalent key frames selection based on iso-content principles. TCSVT 19(3):447\u20136451","journal-title":"TCSVT"},{"key":"5882_CR37","doi-asserted-by":"crossref","unstructured":"Potapov D et al (2014) Category-specific video summarization. ECCV, 540\u2013555","DOI":"10.1007\/978-3-319-10599-4_35"},{"issue":"2","key":"5882_CR38","first-page":"233","volume":"18","author":"S Qian","year":"2016","unstructured":"Qian S et al (2016) Multi-modal event topic model for social event analysis. IEEE TMM 18(2):233\u2013246","journal-title":"IEEE TMM"},{"key":"5882_CR39","doi-asserted-by":"crossref","unstructured":"Singh N et al (2016) A convex hull approach in conjunction with Gaussian mixture model for salient object detection. DSP, 22\u201331","DOI":"10.1016\/j.dsp.2016.05.003"},{"issue":"8","key":"5882_CR40","doi-asserted-by":"publisher","first-page":"10521","DOI":"10.1007\/s11042-016-3676-8","volume":"76","author":"Navjot Singh","year":"2016","unstructured":"Singh N et al (2016) A novel position prior using fusion of rule of thirds and image center for salient object detection MTAP. https:\/\/doi.org\/10.1007\/s11042-016-3676-8","journal-title":"Multimedia Tools and Applications"},{"issue":"6","key":"5882_CR41","doi-asserted-by":"publisher","first-page":"449","DOI":"10.1006\/rtim.1999.0197","volume":"6","author":"X Sun","year":"2000","unstructured":"Sun X et al (2000) Video summarization using R-sequences. Real-Time Imag 6 (6):449\u2013459","journal-title":"Real-Time Imag"},{"key":"5882_CR42","doi-asserted-by":"crossref","unstructured":"Valdes V et al (2008) Binary tree based on-line video summarization. ACM TRECVid video summarization workshop, 134\u2013138","DOI":"10.1145\/1463563.1463588"},{"key":"5882_CR43","unstructured":"Vezhnevets A et al (2007) Avoiding boosting overfitting by removing confusing samples. Machine learning: ECML, 430\u2013441"},{"issue":"4","key":"5882_CR44","first-page":"975","volume":"14","author":"M Wang","year":"2012","unstructured":"Wang M et al (2012) Event driven web video summarization by tag localization and key-shot identification. IEEE TMM 14(4):975\u2013985","journal-title":"IEEE TMM"},{"issue":"2","key":"5882_CR45","first-page":"289","volume":"16","author":"S Wang","year":"2014","unstructured":"Wang S et al (2014) Semi-supervised multiple feature analysis for action recognition. IEEE TMM 16(2):289\u2013298","journal-title":"IEEE TMM"},{"issue":"5","key":"5882_CR46","first-page":"1303","volume":"16","author":"F Wang","year":"2014","unstructured":"Wang F et al (2014) Video event detection using motion relativity and feature selection. IEEE TMM 16(5):1303\u20131315","journal-title":"IEEE TMM"},{"key":"5882_CR47","doi-asserted-by":"crossref","unstructured":"Wang et al (2015) Video event recognition with deep hierarchical context model. CVPR, 4418\u20134427","DOI":"10.1109\/CVPR.2015.7299071"},{"key":"5882_CR48","unstructured":"Weber B (2008) Generic object detection using AdaBoost. Department of Computer Science University of California, Santa Cruz"},{"key":"5882_CR49","unstructured":"Wu B et al (2004) Fast rotation invariant multi-view face detection based on real adaboost. IEEE FGR\u201904, 79\u201384"},{"key":"5882_CR50","first-page":"1947","volume":"3","author":"Z Xiong","year":"2004","unstructured":"Xiong Z et al (2004) Effective and efficient sports highlight extraction using the minimum description length criterion in selecting GMM structures. IEEE ICME\u201904 3:1947\u20131950","journal-title":"IEEE ICME\u201904"},{"key":"5882_CR51","doi-asserted-by":"crossref","unstructured":"Xu et al (2015) A discriminative CNN video representation for event detection. CVPR, 1798\u20131807","DOI":"10.1109\/CVPR.2015.7298789"},{"key":"5882_CR52","first-page":"23","volume":"23,3","author":"B Xu","year":"2016","unstructured":"Xu B et al (2016) Fast summarization of user-generated videos: exploiting semantic, emotional, & quality clues. IEEE TMM 23,3:23\u201333","journal-title":"IEEE TMM"},{"issue":"3","key":"5882_CR53","first-page":"346","volume":"17","author":"X Yang","year":"2015","unstructured":"Yang X et al (2015) Automatic visual concept learning for social event understanding. IEEE TMM 17(3):346\u2013358","journal-title":"IEEE TMM"},{"issue":"4","key":"5882_CR54","first-page":"1206","volume":"14","author":"T Zhang","year":"2012","unstructured":"Zhang T et al (2012) A generic framework for video annotation via semi-supervised learning. IEEE TMM 14(4):1206\u20131219","journal-title":"IEEE TMM"}],"container-title":["Multimedia Tools and Applications"],"original-title":[],"language":"en","link":[{"URL":"http:\/\/link.springer.com\/article\/10.1007\/s11042-018-5882-z\/fulltext.html","content-type":"text\/html","content-version":"vor","intended-application":"text-mining"},{"URL":"http:\/\/link.springer.com\/content\/pdf\/10.1007\/s11042-018-5882-z.pdf","content-type":"application\/pdf","content-version":"vor","intended-application":"text-mining"},{"URL":"http:\/\/link.springer.com\/content\/pdf\/10.1007\/s11042-018-5882-z.pdf","content-type":"application\/pdf","content-version":"vor","intended-application":"similarity-checking"}],"deposited":{"date-parts":[[2019,10,13]],"date-time":"2019-10-13T16:31:12Z","timestamp":1570984272000},"score":1,"resource":{"primary":{"URL":"http:\/\/link.springer.com\/10.1007\/s11042-018-5882-z"}},"subtitle":[],"short-title":[],"issued":{"date-parts":[[2018,3,28]]},"references-count":54,"journal-issue":{"issue":"20","published-print":{"date-parts":[[2018,10]]}},"alternative-id":["5882"],"URL":"https:\/\/doi.org\/10.1007\/s11042-018-5882-z","relation":{},"ISSN":["1380-7501","1573-7721"],"issn-type":[{"value":"1380-7501","type":"print"},{"value":"1573-7721","type":"electronic"}],"subject":[],"published":{"date-parts":[[2018,3,28]]},"assertion":[{"value":"22 March 2017","order":1,"name":"received","label":"Received","group":{"name":"ArticleHistory","label":"Article History"}},{"value":"19 February 2018","order":2,"name":"revised","label":"Revised","group":{"name":"ArticleHistory","label":"Article History"}},{"value":"13 March 2018","order":3,"name":"accepted","label":"Accepted","group":{"name":"ArticleHistory","label":"Article History"}},{"value":"28 March 2018","order":4,"name":"first_online","label":"First Online","group":{"name":"ArticleHistory","label":"Article History"}}]}}