{"status":"ok","message-type":"work","message-version":"1.0.0","message":{"indexed":{"date-parts":[[2025,12,25]],"date-time":"2025-12-25T16:04:00Z","timestamp":1766678640987,"version":"3.37.3"},"reference-count":39,"publisher":"Springer Science and Business Media LLC","issue":"37-38","license":[{"start":{"date-parts":[[2020,7,30]],"date-time":"2020-07-30T00:00:00Z","timestamp":1596067200000},"content-version":"tdm","delay-in-days":0,"URL":"https:\/\/www.springer.com\/tdm"},{"start":{"date-parts":[[2020,7,30]],"date-time":"2020-07-30T00:00:00Z","timestamp":1596067200000},"content-version":"vor","delay-in-days":0,"URL":"https:\/\/www.springer.com\/tdm"}],"content-domain":{"domain":["link.springer.com"],"crossmark-restriction":false},"short-container-title":["Multimed Tools Appl"],"published-print":{"date-parts":[[2020,10]]},"DOI":"10.1007\/s11042-020-09312-8","type":"journal-article","created":{"date-parts":[[2020,7,30]],"date-time":"2020-07-30T11:26:38Z","timestamp":1596108398000},"page":"27995-28022","update-policy":"https:\/\/doi.org\/10.1007\/springer_crossmark_policy","source":"Crossref","is-referenced-by-count":7,"title":["Video retrieval using salient foreground region of motion vector based extracted keyframes and spatial pyramid matching"],"prefix":"10.1007","volume":"79","author":[{"ORCID":"https:\/\/orcid.org\/0000-0002-4770-9506","authenticated-orcid":false,"given":"Ajay Kumar","family":"Mallick","sequence":"first","affiliation":[]},{"given":"Susanta","family":"Mukhopadhyay","sequence":"additional","affiliation":[]}],"member":"297","published-online":{"date-parts":[[2020,7,30]]},"reference":[{"key":"9312_CR1","doi-asserted-by":"crossref","unstructured":"Achanta R, Hemami S, Estrada F, Susstrunk S (2009) Frequency-tuned salient region detection. In: IEEE conference on computer vision and pattern recognition. CVPR 2009. IEEE, pp 1597\u20131604","DOI":"10.1109\/CVPR.2009.5206596"},{"key":"9312_CR2","unstructured":"Albregtsen F, et al. (2008) Statistical texture measures computed from gray level coocurrence matrices. Image Processing Laboratory, Department of Informatics, University of Oslo, p 5"},{"issue":"11","key":"9312_CR3","doi-asserted-by":"publisher","first-page":"14465","DOI":"10.1007\/s11042-018-6826-3","volume":"78","author":"SS Aote","year":"2019","unstructured":"Aote SS, Potnurwar A (2019) An automatic video annotation framework based on two level keyframe extraction mechanism. Multimed Tools Appl 78 (11):14465\u201314484","journal-title":"Multimed Tools Appl"},{"key":"9312_CR4","doi-asserted-by":"crossref","unstructured":"Bay H, Tuytelaars T, Van Gool L (2006) Surf: speeded up robust features. In: European conference on computer vision. Springer, pp 404\u2013417","DOI":"10.1007\/11744023_32"},{"key":"9312_CR5","doi-asserted-by":"publisher","first-page":"429","DOI":"10.1016\/j.eswa.2018.11.016","volume":"119","author":"B-B Benuwa","year":"2019","unstructured":"Benuwa B-B, Zhan Y, Monney A, Ghansah B, Ansah EK (2019) Video semantic analysis based kernel locality-sensitive discriminative sparse representation. Exp Syst Appl 119:429\u2013440","journal-title":"Exp Syst Appl"},{"issue":"9","key":"9312_CR6","doi-asserted-by":"publisher","first-page":"1667","DOI":"10.1109\/TPAMI.2011.265","volume":"34","author":"L Duan","year":"2011","unstructured":"Duan L, Xu D, Tsang IW-H, Luo J (2011) Visual event recognition in videos by learning from web data. IEEE Trans Pattern Anal Mach Intell 34(9):1667\u20131680","journal-title":"IEEE Trans Pattern Anal Mach Intell"},{"issue":"9","key":"9312_CR7","doi-asserted-by":"publisher","first-page":"1627","DOI":"10.1109\/TPAMI.2009.167","volume":"32","author":"PF Felzenszwalb","year":"2009","unstructured":"Felzenszwalb PF, Girshick RB, McAllester D (2009) Object detection with discriminatively trained part-based models. IEEE Trans Pattern Anal Mach Intell 32(9):1627\u20131645","journal-title":"IEEE Trans Pattern Anal Mach Intell"},{"issue":"7","key":"9312_CR8","doi-asserted-by":"publisher","first-page":"1762","DOI":"10.1109\/TMM.2018.2885237","volume":"21","author":"Y Feng","year":"2018","unstructured":"Feng Y, Zhou P, Xu J, Ji S, Wu D, Video big data retrieval over media cloud (2018) A context-aware online learning approach. IEEE Trans Multimed 21(7):1762\u20131777","journal-title":"IEEE Trans Multimed"},{"issue":"9","key":"9312_CR9","doi-asserted-by":"publisher","first-page":"2045","DOI":"10.1109\/TMM.2017.2729019","volume":"19","author":"L Gao","year":"2017","unstructured":"Gao L, Guo Z, Zhang H, Xu X, Shen HT (2017) Video captioning with attention-based lstm and semantic consistency. IEEE Trans Multimed 19 (9):2045\u20132055","journal-title":"IEEE Trans Multimed"},{"issue":"1","key":"9312_CR10","doi-asserted-by":"publisher","first-page":"69","DOI":"10.1007\/s11554-006-0001-1","volume":"1","author":"C Gianluigi","year":"2006","unstructured":"Gianluigi C, Raimondo S (2006) An innovative algorithm for key frame extraction in video summarization. J Real-Time Image Process 1(1):69\u201388","journal-title":"J Real-Time Image Process"},{"key":"9312_CR11","doi-asserted-by":"crossref","unstructured":"Grauman K, Darrell T (2005) The pyramid match kernel: discriminative classification with sets of image features. In: Tenth IEEE international conference on computer vision (ICCV\u201905) volume 1, vol 2. IEEE, pp 1458\u20131465","DOI":"10.1109\/ICCV.2005.239"},{"issue":"3","key":"9312_CR12","doi-asserted-by":"publisher","first-page":"73","DOI":"10.3390\/e18030073","volume":"18","author":"Y Guo","year":"2016","unstructured":"Guo Y, Xu Q, Sun S, Luo X, Sbert M (2016) Selecting video key frames based on relative entropy and the extreme studentized deviate test. Entropy 18 (3):73","journal-title":"Entropy"},{"key":"9312_CR13","unstructured":"Itti L, Braun J, Lee DK, Koch C (1999) Attentional modulation of human pattern discrimination psychophysics reproduced by a quantitative model. In: Advances in neural information processing systems, pp 789\u2013795"},{"key":"9312_CR14","doi-asserted-by":"crossref","unstructured":"Jiang H, Wang J, Yuan Z, Liu T, Zheng N, Li S (2011) Automatic salient object segmentation based on context and shape prior. In: BMVC, vol 6, p 9","DOI":"10.5244\/C.25.110"},{"key":"9312_CR15","doi-asserted-by":"crossref","unstructured":"Jiang H, Wang J, Yuan Z, Wu Y, Zheng N, Li S (2013) Salient object detection: a discriminative regional feature integration approach. In: Proceedings of the IEEE conference on computer vision and pattern recognition, pp 2083\u20132090","DOI":"10.1109\/CVPR.2013.271"},{"key":"9312_CR16","doi-asserted-by":"crossref","unstructured":"Kim J, Han D, Tai Y-W, Kim J (2014) Salient region detection via high-dimensional color transform. In: Proceedings of the IEEE conference on computer vision and pattern recognition, pp 883\u2013890","DOI":"10.1109\/CVPR.2014.118"},{"key":"9312_CR17","doi-asserted-by":"crossref","unstructured":"Klein DA, Frintrop S (2011) Center-surround divergence of feature statistics for salient object detection. In: 2011 IEEE international conference on computer vision (ICCV). IEEE, pp 2214\u20132219","DOI":"10.1109\/ICCV.2011.6126499"},{"key":"9312_CR18","unstructured":"Kondor R, Jebara T (2003) A kernel between sets of vectors. In: Proceedings of the 20th international conference on machine learning (ICML-03), pp 361\u2013368"},{"key":"9312_CR19","doi-asserted-by":"crossref","unstructured":"Law-To J, Joly A, Boujemaa N (2007) Muscle-vcd-2007: a live benchmark for video copy detection. http:\/\/www-rocq.inria.fr\/imedia\/civr-bench\/","DOI":"10.1145\/1282280.1282336"},{"key":"9312_CR20","doi-asserted-by":"crossref","unstructured":"Liu J, Luo J, Shah M (2009) Recognizing realistic actions from videos in the wild. Citeseer","DOI":"10.1109\/CVPR.2009.5206744"},{"key":"9312_CR21","unstructured":"Lyu S (2005) Mercer kernels for object recognition with local features. In: 2005 IEEE Computer Society conference on computer vision and pattern recognition (CVPR\u201905), vol 2. IEEE, pp 223\u2013229"},{"key":"9312_CR22","doi-asserted-by":"crossref","unstructured":"Mallick AK, Mukhopadhyay S (2019) Video retrieval based on motion vector key frame extraction and spatial pyramid matching. In: 2019 6th International conference on signal processing and integrated networks (SPIN). IEEE, pp 687\u2013692","DOI":"10.1109\/SPIN.2019.8711781"},{"issue":"8","key":"9312_CR23","doi-asserted-by":"publisher","first-page":"873","DOI":"10.1109\/34.946990","volume":"23","author":"G Medioni","year":"2001","unstructured":"Medioni G, Cohen I, Br\u00e9mond F, Hongeng S, Nevatia R (2001) Event detection and analysis from video streams. IEEE Trans Pattern Anal Mach Intell 23(8):873\u2013889","journal-title":"IEEE Trans Pattern Anal Mach Intell"},{"issue":"3","key":"9312_CR24","doi-asserted-by":"publisher","first-page":"790","DOI":"10.1016\/j.compeleceng.2012.11.020","volume":"39","author":"E Mendi","year":"2013","unstructured":"Mendi E, Clemente HB, Bayrak C (2013) Sports video summarization based on motion analysis. Comput Electr Eng 39(3):790\u2013796","journal-title":"Comput Electr Eng"},{"key":"9312_CR25","doi-asserted-by":"crossref","unstructured":"Perazzi F, Kr\u00e4henb\u00fchl P, Pritch Y, Hornung A (2012) Saliency filters: contrast based filtering for salient region detection. In: 2012 IEEE conference on computer vision and pattern recognition (CVPR). IEEE, pp 733\u2013740","DOI":"10.1109\/CVPR.2012.6247743"},{"key":"9312_CR26","doi-asserted-by":"crossref","unstructured":"Qiang Z, Xu Q, Sun S, Sbert M (2016) Key frame extraction based on motion vector. In: Pacific rim conference on multimedia. Springer, pp 387\u2013395","DOI":"10.1007\/978-3-319-48896-7_38"},{"key":"9312_CR27","unstructured":"Shashua A, Hazan T (2005) Algebraic set kernels with application to inference over local image representations. In: Advances in neural information processing systems, pp 1257\u20131264"},{"issue":"11","key":"9312_CR28","doi-asserted-by":"publisher","first-page":"1587","DOI":"10.1109\/TCSVT.2008.2005607","volume":"18","author":"J Shen","year":"2008","unstructured":"Shen J, Tao D, Li X (2008) Modality mixture projections for semantic video event detection. IEEE Trans Circ Syst Video Technol 18(11):1587\u20131596","journal-title":"IEEE Trans Circ Syst Video Technol"},{"issue":"2","key":"9312_CR29","doi-asserted-by":"publisher","first-page":"252","DOI":"10.1109\/TMM.2007.911830","volume":"10","author":"M-L Shyu","year":"2008","unstructured":"Shyu M-L, Xie Z, Chen M, Chen S-C (2008) Video semantic event\/concept detection using a subspace-based multimedia data mining framework. IEEE Trans Multimed 10(2):252\u2013259","journal-title":"IEEE Trans Multimed"},{"key":"9312_CR30","doi-asserted-by":"crossref","unstructured":"Siva P, Russell C, Xiang T, Agapito L (2013) Looking beyond the image: Unsupervised learning for object saliency and detection. In: Proceedings of the IEEE conference on computer vision and pattern recognition, pp 3238\u20133245","DOI":"10.1109\/CVPR.2013.416"},{"key":"9312_CR31","doi-asserted-by":"publisher","first-page":"103557","DOI":"10.1016\/j.engappai.2020.103557","volume":"90","author":"N Spola\u00f4r","year":"2020","unstructured":"Spola\u00f4r N, Lee HD, Takaki WSR, Ensina LA, Coy CSR, Wu FC (2020) A systematic review on content-based video retrieval. Eng Appl Artif Intell 90:103557","journal-title":"Eng Appl Artif Intell"},{"key":"9312_CR32","doi-asserted-by":"crossref","unstructured":"Su B, Lu S, Tan CL (2011) Blurred image region detection and classification. In: Proceedings of the 19th ACM international conference on multimedia. ACM, pp 1397\u20131400","DOI":"10.1145\/2072298.2072024"},{"issue":"2","key":"9312_CR33","first-page":"133","volume":"23","author":"SP Verma","year":"2006","unstructured":"Verma SP, Ruiz AQ (2006) Critical values for six dixon tests for outliers in normal samples up to sizes 100, and applications in science and engineering. Rev Mex Cienc Geol 23(2):133\u2013161","journal-title":"Rev Mex Cienc Geol"},{"key":"9312_CR34","doi-asserted-by":"crossref","unstructured":"Wallraven C, Caputo B, Graf A (2003) Recognition with local features: the kernel recipe. In: null. IEEE, p 257","DOI":"10.1109\/ICCV.2003.1238351"},{"issue":"3","key":"9312_CR35","doi-asserted-by":"publisher","first-page":"634","DOI":"10.1109\/TMM.2017.2749159","volume":"20","author":"X Wang","year":"2017","unstructured":"Wang X, Gao L, Wang P, Sun X, Liu X (2017) Two-stream 3-d convnet fusion for action recognition in videos with arbitrary size and length. IEEE Trans Multimed 20(3):634\u2013644","journal-title":"IEEE Trans Multimed"},{"issue":"5","key":"9312_CR36","doi-asserted-by":"publisher","first-page":"461","DOI":"10.4103\/0377-2063.90172","volume":"57","author":"KK Warhade","year":"2011","unstructured":"Warhade KK, Merchant SN (2011) Performance evaluation of shot boundary detection metrics in the presence of object and camera motion. IETE J Res 57(5):461\u2013466","journal-title":"IETE J Res"},{"issue":"3","key":"9312_CR37","doi-asserted-by":"publisher","first-page":"1053","DOI":"10.1007\/s11042-013-1530-9","volume":"73","author":"B Wu","year":"2014","unstructured":"Wu B, Xu L (2014) Integrating bottom-up and top-down visual stimulus for saliency detection in news video. Multimed Tools Appl 73(3):1053\u20131075","journal-title":"Multimed Tools Appl"},{"key":"9312_CR38","doi-asserted-by":"crossref","unstructured":"Wu G, Liu L, Guo Y, Ding G, Han J, Shen J, Shao L (2017) Unsupervised deep video hashing with balanced rotation. In: IJCAI","DOI":"10.24963\/ijcai.2017\/429"},{"key":"9312_CR39","doi-asserted-by":"publisher","first-page":"736","DOI":"10.1016\/j.ins.2014.03.088","volume":"278","author":"Q Xu","year":"2014","unstructured":"Xu Q, Liu Y, Li X, Yang Z, Wang J, Sbert M, Scopigno R (2014) Browsing and exploration of video sequences: a new scheme for key frame extraction and 3d visualization using entropy based Jensen divergence. Inf Sci 278:736\u2013756","journal-title":"Inf Sci"}],"container-title":["Multimedia Tools and Applications"],"original-title":[],"language":"en","link":[{"URL":"https:\/\/link.springer.com\/content\/pdf\/10.1007\/s11042-020-09312-8.pdf","content-type":"application\/pdf","content-version":"vor","intended-application":"text-mining"},{"URL":"https:\/\/link.springer.com\/article\/10.1007\/s11042-020-09312-8\/fulltext.html","content-type":"text\/html","content-version":"vor","intended-application":"text-mining"},{"URL":"https:\/\/link.springer.com\/content\/pdf\/10.1007\/s11042-020-09312-8.pdf","content-type":"application\/pdf","content-version":"vor","intended-application":"similarity-checking"}],"deposited":{"date-parts":[[2022,11,5]],"date-time":"2022-11-05T04:40:06Z","timestamp":1667623206000},"score":1,"resource":{"primary":{"URL":"https:\/\/link.springer.com\/10.1007\/s11042-020-09312-8"}},"subtitle":[],"short-title":[],"issued":{"date-parts":[[2020,7,30]]},"references-count":39,"journal-issue":{"issue":"37-38","published-print":{"date-parts":[[2020,10]]}},"alternative-id":["9312"],"URL":"https:\/\/doi.org\/10.1007\/s11042-020-09312-8","relation":{},"ISSN":["1380-7501","1573-7721"],"issn-type":[{"type":"print","value":"1380-7501"},{"type":"electronic","value":"1573-7721"}],"subject":[],"published":{"date-parts":[[2020,7,30]]},"assertion":[{"value":"19 September 2019","order":1,"name":"received","label":"Received","group":{"name":"ArticleHistory","label":"Article History"}},{"value":"13 June 2020","order":2,"name":"revised","label":"Revised","group":{"name":"ArticleHistory","label":"Article History"}},{"value":"9 July 2020","order":3,"name":"accepted","label":"Accepted","group":{"name":"ArticleHistory","label":"Article History"}},{"value":"30 July 2020","order":4,"name":"first_online","label":"First Online","group":{"name":"ArticleHistory","label":"Article History"}}]}}