{"status":"ok","message-type":"work","message-version":"1.0.0","message":{"indexed":{"date-parts":[[2026,3,27]],"date-time":"2026-03-27T08:35:20Z","timestamp":1774600520917,"version":"3.50.1"},"publisher-location":"Cham","reference-count":46,"publisher":"Springer International Publishing","isbn-type":[{"value":"9783319464831","type":"print"},{"value":"9783319464848","type":"electronic"}],"license":[{"start":{"date-parts":[[2016,1,1]],"date-time":"2016-01-01T00:00:00Z","timestamp":1451606400000},"content-version":"tdm","delay-in-days":0,"URL":"http:\/\/www.springer.com\/tdm"},{"start":{"date-parts":[[2016,1,1]],"date-time":"2016-01-01T00:00:00Z","timestamp":1451606400000},"content-version":"vor","delay-in-days":0,"URL":"http:\/\/www.springer.com\/tdm"}],"content-domain":{"domain":["link.springer.com"],"crossmark-restriction":false},"short-container-title":[],"published-print":{"date-parts":[[2016]]},"DOI":"10.1007\/978-3-319-46484-8_1","type":"book-chapter","created":{"date-parts":[[2016,9,16]],"date-time":"2016-09-16T08:35:32Z","timestamp":1474014932000},"page":"3-19","update-policy":"https:\/\/doi.org\/10.1007\/springer_crossmark_policy","source":"Crossref","is-referenced-by-count":88,"title":["Query-Focused Extractive Video Summarization"],"prefix":"10.1007","author":[{"given":"Aidean","family":"Sharghi","sequence":"first","affiliation":[]},{"given":"Boqing","family":"Gong","sequence":"additional","affiliation":[]},{"given":"Mubarak","family":"Shah","sequence":"additional","affiliation":[]}],"member":"297","published-online":{"date-parts":[[2016,9,17]]},"reference":[{"key":"1_CR1","doi-asserted-by":"crossref","unstructured":"Pritch, Y., Rav-Acha, A., Gutman, A., Peleg, S.: Webcam synopsis: peeking around the world. In: IEEE 11th International Conference on Computer Vision 2007, ICCV 2007, pp. 1\u20138. IEEE (2007)","DOI":"10.1109\/ICCV.2007.4408934"},{"key":"1_CR2","doi-asserted-by":"crossref","unstructured":"Pal, C., Jojic, N.: Interactive montages of sprites for indexing and summarizing security video. In: IEEE Computer Society Conference on CVPR 2005, vol. 2. IEEE (2005)","DOI":"10.1109\/CVPR.2005.192"},{"key":"1_CR3","unstructured":"Kang, H.W., Matsushita, Y., Tang, X., Chen, X.Q.: Space-time video montage. In: IEEE Computer Society Conference on CVPR 2006, vol. 2. IEEE (2006)"},{"key":"1_CR4","series-title":"Studies in Computational Intelligence","doi-asserted-by":"publisher","first-page":"27","DOI":"10.1007\/978-3-642-02900-4_2","volume-title":"Recent Advances in Multimedia Signal Processing and Communications","author":"RM Jiang","year":"2009","unstructured":"Jiang, R.M., Sadka, A.H., Crookes, D.: Advances in video summarization and skimming. In: Grgic, M., Delac, K., Ghanbari, M. (eds.) Recent Advances in Multimedia Signal Processing and Communications. SCI, vol. 231, pp. 27\u201350. Springer, Heidelberg (2009)"},{"key":"1_CR5","doi-asserted-by":"crossref","unstructured":"Rav-Acha, A., Pritch, Y., Peleg, S.: Making a long video short: dynamic video synopsis. In: 2006 IEEE Computer Society Conference on CVPR, vol. 1. IEEE (2006)","DOI":"10.1109\/CVPR.2006.179"},{"key":"1_CR6","doi-asserted-by":"publisher","first-page":"862","DOI":"10.1145\/1141911.1141967","volume":"25","author":"DB Goldman","year":"2006","unstructured":"Goldman, D.B., Curless, B., Salesin, D., Seitz, S.M.: Schematic storyboarding for video visualization and editing. ACM Trans. Graph. (TOG) 25, 862\u2013871 (2006). ACM","journal-title":"ACM Trans. Graph. (TOG)"},{"key":"1_CR7","series-title":"Lecture Notes in Computer Science","doi-asserted-by":"publisher","first-page":"403","DOI":"10.1007\/3-540-47979-1_27","volume-title":"Computer Vision \u2014 ECCV 2002","author":"T Liu","year":"2002","unstructured":"Liu, T., Kender, J.R.: Optimization algorithms for the selection of key frame sequences of variable length. In: Heyden, A., Sparr, G., Nielsen, M., Johansen, P. (eds.) ECCV 2002. LNCS, vol. 2353, pp. 403\u2013417. Springer, Heidelberg (2002)"},{"key":"1_CR8","series-title":"Lecture Notes in Computer Science","doi-asserted-by":"publisher","first-page":"388","DOI":"10.1007\/3-540-47979-1_26","volume-title":"Computer Vision \u2014 ECCV 2002","author":"A Aner","year":"2002","unstructured":"Aner, A., Kender, J.R.: Video summaries through mosaic-based shot and scene clustering. In: Heyden, A., Sparr, G., Nielsen, M., Johansen, P. (eds.) ECCV 2002. LNCS, vol. 2353, pp. 388\u2013402. Springer, Heidelberg (2002)"},{"key":"1_CR9","doi-asserted-by":"crossref","unstructured":"Vasconcelos, N., Lippman, A.: A spatiotemporal motion model for video summarization. In: Proceedings of IEEE Computer Society Conference on CVPR 1998, pp. 361\u2013366. IEEE (1998)","DOI":"10.1109\/CVPR.1998.698631"},{"key":"1_CR10","doi-asserted-by":"crossref","unstructured":"Wolf, W.: Key frame selection by motion analysis. In: Proceedings of 1996 IEEE International Conference on Acoustics, Speech, and Signal Processing, ICASSP 1996, vol. 2, pp. 1228\u20131231. IEEE (1996)","DOI":"10.1109\/ICASSP.1996.543588"},{"key":"1_CR11","unstructured":"Lee, K.M., Kwon, J.: A unified framework for event summarization and rare event detection. In: 2012 IEEE Conference on CVPR. IEEE (2012)"},{"issue":"1","key":"1_CR12","doi-asserted-by":"publisher","first-page":"66","DOI":"10.1109\/TMM.2011.2166951","volume":"14","author":"Y Cong","year":"2012","unstructured":"Cong, Y., Yuan, J., Luo, J.: Towards scalable summarization of consumer videos via sparse dictionary selection. IEEE Trans. Multimedia 14(1), 66\u201375 (2012)","journal-title":"IEEE Trans. Multimedia"},{"key":"1_CR13","unstructured":"Ngo, C., Ma, Y., Zhang, H.: Automatic video summarization by graph modeling. In: Proceedings of the Ninth IEEE International Conference on Computer Vision 2003. IEEE (2003)"},{"key":"1_CR14","doi-asserted-by":"crossref","unstructured":"Khosla, A., Hamid, R., Lin, C.J., Sundaresan, N.: Large-scale video summarization using web-image priors. In: Proceedings of the IEEE Conference on CVPR (2013)","DOI":"10.1109\/CVPR.2013.348"},{"key":"1_CR15","doi-asserted-by":"crossref","unstructured":"Kim, G., Sigal, L., Xing, E.: Joint summarization of large-scale collections of web images and videos for storyline reconstruction. In: Proceedings of the IEEE Conference on CVPR (2014)","DOI":"10.1109\/CVPR.2014.538"},{"key":"1_CR16","series-title":"Lecture Notes in Computer Science","doi-asserted-by":"crossref","first-page":"282","DOI":"10.1007\/978-3-319-10602-1_19","volume-title":"Computer Vision \u2013 ECCV 2014","author":"B Xiong","year":"2014","unstructured":"Xiong, B., Grauman, K.: Detecting snap points in egocentric video with a web photo prior. In: Fleet, D., Pajdla, T., Schiele, B., Tuytelaars, T. (eds.) ECCV 2014, Part V. LNCS, vol. 8693, pp. 282\u2013298. Springer, Heidelberg (2014)"},{"key":"1_CR17","doi-asserted-by":"crossref","unstructured":"Chu, W.S., Song, Y., Jaimes, A.: Video co-summarization: video summarization by visual co-occurrence. In: Proceedings of the IEEE Conference on CVPR (2015)","DOI":"10.1109\/CVPR.2015.7298981"},{"key":"1_CR18","unstructured":"Song, Y., Vallmitjana, J., Stent, A., Jaimes, A.: TVSum: summarizing web videos using titles. In: Proceedings of the IEEE Conference on CVPR (2015)"},{"key":"1_CR19","doi-asserted-by":"crossref","unstructured":"Liu, W., Mei, T., Zhang, Y., Che, C., Luo, J.: Multi-task deep visual-semantic embedding for video thumbnail selection. In: Proceedings of the IEEE Conference on CVPR (2015)","DOI":"10.1109\/CVPR.2015.7298994"},{"key":"1_CR20","series-title":"Lecture Notes in Computer Science","doi-asserted-by":"crossref","first-page":"540","DOI":"10.1007\/978-3-319-10599-4_35","volume-title":"Computer Vision \u2013 ECCV 2014","author":"D Potapov","year":"2014","unstructured":"Potapov, D., Douze, M., Harchaoui, Z., Schmid, C.: Category-specific video summarization. In: Fleet, D., Pajdla, T., Schiele, B., Tuytelaars, T. (eds.) ECCV 2014, Part VI. LNCS, vol. 8694, pp. 540\u2013555. Springer, Heidelberg (2014)"},{"key":"1_CR21","series-title":"Lecture Notes in Computer Science","doi-asserted-by":"crossref","first-page":"787","DOI":"10.1007\/978-3-319-10590-1_51","volume-title":"Computer Vision \u2013 ECCV 2014","author":"M Sun","year":"2014","unstructured":"Sun, M., Farhadi, A., Seitz, S.: Ranking domain-specific highlights by analyzing edited videos. In: Fleet, D., Pajdla, T., Schiele, B., Tuytelaars, T. (eds.) ECCV 2014, Part I. LNCS, vol. 8689, pp. 787\u2013802. Springer, Heidelberg (2014)"},{"key":"1_CR22","doi-asserted-by":"crossref","unstructured":"Xu, J., Mukherjee, L., Li, Y., Warner, J., Rehg, J.M., Singh, V.: Gaze-enabled egocentric video summarization via constrained submodular maximization. In: Proceedings of the IEEE Conference on CVPR (2015)","DOI":"10.1109\/CVPR.2015.7298836"},{"key":"1_CR23","series-title":"Lecture Notes in Computer Science","doi-asserted-by":"crossref","first-page":"505","DOI":"10.1007\/978-3-319-10584-0_33","volume-title":"Computer Vision \u2013 ECCV 2014","author":"M Gygli","year":"2014","unstructured":"Gygli, M., Grabner, H., Riemenschneider, H., Van Gool, L.: Creating summaries from user videos. In: Fleet, D., Pajdla, T., Schiele, B., Tuytelaars, T. (eds.) ECCV 2014, Part VII. LNCS, vol. 8695, pp. 505\u2013520. Springer, Heidelberg (2014)"},{"key":"1_CR24","doi-asserted-by":"crossref","unstructured":"Lu, Z., Grauman, K.: Story-driven summarization for egocentric video. In: Proceedings of the IEEE Conference on CVPR (2013)","DOI":"10.1109\/CVPR.2013.350"},{"issue":"1","key":"1_CR25","doi-asserted-by":"publisher","first-page":"38","DOI":"10.1007\/s11263-014-0794-5","volume":"114","author":"YJ Lee","year":"2015","unstructured":"Lee, Y.J., Grauman, K.: Predicting important objects for egocentric video summarization. Int. J. Comput. Vis. 114(1), 38\u201355 (2015)","journal-title":"Int. J. Comput. Vis."},{"issue":"12","key":"1_CR26","doi-asserted-by":"publisher","first-page":"2178","DOI":"10.1109\/TPAMI.2010.31","volume":"32","author":"D Liu","year":"2010","unstructured":"Liu, D., Hua, G., Chen, T.: A hierarchical visual model for video object summarization. IEEE Trans. Pattern Anal. Mach. Intell. 32(12), 2178\u20132190 (2010)","journal-title":"IEEE Trans. Pattern Anal. Mach. Intell."},{"key":"1_CR27","unstructured":"Gong, B., Chao, W.L., Grauman, K., Sha, F.: Diverse sequential subset selection for supervised video summarization. In: Advances in Neural Information Processing Systems, pp. 2069\u20132077 (2014)"},{"key":"1_CR28","doi-asserted-by":"crossref","unstructured":"Gygli, M., Grabner, H., Van Gool, L.: Video summarization by learning submodular mixtures of objectives. In: Proceedings of the IEEE Conference on CVPR (2015)","DOI":"10.1109\/CVPR.2015.7298928"},{"key":"1_CR29","doi-asserted-by":"publisher","first-page":"43","DOI":"10.1007\/978-1-4614-3223-4_3","volume-title":"Mining Text Data","author":"A Nenkova","year":"2012","unstructured":"Nenkova, A., McKeown, K.: A survey of text summarization techniques. In: Aggarwal, C.C., Zhai, C.X. (eds.) Mining Text Data, pp. 43\u201376. Springer, Heidelberg (2012)"},{"issue":"2-3","key":"1_CR30","doi-asserted-by":"crossref","first-page":"123","DOI":"10.1561\/2200000044","volume":"5","author":"Alex Kulesza","year":"2012","unstructured":"Kulesza, A., Taskar, B.: Determinantal point processes for machine learning. arXiv preprint arXiv:1207.6083 (2012)","journal-title":"Foundations and Trends\u00ae in Machine Learning"},{"key":"1_CR31","unstructured":"Ghosh, J., Lee, Y.J., Grauman, K.: Discovering important people and objects for egocentric video summarization. In: 2012 IEEE Conference on CVPR. IEEE (2012)"},{"key":"1_CR32","unstructured":"Yeung, S., Fathi, A., Fei-Fei, L.: Videoset: Video summary evaluation through text. arXiv preprint arXiv:1406.5824 (2014)"},{"key":"1_CR33","doi-asserted-by":"crossref","unstructured":"Daum\u00e9 III., H., Marcu, D.: Bayesian query-focused summarization. In: Proceedings of the 21st International Conference on Computational Linguistics and the 44th Annual Meeting of the Association for Computational Linguistics. Association for Computational Linguistics (2006)","DOI":"10.3115\/1220175.1220214"},{"key":"1_CR34","doi-asserted-by":"crossref","unstructured":"Schilder, F., Kondadadi, R.: Fastsum: fast and accurate query-based multi-document summarization. In: Proceedings of the 46th Annual Meeting of the Association for Computational Linguistics on Human Language Technologies: Short Papers, pp. 205\u2013208. Association for Computational Linguistics (2008)","DOI":"10.3115\/1557690.1557748"},{"key":"1_CR35","doi-asserted-by":"crossref","unstructured":"Gupta, S., Nenkova, A., Jurafsky, D.: Measuring importance and query relevance in topic-focused multi-document summarization. In: Proceedings of the 45th Annual Meeting of the ACL on Interactive Poster and Demonstration Sessions. Association for Computational Linguistics, pp. 193\u2013196 (2007)","DOI":"10.3115\/1557769.1557825"},{"issue":"4","key":"1_CR36","doi-asserted-by":"publisher","first-page":"283","DOI":"10.1016\/j.jvcir.2010.01.007","volume":"21","author":"M Ellouze","year":"2010","unstructured":"Ellouze, M., Boujemaa, N., Alimi, A.M.: IM(S)$$^{2}$$: interactive movie summarization system. J. Vis. Commun. Image Represent. 21(4), 283\u2013294 (2010)","journal-title":"J. Vis. Commun. Image Represent."},{"key":"1_CR37","doi-asserted-by":"crossref","unstructured":"Xiong, B., Kim, G., Sigal, L.: Storyline representation of egocentric videos with an applications to story-based search. In: Proceedings of the IEEE International CVPR (2015)","DOI":"10.1109\/ICCV.2015.514"},{"key":"1_CR38","doi-asserted-by":"crossref","unstructured":"Kulesza, A., Taskar, B.: Learning determinantal point processes. arXiv preprint arXiv:1202.3738 (2012)","DOI":"10.1561\/9781601986290"},{"key":"1_CR39","unstructured":"Chao, W.L., Gong, B., Grauman, K., Sha, F.: Large-margin determinantal point processes. In: Proceedings of the Conference on Uncertainty in Artificial Intelligence (UAI) (2015)"},{"key":"1_CR40","doi-asserted-by":"crossref","unstructured":"Affandi, R.H., Kulesza, A., Fox, E.B.: Markov determinantal point processes. arXiv preprint arXiv:1210.4850 (2012)","DOI":"10.1561\/9781601986290"},{"key":"1_CR41","doi-asserted-by":"crossref","unstructured":"Borth, D., Chen, T., Ji, R., Chang, S.F.: Sentibank: large-scale ontology and classifiers for detecting sentiment and emotions in visual content. In: Proceedings of the 21st ACM International Conference on Multimedia. ACM (2013)","DOI":"10.1145\/2502081.2502268"},{"issue":"3","key":"1_CR42","doi-asserted-by":"publisher","first-page":"145","DOI":"10.1023\/A:1011139631724","volume":"42","author":"A Oliva","year":"2001","unstructured":"Oliva, A., Torralba, A.: Modeling the shape of the scene: a holistic representation of the spatial envelope. Int. J. Comput. Vsion 42(3), 145\u2013175 (2001)","journal-title":"Int. J. Comput. Vsion"},{"issue":"7","key":"1_CR43","doi-asserted-by":"publisher","first-page":"971","DOI":"10.1109\/TPAMI.2002.1017623","volume":"24","author":"T Ojala","year":"2002","unstructured":"Ojala, T., Pietik\u00e4inen, M., M\u00e4enp\u00e4\u00e4, T.: Multiresolution gray-scale and rotation invariant texture classification with local binary patterns. IEEE Trans. Pattern Anal. Mach. Intell. 24(7), 971\u2013987 (2002)","journal-title":"IEEE Trans. Pattern Anal. Mach. Intell."},{"key":"1_CR44","doi-asserted-by":"crossref","unstructured":"Yu, F., Cao, L., Feris, R., Smith, J., Chang, S.F.: Designing category-level attributes for discriminative visual recognition. In: Proceedings of the IEEE Conference on CVPR (2013)","DOI":"10.1109\/CVPR.2013.105"},{"key":"1_CR45","unstructured":"Lin, C.Y.: Rouge: A package for automatic evaluation of summaries. In: Proceedings of the ACL-04 Workshop, Text Summarization Branches Out, vol. 8 (2004)"},{"key":"1_CR46","doi-asserted-by":"crossref","unstructured":"Zhao, B., Xing, E.: Quasi real-time summarization for consumer videos. In: Proceedings of the IEEE Conference on CVPR (2014)","DOI":"10.1109\/CVPR.2014.322"}],"container-title":["Lecture Notes in Computer Science","Computer Vision \u2013 ECCV 2016"],"original-title":[],"language":"en","link":[{"URL":"http:\/\/link.springer.com\/content\/pdf\/10.1007\/978-3-319-46484-8_1","content-type":"unspecified","content-version":"vor","intended-application":"similarity-checking"}],"deposited":{"date-parts":[[2025,6,10]],"date-time":"2025-06-10T19:14:17Z","timestamp":1749582857000},"score":1,"resource":{"primary":{"URL":"http:\/\/link.springer.com\/10.1007\/978-3-319-46484-8_1"}},"subtitle":[],"short-title":[],"issued":{"date-parts":[[2016]]},"ISBN":["9783319464831","9783319464848"],"references-count":46,"URL":"https:\/\/doi.org\/10.1007\/978-3-319-46484-8_1","relation":{},"ISSN":["0302-9743","1611-3349"],"issn-type":[{"value":"0302-9743","type":"print"},{"value":"1611-3349","type":"electronic"}],"subject":[],"published":{"date-parts":[[2016]]},"assertion":[{"value":"17 September 2016","order":1,"name":"first_online","label":"First Online","group":{"name":"ChapterHistory","label":"Chapter History"}},{"value":"ECCV","order":1,"name":"conference_acronym","label":"Conference Acronym","group":{"name":"ConferenceInfo","label":"Conference Information"}},{"value":"European Conference on Computer Vision","order":2,"name":"conference_name","label":"Conference Name","group":{"name":"ConferenceInfo","label":"Conference Information"}},{"value":"Amsterdam","order":3,"name":"conference_city","label":"Conference City","group":{"name":"ConferenceInfo","label":"Conference Information"}},{"value":"The Netherlands","order":4,"name":"conference_country","label":"Conference Country","group":{"name":"ConferenceInfo","label":"Conference Information"}},{"value":"2016","order":5,"name":"conference_year","label":"Conference Year","group":{"name":"ConferenceInfo","label":"Conference Information"}},{"value":"8 October 2016","order":7,"name":"conference_start_date","label":"Conference Start Date","group":{"name":"ConferenceInfo","label":"Conference Information"}},{"value":"16 October 2016","order":8,"name":"conference_end_date","label":"Conference End Date","group":{"name":"ConferenceInfo","label":"Conference Information"}},{"value":"14","order":9,"name":"conference_number","label":"Conference Number","group":{"name":"ConferenceInfo","label":"Conference Information"}},{"value":"eccv2016","order":10,"name":"conference_id","label":"Conference ID","group":{"name":"ConferenceInfo","label":"Conference Information"}},{"value":"http:\/\/www.eccv2016.org\/","order":11,"name":"conference_url","label":"Conference URL","group":{"name":"ConferenceInfo","label":"Conference Information"}},{"value":"This content has been made available to all.","name":"free","label":"Free to read"}]}}