{"status":"ok","message-type":"work","message-version":"1.0.0","message":{"indexed":{"date-parts":[[2026,4,23]],"date-time":"2026-04-23T17:10:35Z","timestamp":1776964235346,"version":"3.51.4"},"reference-count":65,"publisher":"Institute of Electrical and Electronics Engineers (IEEE)","license":[{"start":{"date-parts":[[2023,1,1]],"date-time":"2023-01-01T00:00:00Z","timestamp":1672531200000},"content-version":"vor","delay-in-days":0,"URL":"https:\/\/ieeexplore.ieee.org\/Xplorehelp\/downloads\/license-information\/IEEE.html"},{"start":{"date-parts":[[2023,1,1]],"date-time":"2023-01-01T00:00:00Z","timestamp":1672531200000},"content-version":"stm-asf","delay-in-days":0,"URL":"https:\/\/doi.org\/10.15223\/policy-029"},{"start":{"date-parts":[[2023,1,1]],"date-time":"2023-01-01T00:00:00Z","timestamp":1672531200000},"content-version":"stm-asf","delay-in-days":0,"URL":"https:\/\/doi.org\/10.15223\/policy-037"}],"funder":[{"DOI":"10.13039\/501100001809","name":"National Natural Science Foundation of China","doi-asserted-by":"publisher","award":["62132012"],"award-info":[{"award-number":["62132012"]}],"id":[{"id":"10.13039\/501100001809","id-type":"DOI","asserted-by":"publisher"}]},{"DOI":"10.13039\/501100001809","name":"National Natural Science Foundation of China","doi-asserted-by":"publisher","award":["61972216"],"award-info":[{"award-number":["61972216"]}],"id":[{"id":"10.13039\/501100001809","id-type":"DOI","asserted-by":"publisher"}]}],"content-domain":{"domain":[],"crossmark-restriction":false},"short-container-title":["IEEE Trans. Multimedia"],"published-print":{"date-parts":[[2023]]},"DOI":"10.1109\/tmm.2022.3183394","type":"journal-article","created":{"date-parts":[[2022,6,15]],"date-time":"2022-06-15T20:02:52Z","timestamp":1655323372000},"page":"4894-4908","source":"Crossref","is-referenced-by-count":18,"title":["Multimodal-Based and Aesthetic-Guided Narrative Video Summarization"],"prefix":"10.1109","volume":"25","author":[{"ORCID":"https:\/\/orcid.org\/0000-0001-9003-1975","authenticated-orcid":false,"given":"Jiehang","family":"Xie","sequence":"first","affiliation":[{"name":"TKLNDST, CS, Nankai University, Nankai, China"}]},{"given":"Xuanbai","family":"Chen","sequence":"additional","affiliation":[{"name":"TKLNDST, CS, Nankai University, Nankai, China"}]},{"ORCID":"https:\/\/orcid.org\/0000-0001-6293-881X","authenticated-orcid":false,"given":"Tianyi","family":"Zhang","sequence":"additional","affiliation":[{"name":"Centrum Wiskunde and Informatica, Amsterdam, Netherlands"}]},{"given":"Yixuan","family":"Zhang","sequence":"additional","affiliation":[{"name":"TKLNDST, CS, Nankai University, Nankai, China"}]},{"ORCID":"https:\/\/orcid.org\/0000-0002-8492-0925","authenticated-orcid":false,"given":"Shao-Ping","family":"Lu","sequence":"additional","affiliation":[{"name":"TKLNDST, CS, Nankai University, Nankai, China"}]},{"ORCID":"https:\/\/orcid.org\/0000-0003-1752-6837","authenticated-orcid":false,"given":"Pablo","family":"Cesar","sequence":"additional","affiliation":[{"name":"Centrum Wiskunde and Informatica, Amsterdam, Netherlands"}]},{"given":"Yulu","family":"Yang","sequence":"additional","affiliation":[{"name":"TKLNDST, CS, Nankai University, Nankai, China"}]}],"member":"263","reference":[{"key":"ref1","doi-asserted-by":"publisher","DOI":"10.1109\/TMM.2019.2930041"},{"key":"ref2","doi-asserted-by":"publisher","DOI":"10.1109\/TKDE.2018.2848260"},{"key":"ref3","doi-asserted-by":"publisher","DOI":"10.1109\/ICCV48922.2021.00174"},{"key":"ref4","doi-asserted-by":"publisher","DOI":"10.1109\/TIE.2019.2931283"},{"key":"ref5","doi-asserted-by":"publisher","DOI":"10.1109\/TMM.2017.2708981"},{"key":"ref6","doi-asserted-by":"publisher","DOI":"10.1145\/2984511.2984569"},{"key":"ref7","first-page":"39","article-title":"Summarizing videos with attention","volume-title":"Proc. Asian Conf. Comput. Vis","author":"Fajtl","year":"2018"},{"key":"ref8","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR.2018.00773"},{"issue":"6","key":"ref9","doi-asserted-by":"crossref","first-page":"1","DOI":"10.1145\/3355398","article-title":"Survey of compressed domain video summarization techniques","volume":"52","author":"Basavarajaiah","year":"2019","journal-title":"ACM Comput. Surv."},{"key":"ref10","doi-asserted-by":"publisher","DOI":"10.1109\/TITS.2019.2929618"},{"key":"ref11","doi-asserted-by":"publisher","DOI":"10.1145\/2733373.2806386"},{"key":"ref12","doi-asserted-by":"publisher","DOI":"10.1109\/TMM.2017.2705915"},{"key":"ref13","doi-asserted-by":"publisher","DOI":"10.1109\/TIP.2020.3039886"},{"key":"ref14","doi-asserted-by":"publisher","DOI":"10.1109\/TPAMI.2016.2623699"},{"issue":"7","key":"ref15","first-page":"1218","article-title":"Timeline editing of objects in video","volume":"19","author":"Lu","year":"2012","journal-title":"IEEE Trans. Vis. Comput. Graph."},{"key":"ref16","doi-asserted-by":"publisher","DOI":"10.1109\/TNNLS.2019.2951680"},{"key":"ref17","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR.2019.00778"},{"key":"ref18","doi-asserted-by":"publisher","DOI":"10.1609\/aaai.v32i1.12255"},{"key":"ref19","doi-asserted-by":"publisher","DOI":"10.1109\/TMM.2019.2959451"},{"key":"ref20","doi-asserted-by":"publisher","DOI":"10.1007\/978-3-030-01237-3_24"},{"key":"ref21","doi-asserted-by":"publisher","DOI":"10.1145\/2822907"},{"key":"ref22","doi-asserted-by":"publisher","DOI":"10.18653\/v1\/P19-1099"},{"key":"ref23","doi-asserted-by":"publisher","DOI":"10.18653\/v1\/2020.acl-main.125"},{"key":"ref24","doi-asserted-by":"publisher","DOI":"10.18653\/v1\/2020.acl-main.556"},{"key":"ref25","doi-asserted-by":"publisher","DOI":"10.18653\/v1\/2020.acl-main.451"},{"key":"ref26","doi-asserted-by":"publisher","DOI":"10.1145\/2642918.2647400"},{"key":"ref27","first-page":"1","article-title":"Coot: Cooperative hierarchical transformer for video-text representation learning","volume-title":"Proc. Adv. Neural Inf. Process. Syst.","author":"Ging","year":"2020"},{"key":"ref28","doi-asserted-by":"publisher","DOI":"10.1145\/3394171.3414053"},{"key":"ref29","doi-asserted-by":"publisher","DOI":"10.1145\/3394171.3413841"},{"key":"ref30","doi-asserted-by":"publisher","DOI":"10.1609\/aaai.v33i01.33018199"},{"key":"ref31","doi-asserted-by":"publisher","DOI":"10.1609\/aaai.v33i01.33019062"},{"key":"ref32","doi-asserted-by":"publisher","DOI":"10.1109\/TPAMI.2018.2852750"},{"key":"ref33","doi-asserted-by":"publisher","DOI":"10.18653\/v1\/2020.acl-main.585"},{"key":"ref34","first-page":"2520","article-title":"The excitement of sports: Automatic highlights using audio\/visual cues","volume-title":"Proc. IEEE Conf. Comput.Vis. Pattern Recognit","author":"Merler","year":"2018"},{"key":"ref35","doi-asserted-by":"publisher","DOI":"10.1109\/TMM.2021.3087001"},{"key":"ref36","doi-asserted-by":"publisher","DOI":"10.1109\/TMM.2018.2876046"},{"key":"ref37","doi-asserted-by":"publisher","DOI":"10.1609\/aaai.v31i1.10754"},{"key":"ref38","doi-asserted-by":"publisher","DOI":"10.1109\/ICME51207.2021.9428252"},{"key":"ref39","doi-asserted-by":"publisher","DOI":"10.1109\/TMM.2015.2428998"},{"key":"ref40","doi-asserted-by":"publisher","DOI":"10.1145\/2659520"},{"key":"ref41","doi-asserted-by":"publisher","DOI":"10.1109\/TCSVT.2012.2189689"},{"key":"ref42","doi-asserted-by":"publisher","DOI":"10.1145\/3290605.3300311"},{"key":"ref43","doi-asserted-by":"publisher","DOI":"10.1145\/3355089.3356520"},{"key":"ref44","doi-asserted-by":"publisher","DOI":"10.1109\/BigMM.2017.19"},{"key":"ref45","doi-asserted-by":"publisher","DOI":"10.1145\/3394171.3413498"},{"key":"ref46","volume-title":"Introduction to Information Retrieval","volume":"39","author":"Schtze","year":"2008"},{"key":"ref47","doi-asserted-by":"publisher","DOI":"10.18653\/v1\/P19-1100"},{"key":"ref48","first-page":"6000","article-title":"Attention is all you need","volume-title":"Proc. Adv. Neural Inf. Process. Syst.","author":"Vaswani","year":"2017"},{"key":"ref49","doi-asserted-by":"publisher","DOI":"10.18653\/v1\/P18-1063"},{"key":"ref50","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR42600.2020.01082"},{"key":"ref51","first-page":"1","article-title":"Compositional attention networks for machine reasoning","volume-title":"Proc. Int. Conf. Learn. Representations","author":"Hudson","year":"2018"},{"key":"ref52","first-page":"1","article-title":"Hadamard product for low-rank bilinear pooling","volume-title":"Proc. Int. Conf. Learn. Representations","author":"Kim","year":"2017"},{"key":"ref53","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR.2018.00813"},{"key":"ref54","doi-asserted-by":"publisher","DOI":"10.1007\/11744023_32"},{"key":"ref55","doi-asserted-by":"publisher","DOI":"10.21105\/joss.02154"},{"key":"ref56","doi-asserted-by":"publisher","DOI":"10.1109\/ICASSP40776.2020.9053512"},{"key":"ref57","first-page":"5179","article-title":"Tvsum: Summarizing web videos using titles","volume-title":"Proc. IEEE Conf. Comput.Vis. Pattern Recognit","author":"Song","year":"2015"},{"key":"ref58","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR.2015.7298940"},{"key":"ref59","doi-asserted-by":"publisher","DOI":"10.1007\/978-3-030-01258-8_22"},{"key":"ref60","doi-asserted-by":"publisher","DOI":"10.1016\/j.neucom.2021.10.039"},{"key":"ref61","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR.2019.00809"},{"key":"ref62","doi-asserted-by":"publisher","DOI":"10.18653\/v1\/K16-1028"},{"key":"ref63","doi-asserted-by":"publisher","DOI":"10.1109\/ICCV.2017.563"},{"key":"ref64","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR.2017.502"},{"key":"ref65","article-title":"Subjective video quality assessment methods for multimedia applications","year":"2008"}],"container-title":["IEEE Transactions on Multimedia"],"original-title":[],"link":[{"URL":"http:\/\/xplorestaging.ieee.org\/ielx7\/6046\/10016790\/09797228.pdf?arnumber=9797228","content-type":"unspecified","content-version":"vor","intended-application":"similarity-checking"}],"deposited":{"date-parts":[[2024,1,11]],"date-time":"2024-01-11T23:44:27Z","timestamp":1705016667000},"score":1,"resource":{"primary":{"URL":"https:\/\/ieeexplore.ieee.org\/document\/9797228\/"}},"subtitle":[],"short-title":[],"issued":{"date-parts":[[2023]]},"references-count":65,"URL":"https:\/\/doi.org\/10.1109\/tmm.2022.3183394","relation":{},"ISSN":["1520-9210","1941-0077"],"issn-type":[{"value":"1520-9210","type":"print"},{"value":"1941-0077","type":"electronic"}],"subject":[],"published":{"date-parts":[[2023]]}}}