{"status":"ok","message-type":"work","message-version":"1.0.0","message":{"indexed":{"date-parts":[[2025,10,31]],"date-time":"2025-10-31T07:11:15Z","timestamp":1761894675726,"version":"build-2065373602"},"reference-count":49,"publisher":"IEEE","license":[{"start":{"date-parts":[[2025,6,30]],"date-time":"2025-06-30T00:00:00Z","timestamp":1751241600000},"content-version":"stm-asf","delay-in-days":0,"URL":"https:\/\/doi.org\/10.15223\/policy-029"},{"start":{"date-parts":[[2025,6,30]],"date-time":"2025-06-30T00:00:00Z","timestamp":1751241600000},"content-version":"stm-asf","delay-in-days":0,"URL":"https:\/\/doi.org\/10.15223\/policy-037"}],"content-domain":{"domain":[],"crossmark-restriction":false},"short-container-title":[],"published-print":{"date-parts":[[2025,6,30]]},"DOI":"10.1109\/icme59968.2025.11209961","type":"proceedings-article","created":{"date-parts":[[2025,10,30]],"date-time":"2025-10-30T17:57:42Z","timestamp":1761847062000},"page":"1-6","source":"Crossref","is-referenced-by-count":0,"title":["Synopses of Movie Narratives: a Video-Language Dataset for Story Understanding"],"prefix":"10.1109","author":[{"given":"Yidan","family":"Sun","sequence":"first","affiliation":[{"name":"Nanyang Technological University,School of Computer Science and Engineering,Singapore,Singapore"}],"role":[{"role":"author","vocabulary":"crossref"}]},{"given":"Qin","family":"Chao","sequence":"additional","affiliation":[{"name":"Nanyang Technological University,School of Computer Science and Engineering,Singapore,Singapore"}],"role":[{"role":"author","vocabulary":"crossref"}]},{"given":"Yangfeng","family":"Ji","sequence":"additional","affiliation":[{"name":"University of Virginia,Department of Computer Science,Charlottesville,VA,USA"}],"role":[{"role":"author","vocabulary":"crossref"}]},{"given":"Boyang","family":"Li","sequence":"additional","affiliation":[{"name":"Nanyang Technological University,School of Computer Science and Engineering,Singapore,Singapore"}],"role":[{"role":"author","vocabulary":"crossref"}]}],"member":"263","reference":[{"key":"ref1","doi-asserted-by":"crossref","DOI":"10.18653\/v1\/2021.emnlp-main.54","article-title":"Moral stories: Situated reasoning about norms, intents, actions, and their consequences","volume-title":"EMNLP","author":"Emelin"},{"key":"ref2","doi-asserted-by":"crossref","DOI":"10.18653\/v1\/2020.emnlp-main.51","article-title":"Joint constrained learning for event-event relation extraction","volume-title":"EMNLP","author":"Wang"},{"key":"ref3","doi-asserted-by":"publisher","DOI":"10.1609\/aaai.v30i1.10358"},{"article-title":"Frowning frodo, wincing leia, and a seriously great friendship: Learning to classify emotional relationships of fictional characters","volume-title":"NAACL","author":"Kim","key":"ref4"},{"article-title":"Unsupervised learning of narrative event chains","volume-title":"ACL","author":"Chambers","key":"ref5"},{"key":"ref6","doi-asserted-by":"publisher","DOI":"10.1609\/aaai.v30i1.10328"},{"key":"ref7","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR.2016.501"},{"key":"ref8","doi-asserted-by":"publisher","DOI":"10.24963\/ijcai.2017\/280"},{"key":"ref9","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR.2015.7298792"},{"key":"ref10","doi-asserted-by":"publisher","DOI":"10.1007\/s11263-016-0987-1"},{"key":"ref11","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR52688.2022.00497"},{"key":"ref12","doi-asserted-by":"publisher","DOI":"10.18653\/v1\/2023.acl-long.257"},{"key":"ref13","article-title":"The division of labor in society","volume-title":"Social stratification","author":"Durkheim","year":"2018"},{"key":"ref14","doi-asserted-by":"crossref","DOI":"10.1007\/978-3-030-69541-5_28","article-title":"Condensed movies: Story based retrieval with contextual embeddings","volume-title":"ACCV","author":"Bain"},{"key":"ref15","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR46437.2021.00192"},{"key":"ref16","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR.2018.00912"},{"key":"ref17","doi-asserted-by":"publisher","DOI":"10.1109\/tmm.2023.3296944"},{"key":"ref18","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR.2017.686"},{"key":"ref19","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR.2018.00895"},{"article-title":"Computational narrative intelligence: A human-centered goal for artificial intelligence","year":"2016","author":"Riedl","key":"ref20"},{"key":"ref21","doi-asserted-by":"publisher","DOI":"10.1109\/WACV48630.2021.00071"},{"key":"ref22","doi-asserted-by":"publisher","DOI":"10.1109\/TPAMI.2024.3393452"},{"key":"ref23","doi-asserted-by":"publisher","DOI":"10.1007\/978-3-030-58610-2_11"},{"key":"ref24","doi-asserted-by":"publisher","DOI":"10.1007\/978-3-031-19836-6_5"},{"key":"ref25","doi-asserted-by":"crossref","first-page":"375","DOI":"10.4324\/9781315802671","article-title":"Plot units: A narrative summarization strategy","volume-title":"Strategies for natural language processing","author":"Lehnert","year":"2014"},{"key":"ref26","doi-asserted-by":"publisher","DOI":"10.18653\/v1\/P18-1082"},{"key":"ref27","doi-asserted-by":"publisher","DOI":"10.1162\/tacl_a_00553"},{"key":"ref28","doi-asserted-by":"publisher","DOI":"10.18653\/v1\/N16-1147"},{"key":"ref29","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR52729.2023.01815"},{"key":"ref30","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR.2019.00959"},{"key":"ref31","article-title":"Punctuation restoration using transformer models for resource-rich and-poor languages","author":"Alam","year":"2020","journal-title":"W-NUT"},{"key":"ref32","doi-asserted-by":"publisher","DOI":"10.1145\/3664647.3685517"},{"volume-title":"A dictionary of narratology","year":"2003","author":"Prince","key":"ref33"},{"key":"ref34","doi-asserted-by":"publisher","DOI":"10.18653\/v1\/D19-1410"},{"article-title":"Using dynamic time warping to find patterns in time series","volume-title":"KDD workshop","author":"Berndt","key":"ref35"},{"key":"ref36","article-title":"Learning knowledge to support domain-independent narrative intelligence","volume-title":"Ph.D. thesis","author":"Li","year":"2015"},{"key":"ref37","doi-asserted-by":"publisher","DOI":"10.1007\/978-3-031-02147-3"},{"article-title":"Univl: A unified video and language pre-training model for multimodal understanding and generation","year":"2020","author":"Luo","key":"ref38"},{"key":"ref39","doi-asserted-by":"publisher","DOI":"10.18653\/v1\/2023.acl-long.315"},{"key":"ref40","doi-asserted-by":"publisher","DOI":"10.1016\/j.neucom.2022.07.028"},{"article-title":"Blip-2: Bootstrapping language-image pre-training with frozen image encoders and large language models","volume-title":"ICML","author":"Li","key":"ref41"},{"article-title":"Internvid: A large-scale video-text dataset for multimodal understanding and generation","volume-title":"ICLR","author":"Wang","key":"ref42"},{"key":"ref43","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR.2015.7299087"},{"key":"ref44","doi-asserted-by":"crossref","DOI":"10.3115\/1073083.1073135","article-title":"Bleu: a method for automatic evaluation of machine translation","volume-title":"ACL","author":"Papineni"},{"article-title":"Bertscore: Evaluating text generation with BERT","volume-title":"ICLR","author":"Zhang","key":"ref45"},{"article-title":"Gpt-4 technical report","year":"2023","author":"Achiam","key":"ref46"},{"article-title":"Instructblip: Towards general-purpose vision-language models with instruction tuning","volume-title":"NeurIPS","author":"Dai","key":"ref47"},{"key":"ref48","doi-asserted-by":"publisher","DOI":"10.1007\/s11432-024-4231-5"},{"key":"ref49","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR52729.2023.01032"}],"event":{"name":"2025 IEEE International Conference on Multimedia and Expo (ICME)","start":{"date-parts":[[2025,6,30]]},"location":"Nantes, France","end":{"date-parts":[[2025,7,4]]}},"container-title":["2025 IEEE International Conference on Multimedia and Expo (ICME)"],"original-title":[],"link":[{"URL":"http:\/\/xplorestaging.ieee.org\/ielx8\/11208895\/11208897\/11209961.pdf?arnumber=11209961","content-type":"unspecified","content-version":"vor","intended-application":"similarity-checking"}],"deposited":{"date-parts":[[2025,10,31]],"date-time":"2025-10-31T05:33:11Z","timestamp":1761888791000},"score":1,"resource":{"primary":{"URL":"https:\/\/ieeexplore.ieee.org\/document\/11209961\/"}},"subtitle":[],"short-title":[],"issued":{"date-parts":[[2025,6,30]]},"references-count":49,"URL":"https:\/\/doi.org\/10.1109\/icme59968.2025.11209961","relation":{},"subject":[],"published":{"date-parts":[[2025,6,30]]}}}