{"status":"ok","message-type":"work","message-version":"1.0.0","message":{"indexed":{"date-parts":[[2024,10,30]],"date-time":"2024-10-30T00:58:11Z","timestamp":1730249891477,"version":"3.28.0"},"reference-count":18,"publisher":"IEEE","content-domain":{"domain":[],"crossmark-restriction":false},"short-container-title":[],"published-print":{"date-parts":[[2018,7]]},"DOI":"10.1109\/icme.2018.8486496","type":"proceedings-article","created":{"date-parts":[[2018,10,11]],"date-time":"2018-10-11T22:34:18Z","timestamp":1539297258000},"page":"1-6","source":"Crossref","is-referenced-by-count":4,"title":["Seethevoice: Learning from Music to Visual Storytelling of Shots"],"prefix":"10.1109","author":[{"given":"Wen-Li","family":"Wei","sequence":"first","affiliation":[]},{"given":"Jen-Chun","family":"Lin","sequence":"additional","affiliation":[]},{"given":"Tyng-Luh","family":"Liu","sequence":"additional","affiliation":[]},{"given":"Yi-Hsuan","family":"Yang","sequence":"additional","affiliation":[]},{"given":"Hsin-Min","family":"Wang","sequence":"additional","affiliation":[]},{"given":"Hsiao-Rong","family":"Tyan","sequence":"additional","affiliation":[]},{"given":"Hong-Yuan","family":"Mark Liao","sequence":"additional","affiliation":[]}],"member":"263","reference":[{"key":"ref10","doi-asserted-by":"publisher","DOI":"10.1162\/neco.1997.9.8.1735"},{"journal-title":"The Art of the Storyboard A filmmaker's introduction","year":"2008","author":"hart","key":"ref11"},{"key":"ref12","doi-asserted-by":"publisher","DOI":"10.1145\/2964284.2964292"},{"key":"ref13","first-page":"387","article-title":"Eval-uation of algorithms using games: The case of music tagging","author":"law","year":"2009","journal-title":"Proc ISMIR"},{"key":"ref14","doi-asserted-by":"publisher","DOI":"10.1016\/S0167-8655(01)00080-0"},{"key":"ref15","first-page":"1383","article-title":"Deep-net fusion to classify shots in concert videos","year":"2017","journal-title":"Proc ICASSP"},{"key":"ref16","first-page":"1","article-title":"Survey on audiovisual emotion recognition: databases, features, and data fusion strategies","volume":"3","year":"2014","journal-title":"APSIPA TSIP"},{"key":"ref17","doi-asserted-by":"publisher","DOI":"10.1109\/ICPR.2016.7900006"},{"journal-title":"The HTK Book Version 3 4","year":"2006","author":"young","key":"ref18"},{"journal-title":"Digital overdrive Communications & multimedia technology","year":"2011","author":"andrews","key":"ref4"},{"key":"ref3","doi-asserted-by":"publisher","DOI":"10.1109\/TCSVT.2015.2416554"},{"key":"ref6","doi-asserted-by":"publisher","DOI":"10.1017\/S0140525X08005293"},{"journal-title":"The filmmaker's eye Learning (and breaking) the rules of cinematic composition Taylor & Francis","year":"2010","author":"mercado","key":"ref5"},{"key":"ref8","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR.2015.7298878"},{"key":"ref7","doi-asserted-by":"publisher","DOI":"10.1109\/ICCV.2015.515"},{"key":"ref2","doi-asserted-by":"publisher","DOI":"10.1145\/2393347.2393373"},{"key":"ref1","doi-asserted-by":"publisher","DOI":"10.1145\/1873951.1874023"},{"key":"ref9","doi-asserted-by":"publisher","DOI":"10.3115\/v1\/N15-1173"}],"event":{"name":"2018 IEEE International Conference on Multimedia and Expo (ICME)","start":{"date-parts":[[2018,7,23]]},"location":"San Diego, CA","end":{"date-parts":[[2018,7,27]]}},"container-title":["2018 IEEE International Conference on Multimedia and Expo (ICME)"],"original-title":[],"link":[{"URL":"http:\/\/xplorestaging.ieee.org\/ielx7\/8472825\/8486434\/08486496.pdf?arnumber=8486496","content-type":"unspecified","content-version":"vor","intended-application":"similarity-checking"}],"deposited":{"date-parts":[[2020,2,7]],"date-time":"2020-02-07T07:58:32Z","timestamp":1581062312000},"score":1,"resource":{"primary":{"URL":"https:\/\/ieeexplore.ieee.org\/document\/8486496\/"}},"subtitle":[],"short-title":[],"issued":{"date-parts":[[2018,7]]},"references-count":18,"URL":"https:\/\/doi.org\/10.1109\/icme.2018.8486496","relation":{},"subject":[],"published":{"date-parts":[[2018,7]]}}}