{"status":"ok","message-type":"work","message-version":"1.0.0","message":{"indexed":{"date-parts":[[2025,1,17]],"date-time":"2025-01-17T09:18:43Z","timestamp":1737105523051,"version":"3.33.0"},"reference-count":12,"publisher":"IEEE","license":[{"start":{"date-parts":[[2024,12,15]],"date-time":"2024-12-15T00:00:00Z","timestamp":1734220800000},"content-version":"stm-asf","delay-in-days":0,"URL":"https:\/\/doi.org\/10.15223\/policy-029"},{"start":{"date-parts":[[2024,12,15]],"date-time":"2024-12-15T00:00:00Z","timestamp":1734220800000},"content-version":"stm-asf","delay-in-days":0,"URL":"https:\/\/doi.org\/10.15223\/policy-037"}],"content-domain":{"domain":[],"crossmark-restriction":false},"short-container-title":[],"published-print":{"date-parts":[[2024,12,15]]},"DOI":"10.1109\/bigdata62323.2024.10825527","type":"proceedings-article","created":{"date-parts":[[2025,1,16]],"date-time":"2025-01-16T18:31:23Z","timestamp":1737052283000},"page":"3204-3207","source":"Crossref","is-referenced-by-count":0,"title":["Musical Scene Detection in Comics: Comparing Perception of Humans and GPT-4"],"prefix":"10.1109","author":[{"given":"Megha","family":"Sharma","sequence":"first","affiliation":[{"name":"The University of Tokyo,Department of ICE,Tokyo,Japan"}]},{"given":"Muhammad Taimoor","family":"Haseeb","sequence":"additional","affiliation":[{"name":"Music X Lab MBZUAI,Abu Dhabi,UAE"}]},{"given":"Gus","family":"Xia","sequence":"additional","affiliation":[{"name":"Music X Lab MBZUAI,Abu Dhabi,UAE"}]},{"given":"Yoshimasa","family":"Tsuruoka","sequence":"additional","affiliation":[{"name":"The University of Tokyo,Department of ICE,Tokyo,Japan"}]}],"member":"263","reference":[{"key":"ref1","doi-asserted-by":"publisher","DOI":"10.1007\/978-3-030-58621-8_44"},{"key":"ref2","doi-asserted-by":"publisher","DOI":"10.1109\/ICASSP48485.2024.10447950"},{"key":"ref3","doi-asserted-by":"publisher","DOI":"10.1109\/TCIAIG.2012.2212899"},{"article-title":"M2m-gen: A multimodal framework for automated background music generation in japanese manga using large language models","year":"2024","author":"Sharma","key":"ref4"},{"key":"ref5","doi-asserted-by":"publisher","DOI":"10.1016\/j.actpsy.2014.03.003"},{"key":"ref6","doi-asserted-by":"publisher","DOI":"10.1023\/A:1007506220214"},{"key":"ref7","doi-asserted-by":"publisher","DOI":"10.1162\/089120102317341756"},{"key":"ref8","doi-asserted-by":"publisher","DOI":"10.1007\/s11042-016-4020-z"},{"key":"ref9","doi-asserted-by":"publisher","DOI":"10.1109\/MMUL.2020.2987895"},{"key":"ref10","doi-asserted-by":"publisher","DOI":"10.1109\/icme57554.2024.10687709"},{"volume-title":"The Anime Sound: An Analytical and Semiotic Study of Contemporary Anime Music.","year":"2023","author":"Rodrigues","key":"ref11"},{"key":"ref12","first-page":"301","article-title":"De-centering the west: East asian philosophies and the ethics of applying artificial intelligence to music","author":"Huang","year":"2021","journal-title":"ISMIR"}],"event":{"name":"2024 IEEE International Conference on Big Data (BigData)","start":{"date-parts":[[2024,12,15]]},"location":"Washington, DC, USA","end":{"date-parts":[[2024,12,18]]}},"container-title":["2024 IEEE International Conference on Big Data (BigData)"],"original-title":[],"link":[{"URL":"http:\/\/xplorestaging.ieee.org\/ielx8\/10824975\/10824942\/10825527.pdf?arnumber=10825527","content-type":"unspecified","content-version":"vor","intended-application":"similarity-checking"}],"deposited":{"date-parts":[[2025,1,17]],"date-time":"2025-01-17T08:28:19Z","timestamp":1737102499000},"score":1,"resource":{"primary":{"URL":"https:\/\/ieeexplore.ieee.org\/document\/10825527\/"}},"subtitle":[],"short-title":[],"issued":{"date-parts":[[2024,12,15]]},"references-count":12,"URL":"https:\/\/doi.org\/10.1109\/bigdata62323.2024.10825527","relation":{},"subject":[],"published":{"date-parts":[[2024,12,15]]}}}