{"status":"ok","message-type":"work","message-version":"1.0.0","message":{"indexed":{"date-parts":[[2025,11,27]],"date-time":"2025-11-27T06:46:47Z","timestamp":1764226007869,"version":"3.28.0"},"reference-count":30,"publisher":"IEEE","license":[{"start":{"date-parts":[[2024,7,15]],"date-time":"2024-07-15T00:00:00Z","timestamp":1721001600000},"content-version":"stm-asf","delay-in-days":0,"URL":"https:\/\/doi.org\/10.15223\/policy-029"},{"start":{"date-parts":[[2024,7,15]],"date-time":"2024-07-15T00:00:00Z","timestamp":1721001600000},"content-version":"stm-asf","delay-in-days":0,"URL":"https:\/\/doi.org\/10.15223\/policy-037"}],"funder":[{"DOI":"10.13039\/501100001809","name":"National Natural Science Foundation of China","doi-asserted-by":"publisher","award":["62272409"],"award-info":[{"award-number":["62272409"]}],"id":[{"id":"10.13039\/501100001809","id-type":"DOI","asserted-by":"publisher"}]}],"content-domain":{"domain":[],"crossmark-restriction":false},"short-container-title":[],"published-print":{"date-parts":[[2024,7,15]]},"DOI":"10.1109\/icmew63481.2024.10645427","type":"proceedings-article","created":{"date-parts":[[2024,8,29]],"date-time":"2024-08-29T17:43:36Z","timestamp":1724953416000},"page":"1-6","source":"Crossref","is-referenced-by-count":3,"title":["Popular Hooks: A Multimodal Dataset of Musical Hooks for Music Understanding and Generation"],"prefix":"10.1109","author":[{"given":"Xinda","family":"Wu","sequence":"first","affiliation":[{"name":"College of Computer Science and Technology, Zhejiang University,Hangzhou,China"}]},{"given":"Jiaming","family":"Wang","sequence":"additional","affiliation":[{"name":"College of Computer Science and Technology, Zhejiang University,Hangzhou,China"}]},{"given":"Jiaxing","family":"Yu","sequence":"additional","affiliation":[{"name":"College of Computer Science and Technology, Zhejiang University,Hangzhou,China"}]},{"given":"Tieyao","family":"Zhang","sequence":"additional","affiliation":[{"name":"College of Computer Science and Technology, Zhejiang University,Hangzhou,China"}]},{"given":"Kejun","family":"Zhang","sequence":"additional","affiliation":[{"name":"College of Computer Science and Technology, Zhejiang University,Hangzhou,China"}]}],"member":"263","reference":[{"doi-asserted-by":"publisher","key":"ref1","DOI":"10.1007\/978-3-030-69808-9"},{"doi-asserted-by":"publisher","key":"ref2","DOI":"10.1109\/ICCV51070.2023.01433"},{"key":"ref3","article-title":"Songdriver2: Real-time emotion-based music arrangement with soft transition","author":"Wang","year":"2023","journal-title":"arXiv preprint"},{"key":"ref4","article-title":"M2UGen: Multi-modal Music Understanding and Generation with the Power of Large Language Models","author":"Hussain","year":"2023","journal-title":"arXiv preprint"},{"volume-title":"International Society for Music Information Retrieval Conference","author":"Hung","article-title":"Emopia: A multi-modal pop piano dataset for emotion recognition and emotion-based music generation","key":"ref5"},{"doi-asserted-by":"publisher","key":"ref6","DOI":"10.1109\/ICASSP49357.2023.10096956"},{"key":"ref7","first-page":"28492","article-title":"Robust speech recognition via large-scale weak super-vision","volume-title":"International Conference on Machine Learning","author":"Radford"},{"doi-asserted-by":"publisher","key":"ref8","DOI":"10.1037\/h0077714"},{"volume-title":"International Society for Music Information Retrieval Conference, 2020","author":"Wang","article-title":"Pop909: A pop-song dataset for music arrangement generation","key":"ref9"},{"volume-title":"Learning-based methods for comparing sequences, with applications to audio-to-midi alignment and matching","year":"2016","author":"Raffel","key":"ref10"},{"key":"ref11","article-title":"Melodyglm: Multi-task pre-training for symbolic melody generation","author":"Wu","year":"2023","journal-title":"arXiv preprint"},{"doi-asserted-by":"publisher","key":"ref12","DOI":"10.1109\/TMM.2018.2856090"},{"key":"ref13","article-title":"Midibert-piano: large-scale pre-training for symbolic music understanding","author":"Chou","year":"2021","journal-title":"arXiv preprint"},{"doi-asserted-by":"publisher","key":"ref14","DOI":"10.18653\/v1\/2021.findings-acl.70"},{"key":"ref15","article-title":"Wuyun: exploring hierarchical skeleton-guided melody generation using knowledge-enhanced deep learning","author":"Zhang","year":"2023","journal-title":"arXiv preprint"},{"issue":"1","key":"ref16","doi-asserted-by":"crossref","first-page":"1","DOI":"10.1145\/3597493","article-title":"A survey on deep learning for symbolic music generation: Representations, algorithms, evaluations, and challenges","volume":"56","author":"Ji","year":"2023","journal-title":"ACM Computing Surveys"},{"doi-asserted-by":"publisher","key":"ref17","DOI":"10.1109\/ICMLA.2018.00114"},{"key":"ref18","article-title":"Modeling the rhythm from lyrics for melody generation of pop songs","volume-title":"International Society for Music Information Retrieval Conference","author":"Zhang","year":"2022"},{"doi-asserted-by":"publisher","key":"ref19","DOI":"10.1109\/TMM.2023.3276177"},{"key":"ref20","first-page":"10078","article-title":"Videomae: Masked autoen-coders are data-efficient learners for self-supervised video pre-training","volume":"35","author":"Tong","year":"2022","journal-title":"Advances in neural information processing systems"},{"doi-asserted-by":"publisher","key":"ref21","DOI":"10.1007\/s11042-020-08836-3"},{"doi-asserted-by":"publisher","key":"ref22","DOI":"10.1109\/TAFFC.2021.3101563"},{"doi-asserted-by":"publisher","key":"ref23","DOI":"10.1371\/journal.pone.0173392"},{"doi-asserted-by":"publisher","key":"ref24","DOI":"10.18653\/v1\/P19-1493"},{"doi-asserted-by":"publisher","key":"ref25","DOI":"10.18653\/v1\/E17-2092"},{"doi-asserted-by":"publisher","key":"ref26","DOI":"10.18653\/v1\/N16-1066"},{"doi-asserted-by":"publisher","key":"ref27","DOI":"10.1093\/hcr\/30.3.411"},{"key":"ref28","article-title":"Midi miner-a python library for tonal tension and track classification","author":"Guo","year":"2019","journal-title":"arXiv preprint"},{"doi-asserted-by":"publisher","key":"ref29","DOI":"10.1609\/aaai.v35i1.16091"},{"doi-asserted-by":"publisher","key":"ref30","DOI":"10.1145\/3394171.3413721"}],"event":{"name":"2024 IEEE International Conference on Multimedia and Expo Workshops (ICMEW)","start":{"date-parts":[[2024,7,15]]},"location":"Niagara Falls, ON, Canada","end":{"date-parts":[[2024,7,19]]}},"container-title":["2024 IEEE International Conference on Multimedia and Expo Workshops (ICMEW)"],"original-title":[],"link":[{"URL":"http:\/\/xplorestaging.ieee.org\/ielx8\/10645349\/10645352\/10645427.pdf?arnumber=10645427","content-type":"unspecified","content-version":"vor","intended-application":"similarity-checking"}],"deposited":{"date-parts":[[2024,9,3]],"date-time":"2024-09-03T04:47:25Z","timestamp":1725338845000},"score":1,"resource":{"primary":{"URL":"https:\/\/ieeexplore.ieee.org\/document\/10645427\/"}},"subtitle":[],"short-title":[],"issued":{"date-parts":[[2024,7,15]]},"references-count":30,"URL":"https:\/\/doi.org\/10.1109\/icmew63481.2024.10645427","relation":{},"subject":[],"published":{"date-parts":[[2024,7,15]]}}}