{"status":"ok","message-type":"work","message-version":"1.0.0","message":{"indexed":{"date-parts":[[2026,4,7]],"date-time":"2026-04-07T16:19:15Z","timestamp":1775578755807,"version":"3.50.1"},"publisher-location":"New York, NY, USA","reference-count":47,"publisher":"ACM","license":[{"start":{"date-parts":[[2021,10,17]],"date-time":"2021-10-17T00:00:00Z","timestamp":1634428800000},"content-version":"vor","delay-in-days":0,"URL":"https:\/\/www.acm.org\/publications\/policies\/copyright_policy#Background"}],"funder":[{"name":"Ministry of Education (Singapore)","award":["MOE2018-T2-2-161"],"award-info":[{"award-number":["MOE2018-T2-2-161"]}]},{"DOI":"10.13039\/501100001348","name":"Agency for Science, Technology and Research (A*STAR)","doi-asserted-by":"publisher","award":["SING-2018-02-0204"],"award-info":[{"award-number":["SING-2018-02-0204"]}],"id":[{"id":"10.13039\/501100001348","id-type":"DOI","asserted-by":"publisher"}]},{"name":"Singapore University of Technology and Design","award":["SRG ISTD 2017 129"],"award-info":[{"award-number":["SRG ISTD 2017 129"]}]}],"content-domain":{"domain":["dl.acm.org"],"crossmark-restriction":true},"short-container-title":[],"published-print":{"date-parts":[[2021,10,17]]},"DOI":"10.1145\/3474085.3475405","type":"proceedings-article","created":{"date-parts":[[2021,10,18]],"date-time":"2021-10-18T06:21:10Z","timestamp":1634538070000},"page":"3918-3926","update-policy":"https:\/\/doi.org\/10.1145\/crossmark-policy","source":"Crossref","is-referenced-by-count":25,"title":["ReconVAT: A Semi-Supervised Automatic Music Transcription Framework for Low-Resource Real-World Data"],"prefix":"10.1145","author":[{"given":"Kin Wai","family":"Cheuk","sequence":"first","affiliation":[{"name":"Singapore University of Technology and Design, Singapore, Singapore"}]},{"given":"Dorien","family":"Herremans","sequence":"additional","affiliation":[{"name":"Singapore University of Technology and Design, Singapore, Singapore"}]},{"given":"Li","family":"Su","sequence":"additional","affiliation":[{"name":"Academia Sinica, Taiwan, Taiwan Roc"}]}],"member":"320","published-online":{"date-parts":[[2021,10,17]]},"reference":[{"key":"e_1_3_2_2_1_1","doi-asserted-by":"publisher","DOI":"10.5555\/3045390.3045410"},{"key":"e_1_3_2_2_2_1","unstructured":"Mert Bay Andreas F Ehmann and J Stephen Downie. 2009. Evaluation of Multiple-F0 Estimation and Tracking Systems. In ISMIR. 315--320.  Mert Bay Andreas F Ehmann and J Stephen Downie. 2009. Evaluation of Multiple-F0 Estimation and Tracking Systems. In ISMIR. 315--320."},{"key":"e_1_3_2_2_3_1","doi-asserted-by":"publisher","DOI":"10.1109\/MSP.2018.2869928"},{"key":"e_1_3_2_2_4_1","doi-asserted-by":"publisher","DOI":"10.1007\/s10844-013-0258-3"},{"key":"e_1_3_2_2_5_1","doi-asserted-by":"publisher","DOI":"10.5555\/2968826.2968998"},{"key":"e_1_3_2_2_6_1","doi-asserted-by":"publisher","DOI":"10.1109\/WASPAA.2017.8170013"},{"key":"e_1_3_2_2_8_1","doi-asserted-by":"publisher","DOI":"10.1109\/ICASSP.2016.7472621"},{"key":"e_1_3_2_2_9_1","doi-asserted-by":"publisher","DOI":"10.1145\/502585.502625"},{"key":"e_1_3_2_2_10_1","doi-asserted-by":"publisher","DOI":"10.18653\/v1\/2020.acl-main.777"},{"key":"e_1_3_2_2_11_1","doi-asserted-by":"publisher","DOI":"10.1109\/ACCESS.2020.3019084"},{"key":"e_1_3_2_2_12_1","volume-title":"International Conference on Pattern Recognition (ICPR). IEEE","author":"Cheuk Kin Wai","year":"2020"},{"key":"e_1_3_2_2_13_1","doi-asserted-by":"publisher","DOI":"10.1109\/IJCNN52387.2021.9533407"},{"key":"e_1_3_2_2_14_1","unstructured":"Keunwoo Choi and Kyunghyun Cho. 2019. Deep Unsupervised Drum Transcription. In ISMIR Arthur Flexer Geoffroy Peeters Juli\u00e1 n Urbano and Anja Volk (Eds.). 183--191. http:\/\/archives.ismir.net\/ismir2019\/paper\/000020.pdf  Keunwoo Choi and Kyunghyun Cho. 2019. Deep Unsupervised Drum Transcription. In ISMIR Arthur Flexer Geoffroy Peeters Juli\u00e1 n Urbano and Anja Volk (Eds.). 183--191. http:\/\/archives.ismir.net\/ismir2019\/paper\/000020.pdf"},{"key":"e_1_3_2_2_15_1","unstructured":"Michael Scott Cuthbert and Christopher Ariza. 2010. music21: A toolkit for computer-aided musicology and symbolic music data. In ISMIR.  Michael Scott Cuthbert and Christopher Ariza. 2010. music21: A toolkit for computer-aided musicology and symbolic music data. In ISMIR."},{"key":"e_1_3_2_2_16_1","volume-title":"MAPS-A piano database for multipitch estimation and automatic transcription of music. Hal Inria","author":"Emiya Valentin","year":"2010"},{"key":"e_1_3_2_2_17_1","volume-title":"Explaining and Harnessing Adversarial Examples. In International Conference on Learning Representations.","author":"Goodfellow Ian","year":"2015"},{"key":"e_1_3_2_2_18_1","unstructured":"Curtis Hawthorne Erich Elsen Jialin Song Adam Roberts Ian Simon Colin Raffel Jesse Engel Sageev Oore and Douglas Eck. 2017. Onsets and Frames: Dual-Objective Piano Transcription. In ISMIR.  Curtis Hawthorne Erich Elsen Jialin Song Adam Roberts Ian Simon Colin Raffel Jesse Engel Sageev Oore and Douglas Eck. 2017. Onsets and Frames: Dual-Objective Piano Transcription. In ISMIR."},{"key":"e_1_3_2_2_19_1","volume-title":"Enabling Factorized Piano Music Modeling and Generation with the MAESTRO Dataset. In International Conference on Learning Representations. https:\/\/openreview.net\/forum?id=r1lYRjC9F7","author":"Hawthorne Curtis","year":"2019"},{"key":"e_1_3_2_2_20_1","volume-title":"Pop Music Transformer: Generating Music with Rhythm and Harmony. arXiv preprint arXiv:2002.00212","author":"Huang Yu-Siang","year":"2020"},{"key":"e_1_3_2_2_21_1","doi-asserted-by":"publisher","DOI":"10.5555\/3367471.3367696"},{"key":"e_1_3_2_2_22_1","volume-title":"Proceedings of the 16th sound & music computing conference. 65--71","author":"Jiang Zheng","year":"2019"},{"key":"e_1_3_2_2_23_1","doi-asserted-by":"publisher","DOI":"10.1109\/ICASSP.2019.8683582"},{"key":"e_1_3_2_2_24_1","volume-title":"Adversarial Learning for Improved Onsets and Frames Music Transcription. International Society forMusic Information Retrieval Conference","author":"Kim Jong Wook","year":"2019"},{"key":"e_1_3_2_2_25_1","volume-title":"Adam: A method for stochastic optimization. arXiv preprint arXiv:1412.6980","author":"Kingma Diederik P","year":"2014"},{"key":"e_1_3_2_2_26_1","volume-title":"Large-Scale MIDI-based Composer Classification. arXiv preprint arXiv:2010.14805","author":"Kong Qiuqiang","year":"2020"},{"key":"e_1_3_2_2_27_1","volume-title":"Cosine-distance virtual adversarial training for semi-supervised speaker-discriminative acoustic embeddings. Interspeech","author":"Kreyssig Florian L","year":"2020"},{"key":"e_1_3_2_2_28_1","volume-title":"Model Smoothing Using Virtual Adversarial Training for Speech Emotion Estimation. In 2019 IEEE International Conference on Big Data, Cloud Computing, Data Science & Engineering (BCD). IEEE, 60--64","author":"Kuwahara Toyoaki","year":"2019"},{"key":"e_1_3_2_2_29_1","doi-asserted-by":"publisher","DOI":"10.1109\/ICCV.2017.324"},{"key":"e_1_3_2_2_30_1","doi-asserted-by":"publisher","DOI":"10.1109\/ICSP51882.2021.9408762"},{"key":"e_1_3_2_2_31_1","volume-title":"CHORDIFY: THREE YEARS AFTER THE LAUNCH. In ISMIR.","author":"Magalhaes Jos\u00e9 Pedro","year":"2015"},{"key":"e_1_3_2_2_32_1","volume-title":"International Semantic Web Conference. Springer, 156--164","author":"Albert Mero","year":"2017"},{"key":"e_1_3_2_2_33_1","volume-title":"Adversarial training methods for semi-supervised text classification. ICLR","author":"Miyato Takeru","year":"2016"},{"key":"e_1_3_2_2_34_1","doi-asserted-by":"publisher","DOI":"10.1109\/TPAMI.2018.2858821"},{"key":"e_1_3_2_2_35_1","doi-asserted-by":"publisher","DOI":"10.1145\/3308558.3313416"},{"key":"e_1_3_2_2_36_1","doi-asserted-by":"publisher","DOI":"10.1109\/ICASSP40776.2020.9052987"},{"key":"e_1_3_2_2_37_1","doi-asserted-by":"publisher","DOI":"10.5555\/3454287.3454294"},{"key":"e_1_3_2_2_38_1","volume-title":"Antonio Pertusa, and Jorge Calvo-Zaragoza.","author":"Miguel","year":"2018"},{"key":"e_1_3_2_2_39_1","volume-title":"Antonio Pertusa, and Jorge Calvo-Zaragoza.","author":"Miguel","year":"2019"},{"key":"e_1_3_2_2_40_1","doi-asserted-by":"publisher","DOI":"10.18653\/v1\/N18-2074"},{"key":"e_1_3_2_2_41_1","doi-asserted-by":"publisher","DOI":"10.1109\/TASLP.2016.2533858"},{"key":"e_1_3_2_2_42_1","first-page":"973","article-title":"Query by singing\/humming system based on deep learning","volume":"12","author":"Sun JQ","year":"2017","journal-title":"Int. J. Appl. Eng. Res"},{"key":"e_1_3_2_2_43_1","volume-title":"Invariances and Data Augmentation for Supervised Music Transcription. 2018 IEEE International Conference on Acoustics, Speech and Signal Processing (ICASSP)","author":"Thickstun John","year":"2017"},{"key":"e_1_3_2_2_44_1","volume-title":"Kakade","author":"Thickstun John","year":"2016"},{"key":"e_1_3_2_2_45_1","volume-title":"Toward Interpretable Music Tagging with Self-Attention. arxiv","author":"Won Minz","year":"1906"},{"key":"e_1_3_2_2_46_1","volume-title":"Polyphonic Music Transcription with Semantic Segmentation. In ICASSP 2019 - 2019 IEEE International Conference on Acoustics, Speech and Signal Processing (ICASSP). 166--170","author":"Wu Yu-Te","year":"2019"},{"key":"e_1_3_2_2_47_1","doi-asserted-by":"publisher","DOI":"10.1109\/taslp.2020.3030482"},{"key":"e_1_3_2_2_48_1","doi-asserted-by":"publisher","DOI":"10.1109\/SNPD.2019.8935654"}],"event":{"name":"MM '21: ACM Multimedia Conference","location":"Virtual Event China","acronym":"MM '21","sponsor":["SIGMM ACM Special Interest Group on Multimedia"]},"container-title":["Proceedings of the 29th ACM International Conference on Multimedia"],"original-title":[],"link":[{"URL":"https:\/\/dl.acm.org\/doi\/10.1145\/3474085.3475405","content-type":"unspecified","content-version":"vor","intended-application":"text-mining"},{"URL":"https:\/\/dl.acm.org\/doi\/pdf\/10.1145\/3474085.3475405","content-type":"unspecified","content-version":"vor","intended-application":"similarity-checking"}],"deposited":{"date-parts":[[2025,6,17]],"date-time":"2025-06-17T20:48:32Z","timestamp":1750193312000},"score":1,"resource":{"primary":{"URL":"https:\/\/dl.acm.org\/doi\/10.1145\/3474085.3475405"}},"subtitle":[],"short-title":[],"issued":{"date-parts":[[2021,10,17]]},"references-count":47,"alternative-id":["10.1145\/3474085.3475405","10.1145\/3474085"],"URL":"https:\/\/doi.org\/10.1145\/3474085.3475405","relation":{},"subject":[],"published":{"date-parts":[[2021,10,17]]},"assertion":[{"value":"2021-10-17","order":2,"name":"published","label":"Published","group":{"name":"publication_history","label":"Publication History"}}]}}