{"status":"ok","message-type":"work","message-version":"1.0.0","message":{"indexed":{"date-parts":[[2026,5,27]],"date-time":"2026-05-27T18:22:30Z","timestamp":1779906150810,"version":"3.53.1"},"reference-count":30,"publisher":"IEEE","content-domain":{"domain":[],"crossmark-restriction":false},"short-container-title":[],"published-print":{"date-parts":[[2018,4]]},"DOI":"10.1109\/icassp.2018.8461329","type":"proceedings-article","created":{"date-parts":[[2018,9,21]],"date-time":"2018-09-21T22:24:48Z","timestamp":1537568688000},"page":"161-165","source":"Crossref","is-referenced-by-count":221,"title":["Crepe: A Convolutional Representation for Pitch Estimation"],"prefix":"10.1109","author":[{"given":"Jong Wook","family":"Kim","sequence":"first","affiliation":[],"role":[{"vocabulary":"crossref","role":"author"}]},{"given":"Justin","family":"Salamon","sequence":"additional","affiliation":[],"role":[{"vocabulary":"crossref","role":"author"}]},{"given":"Peter","family":"Li","sequence":"additional","affiliation":[],"role":[{"vocabulary":"crossref","role":"author"}]},{"given":"Juan Pablo","family":"Bello","sequence":"additional","affiliation":[],"role":[{"vocabulary":"crossref","role":"author"}]}],"member":"263","reference":[{"key":"ref30","author":"engel","year":"2017","journal-title":"Neural audio synthesis of musical notes with wavenet autoen-coders"},{"key":"ref10","first-page":"97","article-title":"Accurate short-term analysis of the fundamental frequency and the harmonics-to-noise ratio of a sampled sound","volume":"17","author":"boersma","year":"1993","journal-title":"Proc Institute Phonetic Sciences"},{"key":"ref11","doi-asserted-by":"publisher","DOI":"10.1121\/1.1458024"},{"key":"ref12","doi-asserted-by":"publisher","DOI":"10.1121\/1.2951592"},{"key":"ref13","doi-asserted-by":"publisher","DOI":"10.1109\/ICASSP.2014.6853678"},{"key":"ref14","article-title":"Comparison of pitch trackers for real-time guitar effects","author":"von dem knesebeck","year":"2010","journal-title":"Proceedings of the International Conference on Digital Audio Effects (DAFx)"},{"key":"ref15","doi-asserted-by":"publisher","DOI":"10.1109\/ICASSP.2013.6639185"},{"key":"ref16","doi-asserted-by":"publisher","DOI":"10.1109\/ICMLA.2012.220"},{"key":"ref17","article-title":"Enhanced beat tracking with context-aware neural networks","author":"bock","year":"0","journal-title":"Proc Int Conf on Digital Audio Effects (DAFx) 2011"},{"key":"ref18","article-title":"An analysis\/synthesis framework for automatic f0 annotation of multitrack datasets","author":"salamon","year":"2017","journal-title":"Proceedings of the 18th ISMIR Conference"},{"key":"ref19","article-title":"Deep salience representations for f0 tracking in polyphonic music","author":"bittner","year":"2017","journal-title":"Proceedings of the 18th ISMIR Conference"},{"key":"ref28","article-title":"The audio degradation toolbox and its application to robustness evaluation","author":"mauch","year":"2013","journal-title":"Proceedings of the 14th ISMIR Conference"},{"key":"ref4","author":"zubizarreta","year":"1998","journal-title":"Prosody Focus and Word Order"},{"key":"ref27","article-title":"mir_eval: A transparent implementation of common mir metrics","author":"raffel","year":"2014","journal-title":"Proceedings of the 15th ISMIR Conference"},{"key":"ref3","article-title":"Computer-aided melody note transcription using the tony software: Accuracy and efficiency","author":"mauch","year":"2015","journal-title":"Proceedings of the First International Conference on Technologies for Music Notation and Representation"},{"key":"ref6","doi-asserted-by":"publisher","DOI":"10.1121\/1.1910339"},{"key":"ref29","article-title":"A software framework for musical data augmentation","author":"mcfee","year":"2015","journal-title":"International Society for Music Information Retrieval Conference"},{"key":"ref5","author":"hartmann","year":"1997","journal-title":"Signals Sound and Sensation"},{"key":"ref8","doi-asserted-by":"publisher","DOI":"10.1109\/TASSP.1974.1162598"},{"key":"ref7","doi-asserted-by":"publisher","DOI":"10.1109\/TASSP.1976.1162765"},{"key":"ref2","article-title":"Melody extraction in symphonic classical music: a comparative study of mutual agreement between humans and algorithms","author":"bosch","year":"2014","journal-title":"Proc of the 9th Conference on Interdisciplinary Musicology (CIM14)"},{"key":"ref9","article-title":"A robust algorithm for pitch tracking (rapt)","author":"talkin","year":"1995","journal-title":"Speech Coding and Synthesis"},{"key":"ref1","first-page":"155","article-title":"Medleydb: A multitrack dataset for annotation-intensive mir research","volume":"14","author":"bittner","year":"2014","journal-title":"Proceedings of the 15th ISMIR Conference"},{"key":"ref20","article-title":"Adam: A method for stochastic optimisation","author":"kingma","year":"2015","journal-title":"Proc of the Int Conf on Learning Representations (ICLR)"},{"key":"ref22","first-page":"1929","article-title":"Dropout: a simple way to prevent neural networks from overfitting","volume":"15","author":"srivastava","year":"2014","journal-title":"Journal of Machine Learning Research"},{"key":"ref21","first-page":"448","article-title":"Batch normalization: Accelerating deep network training by reducing internal covariate shift","author":"ioffe","year":"2015","journal-title":"International Conference on Machine Learning"},{"key":"ref24","first-page":"287","article-title":"Rwc music database: Popular, classical and jazz music databases","volume":"2","author":"goto","year":"2002","journal-title":"Proceedings of the 3rd Conference on IS"},{"key":"ref23","author":"chollet","year":"0","journal-title":"Keras The Python deep learning library"},{"key":"ref26","doi-asserted-by":"publisher","DOI":"10.1109\/MSP.2013.2271648"},{"key":"ref25","doi-asserted-by":"publisher","DOI":"10.1007\/s10844-013-0250-y"}],"event":{"name":"ICASSP 2018 - 2018 IEEE International Conference on Acoustics, Speech and Signal Processing (ICASSP)","location":"Calgary, AB","start":{"date-parts":[[2018,4,15]]},"end":{"date-parts":[[2018,4,20]]}},"container-title":["2018 IEEE International Conference on Acoustics, Speech and Signal Processing (ICASSP)"],"original-title":[],"link":[{"URL":"http:\/\/xplorestaging.ieee.org\/ielx7\/8450881\/8461260\/08461329.pdf?arnumber=8461329","content-type":"unspecified","content-version":"vor","intended-application":"similarity-checking"}],"deposited":{"date-parts":[[2020,8,24]],"date-time":"2020-08-24T01:08:02Z","timestamp":1598231282000},"score":1,"resource":{"primary":{"URL":"https:\/\/ieeexplore.ieee.org\/document\/8461329\/"}},"subtitle":[],"short-title":[],"issued":{"date-parts":[[2018,4]]},"references-count":30,"URL":"https:\/\/doi.org\/10.1109\/icassp.2018.8461329","relation":{},"subject":[],"published":{"date-parts":[[2018,4]]}}}