{"status":"ok","message-type":"work","message-version":"1.0.0","message":{"indexed":{"date-parts":[[2024,10,22]],"date-time":"2024-10-22T19:36:10Z","timestamp":1729625770976,"version":"3.28.0"},"reference-count":33,"publisher":"IEEE","content-domain":{"domain":[],"crossmark-restriction":false},"short-container-title":[],"published-print":{"date-parts":[[2016,3]]},"DOI":"10.1109\/icassp.2016.7471715","type":"proceedings-article","created":{"date-parts":[[2016,6,24]],"date-time":"2016-06-24T01:58:30Z","timestamp":1466733510000},"page":"450-454","source":"Crossref","is-referenced-by-count":4,"title":["Learning to separate vocals from polyphonic mixtures via ensemble methods and structured output prediction"],"prefix":"10.1109","author":[{"given":"M.","family":"McVicar","sequence":"first","affiliation":[],"role":[{"role":"author","vocabulary":"crossref"}]},{"given":"R.","family":"Santos-Rodriguez","sequence":"additional","affiliation":[],"role":[{"role":"author","vocabulary":"crossref"}]},{"given":"T.","family":"De Bie","sequence":"additional","affiliation":[],"role":[{"role":"author","vocabulary":"crossref"}]}],"member":"263","reference":[{"key":"ref33","doi-asserted-by":"publisher","DOI":"10.1109\/TSA.2005.858005"},{"key":"ref32","first-page":"2055","article-title":"Pystruct: learning structured prediction in python","volume":"15","author":"m\u00fcller","year":"2014","journal-title":"The Journal of Machine Learning Research"},{"key":"ref31","first-page":"2825","article-title":"Scikit-learn: Machine learning in python","volume":"12","author":"pedregosa","year":"2011","journal-title":"The Journal of Machine Learning Research"},{"key":"ref30","article-title":"scikit-image: image processing in python","volume":"2","author":"van","year":"2014","journal-title":"PeerJ"},{"key":"ref10","article-title":"Deep karaoke: Extracting vocals using a convolutional deep neural network","author":"simpson","year":"2015","journal-title":"arxiv org abs\/1504 04658"},{"key":"ref11","first-page":"67","article-title":"Real-time online singing voice separation from monaural recordings using robust low-rank modeling","author":"sprechmann","year":"2012","journal-title":"ISMIR"},{"key":"ref12","doi-asserted-by":"publisher","DOI":"10.1109\/TASL.2012.2213249"},{"key":"ref13","doi-asserted-by":"crossref","first-page":"310","DOI":"10.1109\/TASL.2009.2026503","article-title":"On the improvement of singing voice separation for monaural recordings using the mir-1k dataset","volume":"18","author":"hsu","year":"2010","journal-title":"Audio Speech and Language Processing IEEE Transactions"},{"key":"ref14","doi-asserted-by":"publisher","DOI":"10.1109\/ICASSP.2015.7178063"},{"key":"ref15","doi-asserted-by":"publisher","DOI":"10.1109\/ICASSP.2015.7178004"},{"key":"ref16","doi-asserted-by":"publisher","DOI":"10.1109\/TASL.2011.2134092"},{"key":"ref17","first-page":"777","article-title":"Modeling musical emotion dynamics with conditional random fields","author":"schmidt","year":"2011","journal-title":"ISMIR"},{"key":"ref18","first-page":"817","article-title":"Multi-class image segmentation using conditional random fields and global classification","author":"nils","year":"2009","journal-title":"Proceedings of the 26th Annual International Conference on Machine Learning"},{"key":"ref19","doi-asserted-by":"publisher","DOI":"10.1109\/JPROC.2013.2248112"},{"key":"ref28","article-title":"Block-coordinate frank-wolfe optimization for structural svms","author":"lacoste-julien","year":"2012","journal-title":"arXiv preprint arXiv 1207 4747"},{"key":"ref4","doi-asserted-by":"publisher","DOI":"10.1109\/ICASSP.2012.6287816"},{"key":"ref27","doi-asserted-by":"publisher","DOI":"10.1109\/ICASSP.2014.6853860"},{"key":"ref3","first-page":"337","article-title":"Separation of vocals from polyphonic audio recordings","author":"vembu","year":"2005","journal-title":"ISMIR"},{"key":"ref6","first-page":"427","article-title":"Low-rank representation of both singing voice and music accompaniment via learned dictionaries","author":"yang","year":"2013","journal-title":"ISMIR"},{"key":"ref29","article-title":"librosa: Audio and music signal analysis in python","author":"mcfee","year":"2015","journal-title":"14th annual Scientific Computing with Python conference"},{"key":"ref5","doi-asserted-by":"publisher","DOI":"10.1109\/LSP.2014.2329946"},{"key":"ref8","doi-asserted-by":"publisher","DOI":"10.1109\/TASL.2007.909260"},{"key":"ref7","first-page":"176","article-title":"Singing voice separation from monaural recordings","author":"li","year":"2006","journal-title":"ISMIR"},{"key":"ref2","doi-asserted-by":"publisher","DOI":"10.1109\/TNN.2004.832812"},{"key":"ref9","article-title":"Singing - voice separation from monaural recordings using deep recurrent neural networks","author":"huang","year":"2014","journal-title":"ISMIR"},{"key":"ref1","first-page":"243","article-title":"Singing voice separation for mono-channel music using nonnegative matrix factorization","author":"angkana","year":"2008","journal-title":"Advanced Technologies for Communications 2008 ATC 2008 International Conference"},{"article-title":"A tutorial on conditional random fields with applications to music analysis","year":"2013","author":"slim","key":"ref20"},{"key":"ref22","doi-asserted-by":"crossref","first-page":"406","DOI":"10.21437\/Interspeech.2010-171","article-title":"Combining monaural and binaural evidence for reverberant speech segregation","author":"woodruff","year":"2010","journal-title":"InterSpeech"},{"key":"ref21","article-title":"Monaural segregation of voiced speech using discriminative random fields","author":"prabhavalkar","year":"2009","journal-title":"Tenth Annual Conference of the International Speech Communication Association"},{"key":"ref24","doi-asserted-by":"publisher","DOI":"10.1145\/1970392.1970395"},{"key":"ref23","first-page":"1","article-title":"Ensemble learning for speech enhancement","author":"jonathan","year":"2013","journal-title":"Applications of Signal Processing to Audio and Acoustics (WASPAA) 2013 IEEE Workshop"},{"key":"ref26","doi-asserted-by":"publisher","DOI":"10.1109\/ICSMC.1990.142050"},{"key":"ref25","article-title":"Harmonic\/percussive separation using median filtering","author":"fitzgerald","year":"2010","journal-title":"International Conference on Digital Audio Effects"}],"event":{"name":"2016 IEEE International Conference on Acoustics, Speech and Signal Processing (ICASSP)","start":{"date-parts":[[2016,3,20]]},"location":"Shanghai","end":{"date-parts":[[2016,3,25]]}},"container-title":["2016 IEEE International Conference on Acoustics, Speech and Signal Processing (ICASSP)"],"original-title":[],"link":[{"URL":"http:\/\/xplorestaging.ieee.org\/ielx7\/7465907\/7471614\/07471715.pdf?arnumber=7471715","content-type":"unspecified","content-version":"vor","intended-application":"similarity-checking"}],"deposited":{"date-parts":[[2024,6,17]],"date-time":"2024-06-17T21:28:00Z","timestamp":1718659680000},"score":1,"resource":{"primary":{"URL":"http:\/\/ieeexplore.ieee.org\/document\/7471715\/"}},"subtitle":[],"short-title":[],"issued":{"date-parts":[[2016,3]]},"references-count":33,"URL":"https:\/\/doi.org\/10.1109\/icassp.2016.7471715","relation":{},"subject":[],"published":{"date-parts":[[2016,3]]}}}