{"status":"ok","message-type":"work","message-version":"1.0.0","message":{"indexed":{"date-parts":[[2025,3,27]],"date-time":"2025-03-27T19:12:09Z","timestamp":1743102729322,"version":"3.40.3"},"publisher-location":"Cham","reference-count":35,"publisher":"Springer International Publishing","isbn-type":[{"type":"print","value":"9783031270765"},{"type":"electronic","value":"9783031270772"}],"license":[{"start":{"date-parts":[[2023,1,1]],"date-time":"2023-01-01T00:00:00Z","timestamp":1672531200000},"content-version":"tdm","delay-in-days":0,"URL":"https:\/\/www.springernature.com\/gp\/researchers\/text-and-data-mining"},{"start":{"date-parts":[[2023,1,1]],"date-time":"2023-01-01T00:00:00Z","timestamp":1672531200000},"content-version":"vor","delay-in-days":0,"URL":"https:\/\/www.springernature.com\/gp\/researchers\/text-and-data-mining"}],"content-domain":{"domain":["link.springer.com"],"crossmark-restriction":false},"short-container-title":[],"published-print":{"date-parts":[[2023]]},"DOI":"10.1007\/978-3-031-27077-2_27","type":"book-chapter","created":{"date-parts":[[2023,3,28]],"date-time":"2023-03-28T05:03:10Z","timestamp":1679979790000},"page":"345-357","update-policy":"https:\/\/doi.org\/10.1007\/springer_crossmark_policy","source":"Crossref","is-referenced-by-count":0,"title":["Music Instrument Classification Reprogrammed"],"prefix":"10.1007","author":[{"ORCID":"https:\/\/orcid.org\/0000-0002-3406-741X","authenticated-orcid":false,"given":"Hsin-Hung","family":"Chen","sequence":"first","affiliation":[]},{"ORCID":"https:\/\/orcid.org\/0000-0001-6319-578X","authenticated-orcid":false,"given":"Alexander","family":"Lerch","sequence":"additional","affiliation":[]}],"member":"297","published-online":{"date-parts":[[2023,3,29]]},"reference":[{"key":"27_CR1","unstructured":"Benetos, E., Kotti, M., Kotropoulos, C.: Musical instrument classification using non-negative matrix factorization algorithms and subset feature selection. In: ICASSP (2006)"},{"key":"27_CR2","doi-asserted-by":"publisher","first-page":"317","DOI":"10.1016\/j.patcog.2018.07.023","volume":"84","author":"B Biggio","year":"2018","unstructured":"Biggio, B., Roli, F.: Wild patterns: ten years after the rise of adversarial machine learning. Pattern Recognit. 84, 317\u2013331 (2018)","journal-title":"Pattern Recognit."},{"key":"27_CR3","unstructured":"Bittner, R.M., Salamon, J., Tierney, M., Mauch, M., Cannam, C., Bello, J.P.: Medleydb: a multitrack dataset for annotation-intensive MIR research. In: ISMIR (2014)"},{"key":"27_CR4","unstructured":"Bosch, J.J., Janer, J., Fuhrmann, F., Herrera, P.: A comparison of sound segregation techniques for predominant instrument recognition in musical audio signals. In: ISMIR (2012)"},{"key":"27_CR5","unstructured":"Choi, K., Fazekas, G., Sandler, M.B., Cho, K.: Transfer learning for music classification and regression tasks. In: ISMIR (2017)"},{"issue":"6","key":"27_CR6","doi-asserted-by":"publisher","first-page":"1293","DOI":"10.1109\/JAS.2019.1911747","volume":"6","author":"HA Dau","year":"2019","unstructured":"Dau, H.A., et al.: The UCR time series archive. IEEE\/CAA J. Automatica Sinica 6(6), 1293\u20131305 (2019)","journal-title":"IEEE\/CAA J. Automatica Sinica"},{"key":"27_CR7","unstructured":"Defferrard, M., Benzi, K., Vandergheynst, P., Bresson, X.: FMA: a dataset for music analysis. In: ISMIR (2017)"},{"key":"27_CR8","unstructured":"Elsayed, G.F., Goodfellow, I., Sohl-Dickstein, J.: Adversarial reprogramming of neural networks. In: ICLR (2019)"},{"key":"27_CR9","unstructured":"Eronen, A., Klapuri, A.: Musical instrument recognition using cepstral coefficients and temporal features. In: ICASSP (2000)"},{"key":"27_CR10","unstructured":"Essid, S., Richard, G., David, B.: Hierarchical classification of musical instruments on solo recordings. In: ICASSP (2006)"},{"key":"27_CR11","doi-asserted-by":"crossref","unstructured":"Gemmeke, J.F., et al.: Audio set: an ontology and human-labeled dataset for audio events. In: ICASSP (2017)","DOI":"10.1109\/ICASSP.2017.7952261"},{"key":"27_CR12","doi-asserted-by":"crossref","unstructured":"Gong, Y., Chung, Y.A., Glass, J.R.: AST: Audio spectrogram transformer. In: Interspeech (2021)","DOI":"10.21437\/Interspeech.2021-698"},{"key":"27_CR13","doi-asserted-by":"crossref","unstructured":"Gong, Y., Lai, C.I., Chung, Y.A., Glass, J.R.: SSAST: self-supervised audio spectrogram transformer. In: AAAI (2021)","DOI":"10.21437\/Interspeech.2021-698"},{"key":"27_CR14","unstructured":"Gururani, S., Lerch, A.: Mixing secrets: a multi-track dataset for instrument recognition in polyphonic music. In: ISMIR (2017)"},{"key":"27_CR15","doi-asserted-by":"crossref","unstructured":"Gururani, S., Lerch, A.: Semi-supervised audio classification with partially labeled data. In: IEEE ISM (2021)","DOI":"10.1109\/ISM52913.2021.00027"},{"key":"27_CR16","unstructured":"Gururani, S., Sharma, M., Lerch, A.: An attention mechanism for musical instrument recognition. In: ISMIR (2019)"},{"key":"27_CR17","doi-asserted-by":"crossref","unstructured":"Hambardzumyan, K., Khachatrian, H., May, J.: WARP: word-level adversarial ReProgramming. In: IJCNLP (2021)","DOI":"10.18653\/v1\/2021.acl-long.381"},{"key":"27_CR18","doi-asserted-by":"crossref","unstructured":"He, K., Zhang, X., Ren, S., Sun, J.: Deep residual learning for image recognition. In: CVPR (2016)","DOI":"10.1109\/CVPR.2016.90"},{"key":"27_CR19","doi-asserted-by":"crossref","unstructured":"Hershey, S., et al.: CNN architectures for large-scale audio classification. In: ICASSP (2017)","DOI":"10.1109\/ICASSP.2017.7952132"},{"key":"27_CR20","unstructured":"Howard, A.G., et al.: Mobilenets: efficient convolutional neural networks for mobile vision applications. In: CVPR (2017)"},{"key":"27_CR21","unstructured":"Humphrey, E., Durand, S., McFee, B.: Openmic-2018: an open data-set for multiple instrument recognition. In: ISMIR (2018)"},{"key":"27_CR22","doi-asserted-by":"crossref","unstructured":"Hung, Y., Yang, Y.: Frame-level instrument recognition by timbre and pitch. In: ISMIR (2018)","DOI":"10.1109\/ICASSP.2019.8683426"},{"key":"27_CR23","unstructured":"Jansson, A., Humphrey, E.J., Montecchio, N., Bittner, R.M., Kumar, A., Weyde, T.: Singing voice separation with deep u-net convolutional networks. In: ISMIR (2017)"},{"key":"27_CR24","doi-asserted-by":"crossref","unstructured":"Kong, Q., Cao, Y., Iqbal, T., Wang, Y., Wang, W., Plumbley, M.D.: PANNs: large-scale pretrained audio neural networks for audio pattern recognition. In: IEEE\/ACM Transactions on Audio, Speech, and Language Processing (2020)","DOI":"10.1109\/TASLP.2020.3030497"},{"key":"27_CR25","unstructured":"Li, P.Q., Qian, J., Wang, T.: Automatic instrument recognition in polyphonic music using convolutional neural networks. CoRR abs\/1511.05520 (2015)"},{"key":"27_CR26","unstructured":"Lostanlen, V., Cella, C.E.: Deep convolutional networks on the pitch spiral for music instrument recognition. In: ISMIR (2016)"},{"key":"27_CR27","doi-asserted-by":"crossref","unstructured":"Nagawade, M.S., Ratnaparkhe, V.R.: Musical instrument identification using MFCC. In: RTEIC) (2017)","DOI":"10.1109\/RTEICT.2017.8256990"},{"key":"27_CR28","doi-asserted-by":"crossref","unstructured":"Neekhara, P., Hussain, S., Dubnov, S., Koushanfar, F.: Adversarial reprogramming of text classification neural networks. In: EMNLP-IJCNLP (2019)","DOI":"10.18653\/v1\/D19-1525"},{"key":"27_CR29","doi-asserted-by":"crossref","unstructured":"Piczak, K.J.: ESC: Dataset for Environmental Sound Classification. In: ACM MM, pp. 1015\u20131018. ACM (2015)","DOI":"10.1145\/2733373.2806390"},{"key":"27_CR30","unstructured":"Pons, J., Serra, X.: MusiCNN: pre-trained convolutional neural networks for music audio tagging. In: ISMIR (2019)"},{"key":"27_CR31","series-title":"Lecture Notes in Computer Science","doi-asserted-by":"publisher","first-page":"234","DOI":"10.1007\/978-3-319-24574-4_28","volume-title":"Medical Image Computing and Computer-Assisted Intervention \u2013 MICCAI 2015","author":"O Ronneberger","year":"2015","unstructured":"Ronneberger, O., Fischer, P., Brox, T.: U-Net: convolutional networks for biomedical image segmentation. In: Navab, N., Hornegger, J., Wells, W.M., Frangi, A.F. (eds.) MICCAI 2015. LNCS, vol. 9351, pp. 234\u2013241. Springer, Cham (2015). https:\/\/doi.org\/10.1007\/978-3-319-24574-4_28"},{"key":"27_CR32","series-title":"Lecture Notes in Computer Science","doi-asserted-by":"publisher","first-page":"270","DOI":"10.1007\/978-3-030-01424-7_27","volume-title":"Artificial Neural Networks and Machine Learning \u2013 ICANN 2018","author":"C Tan","year":"2018","unstructured":"Tan, C., Sun, F., Kong, T., Zhang, W., Yang, C., Liu, C.: A survey on deep transfer learning. In: K\u016frkov\u00e1, V., Manolopoulos, Y., Hammer, B., Iliadis, L., Maglogiannis, I. (eds.) ICANN 2018. LNCS, vol. 11141, pp. 270\u2013279. Springer, Cham (2018). https:\/\/doi.org\/10.1007\/978-3-030-01424-7_27"},{"key":"27_CR33","unstructured":"Tsai, Y.Y., Chen, P.Y., Ho, T.Y.: Transfer learning without knowing: reprogramming black-box machine learning models with scarce data and limited resources. In: ICML. PMLR (2020)"},{"key":"27_CR34","unstructured":"Warden, P.: Speech commands: a dataset for limited-vocabulary speech recognition. CoRR abs\/1804.03209 (2018)"},{"key":"27_CR35","unstructured":"Yang, C.H.H., Tsai, Y.Y., Chen, P.Y.: Voice2series: reprogramming acoustic models for time series classification. In: ICML. PMLR (2021)"}],"container-title":["Lecture Notes in Computer Science","MultiMedia Modeling"],"original-title":[],"language":"en","link":[{"URL":"https:\/\/link.springer.com\/content\/pdf\/10.1007\/978-3-031-27077-2_27","content-type":"unspecified","content-version":"vor","intended-application":"similarity-checking"}],"deposited":{"date-parts":[[2023,3,28]],"date-time":"2023-03-28T05:13:56Z","timestamp":1679980436000},"score":1,"resource":{"primary":{"URL":"https:\/\/link.springer.com\/10.1007\/978-3-031-27077-2_27"}},"subtitle":[],"short-title":[],"issued":{"date-parts":[[2023]]},"ISBN":["9783031270765","9783031270772"],"references-count":35,"URL":"https:\/\/doi.org\/10.1007\/978-3-031-27077-2_27","relation":{},"ISSN":["0302-9743","1611-3349"],"issn-type":[{"type":"print","value":"0302-9743"},{"type":"electronic","value":"1611-3349"}],"subject":[],"published":{"date-parts":[[2023]]},"assertion":[{"value":"29 March 2023","order":1,"name":"first_online","label":"First Online","group":{"name":"ChapterHistory","label":"Chapter History"}},{"value":"MMM","order":1,"name":"conference_acronym","label":"Conference Acronym","group":{"name":"ConferenceInfo","label":"Conference Information"}},{"value":"International Conference on Multimedia Modeling","order":2,"name":"conference_name","label":"Conference Name","group":{"name":"ConferenceInfo","label":"Conference Information"}},{"value":"Bergen","order":3,"name":"conference_city","label":"Conference City","group":{"name":"ConferenceInfo","label":"Conference Information"}},{"value":"Norway","order":4,"name":"conference_country","label":"Conference Country","group":{"name":"ConferenceInfo","label":"Conference Information"}},{"value":"2023","order":5,"name":"conference_year","label":"Conference Year","group":{"name":"ConferenceInfo","label":"Conference Information"}},{"value":"9 January 2023","order":7,"name":"conference_start_date","label":"Conference Start Date","group":{"name":"ConferenceInfo","label":"Conference Information"}},{"value":"12 January 2023","order":8,"name":"conference_end_date","label":"Conference End Date","group":{"name":"ConferenceInfo","label":"Conference Information"}},{"value":"29","order":9,"name":"conference_number","label":"Conference Number","group":{"name":"ConferenceInfo","label":"Conference Information"}},{"value":"mmm2023","order":10,"name":"conference_id","label":"Conference ID","group":{"name":"ConferenceInfo","label":"Conference Information"}},{"value":"Double-blind","order":1,"name":"type","label":"Type","group":{"name":"ConfEventPeerReviewInformation","label":"Peer Review Information (provided by the conference organizers)"}},{"value":"Conftool Pro","order":2,"name":"conference_management_system","label":"Conference Management System","group":{"name":"ConfEventPeerReviewInformation","label":"Peer Review Information (provided by the conference organizers)"}},{"value":"267","order":3,"name":"number_of_submissions_sent_for_review","label":"Number of Submissions Sent for Review","group":{"name":"ConfEventPeerReviewInformation","label":"Peer Review Information (provided by the conference organizers)"}},{"value":"86","order":4,"name":"number_of_full_papers_accepted","label":"Number of Full Papers Accepted","group":{"name":"ConfEventPeerReviewInformation","label":"Peer Review Information (provided by the conference organizers)"}},{"value":"0","order":5,"name":"number_of_short_papers_accepted","label":"Number of Short Papers Accepted","group":{"name":"ConfEventPeerReviewInformation","label":"Peer Review Information (provided by the conference organizers)"}},{"value":"32% - The value is computed by the equation \"Number of Full Papers Accepted \/ Number of Submissions Sent for Review * 100\" and then rounded to a whole number.","order":6,"name":"acceptance_rate_of_full_papers","label":"Acceptance Rate of Full Papers","group":{"name":"ConfEventPeerReviewInformation","label":"Peer Review Information (provided by the conference organizers)"}},{"value":"3","order":7,"name":"average_number_of_reviews_per_paper","label":"Average Number of Reviews per Paper","group":{"name":"ConfEventPeerReviewInformation","label":"Peer Review Information (provided by the conference organizers)"}},{"value":"4","order":8,"name":"average_number_of_papers_per_reviewer","label":"Average Number of Papers per Reviewer","group":{"name":"ConfEventPeerReviewInformation","label":"Peer Review Information (provided by the conference organizers)"}},{"value":"No","order":9,"name":"external_reviewers_involved","label":"External Reviewers Involved","group":{"name":"ConfEventPeerReviewInformation","label":"Peer Review Information (provided by the conference organizers)"}}]}}