{"status":"ok","message-type":"work","message-version":"1.0.0","message":{"indexed":{"date-parts":[[2026,5,9]],"date-time":"2026-05-09T08:04:32Z","timestamp":1778313872489,"version":"3.51.4"},"reference-count":31,"publisher":"IEEE","license":[{"start":{"date-parts":[[2024,4,14]],"date-time":"2024-04-14T00:00:00Z","timestamp":1713052800000},"content-version":"stm-asf","delay-in-days":0,"URL":"https:\/\/doi.org\/10.15223\/policy-029"},{"start":{"date-parts":[[2024,4,14]],"date-time":"2024-04-14T00:00:00Z","timestamp":1713052800000},"content-version":"stm-asf","delay-in-days":0,"URL":"https:\/\/doi.org\/10.15223\/policy-037"}],"content-domain":{"domain":[],"crossmark-restriction":false},"short-container-title":[],"published-print":{"date-parts":[[2024,4,14]]},"DOI":"10.1109\/icasspw62465.2024.10669909","type":"proceedings-article","created":{"date-parts":[[2024,9,10]],"date-time":"2024-09-10T18:23:22Z","timestamp":1725992602000},"page":"833-837","source":"Crossref","is-referenced-by-count":3,"title":["Leveraging Pre-Trained Autoencoders for Interpretable Prototype Learning of Music Audio"],"prefix":"10.1109","author":[{"given":"Pablo","family":"Alonso-Jim\u00e9nez","sequence":"first","affiliation":[{"name":"Universitat Pompeu Fabra,Music Technology Group,Spain"}],"role":[{"role":"author","vocabulary":"crossref"}]},{"given":"Leonardo","family":"Pepino","sequence":"additional","affiliation":[{"name":"Instituto de Investigaci\u00f3n en Ciencias de la Computaci\u00f3n (ICC), CONICET-UBA,Argentina"}],"role":[{"role":"author","vocabulary":"crossref"}]},{"given":"Roser","family":"Batlle-Roca","sequence":"additional","affiliation":[{"name":"Universitat Pompeu Fabra,Music Technology Group,Spain"}],"role":[{"role":"author","vocabulary":"crossref"}]},{"given":"Pablo","family":"Zinemanas","sequence":"additional","affiliation":[{"name":"Universitat Pompeu Fabra,Music Technology 
Group,Spain"}],"role":[{"role":"author","vocabulary":"crossref"}]},{"given":"Dmitry","family":"Bogdanov","sequence":"additional","affiliation":[{"name":"Universitat Pompeu Fabra,Music Technology Group,Spain"}],"role":[{"role":"author","vocabulary":"crossref"}]},{"given":"Xavier","family":"Serra","sequence":"additional","affiliation":[{"name":"Universitat Pompeu Fabra,Music Technology Group,Spain"}],"role":[{"role":"author","vocabulary":"crossref"}]},{"given":"Mart\u00edn","family":"Rocamora","sequence":"additional","affiliation":[{"name":"Universitat Pompeu Fabra,Music Technology Group,Spain"}],"role":[{"role":"author","vocabulary":"crossref"}]}],"member":"263","reference":[{"key":"ref1","doi-asserted-by":"publisher","DOI":"10.1007\/978-3-030-70210-6_1"},{"key":"ref2","volume-title":"Interpretable Machine Learning","author":"Molnar","year":"2022"},{"key":"ref3","article-title":"Ethics Guidelines for Trustworthy AI","year":"2019"},{"key":"ref4","article-title":"Explainable artificial intelligence (XAI): Concepts, taxonomies, opportunities and challenges toward responsible AI","volume":"58","author":"Arrieta","year":"2020","journal-title":"Information Fusion"},{"key":"ref5","doi-asserted-by":"publisher","DOI":"10.1145\/2967507"},{"key":"ref6","doi-asserted-by":"publisher","DOI":"10.5334\/tismir.85"},{"key":"ref7","doi-asserted-by":"publisher","DOI":"10.3390\/electronics10070850"},{"key":"ref8","doi-asserted-by":"publisher","DOI":"10.1609\/aaai.v32i1.11771"},{"key":"ref9","article-title":"EnCodec-MAE: Leveraging neural codecs for universal audio representation learning","author":"Pepino","year":"2023"},{"key":"ref10","article-title":"The acousticbrainz genre dataset: Multi-source, multi-level, multi-label, and large-scale","volume-title":"Intl. Society for Music Information Retrieval (ISMIR)","author":"Bogdanov","year":"2019"},{"key":"ref11","article-title":"Leveraging knowledge bases and parallel annotations for music genre translation","volume-title":"Intl. 
Society for Music Information Retrieval Conf. (ISMIR)","author":"Epure"},{"key":"ref12","doi-asserted-by":"publisher","DOI":"10.1076\/jnmr.32.1.83.16801"},{"key":"ref13","article-title":"Musical genre classification: Is it worth pursuing and how can it be improved?","volume-title":"Intl. Society for Music Information Retrieval (ISMIR)","author":"McKay","year":"2006"},{"key":"ref14","article-title":"How many beans make five? the consensus problem in music-genre classification and a new evaluation method for single-genre categorisation systems","volume-title":"Intl. Conf. on Music Information Retrieval (ISMIR)","author":"Craft"},{"key":"ref15","article-title":"The quest for musical genres: Do the experts and the wisdom of crowds agree?","volume-title":"Intl. Conf. on Music Information Retrieval (ISMIR)","author":"Sordo"},{"key":"ref16","doi-asserted-by":"crossref","DOI":"10.1007\/978-3-319-12093-5_2","article-title":"A survey of evaluation in music genre recognition","volume-title":"Intl. Workshop on Adaptive Multimedia Retrieval","author":"Sturm"},{"key":"ref17","doi-asserted-by":"crossref","DOI":"10.21203\/rs.3.rs-3708077\/v1","article-title":"Transparency in music-generative AI: A systematic literature review","author":"Batlle-Roca","year":"2023"},{"key":"ref18","doi-asserted-by":"publisher","DOI":"10.1109\/ICASSP.2014.6854950"},{"key":"ref19","article-title":"Local interpretable model-agnostic explanations for music content analysis","volume-title":"Intl. Society for Music Information Retrieval Conf. (ISMIR)","author":"Mishra"},{"key":"ref20","article-title":"Toward interpretable music tagging with self-attention","author":"Won","year":"2019"},{"key":"ref21","article-title":"A model you can hear: Audio identification with playable prototypes","volume-title":"Intl. Conf. 
on Music Information Retrieval (ISMIR)","author":"Loiseau"},{"key":"ref22","doi-asserted-by":"publisher","DOI":"10.1109\/TASLP.2021.3129994"},{"key":"ref23","article-title":"High fidelity neural audio compression","author":"D\u00e9fossez","year":"2022"},{"key":"ref24","article-title":"High-fidelity audio compression with improved RVQGAN","author":"Kumar","year":"2023"},{"key":"ref25","article-title":"Deep convolutional networks on the pitch spiral for musical instrument recognition","volume-title":"Intl. Society for Music Information Retrieval Conf. (ISMIR)","author":"Lostanlen"},{"key":"ref26","article-title":"The GTZAN dataset: Its contents, its faults, their effects on evaluation, and its future use","author":"Sturm","year":"2013"},{"key":"ref27","article-title":"FMA: A dataset for music analysis","volume-title":"Intl. Society for Music Information Retrieval Conf. (ISMIR)","author":"Defferrard"},{"key":"ref28","article-title":"Progressive distillation for fast sampling of diffusion models","volume-title":"Intl. Conf. on Learning Representations (ICLR)","author":"Salimans"},{"key":"ref29","article-title":"Efficient supervised training of audio transformers for music representation learning","volume-title":"Intl. Society for Music Information Retrieval Conf. 
(ISMIR)","author":"Alonso-Jim\u00e9nez"},{"key":"ref30","doi-asserted-by":"publisher","DOI":"10.1109\/TSP.2019.2918992"},{"key":"ref31","doi-asserted-by":"publisher","DOI":"10.1109\/ICASSP.2018.8462046"}],"event":{"name":"2024 IEEE International Conference on Acoustics, Speech, and Signal Processing Workshops (ICASSPW)","location":"Seoul, Korea, Republic of","start":{"date-parts":[[2024,4,14]]},"end":{"date-parts":[[2024,4,19]]}},"container-title":["2024 IEEE International Conference on Acoustics, Speech, and Signal Processing Workshops (ICASSPW)"],"original-title":[],"link":[{"URL":"http:\/\/xplorestaging.ieee.org\/ielx8\/10625769\/10625780\/10669909.pdf?arnumber=10669909","content-type":"unspecified","content-version":"vor","intended-application":"similarity-checking"}],"deposited":{"date-parts":[[2024,9,11]],"date-time":"2024-09-11T17:29:37Z","timestamp":1726075777000},"score":1,"resource":{"primary":{"URL":"https:\/\/ieeexplore.ieee.org\/document\/10669909\/"}},"subtitle":[],"short-title":[],"issued":{"date-parts":[[2024,4,14]]},"references-count":31,"URL":"https:\/\/doi.org\/10.1109\/icasspw62465.2024.10669909","relation":{},"subject":[],"published":{"date-parts":[[2024,4,14]]}}}