{"status":"ok","message-type":"work","message-version":"1.0.0","message":{"indexed":{"date-parts":[[2026,5,8]],"date-time":"2026-05-08T20:18:04Z","timestamp":1778271484331,"version":"3.51.4"},"publisher-location":"Cham","reference-count":17,"publisher":"Springer Nature Switzerland","isbn-type":[{"value":"9783032253040","type":"print"},{"value":"9783032253057","type":"electronic"}],"license":[{"start":{"date-parts":[[2026,1,1]],"date-time":"2026-01-01T00:00:00Z","timestamp":1767225600000},"content-version":"tdm","delay-in-days":0,"URL":"https:\/\/www.springernature.com\/gp\/researchers\/text-and-data-mining"},{"start":{"date-parts":[[2026,1,1]],"date-time":"2026-01-01T00:00:00Z","timestamp":1767225600000},"content-version":"vor","delay-in-days":0,"URL":"https:\/\/www.springernature.com\/gp\/researchers\/text-and-data-mining"}],"content-domain":{"domain":["link.springer.com"],"crossmark-restriction":false},"short-container-title":[],"published-print":{"date-parts":[[2026]]},"DOI":"10.1007\/978-3-032-25305-7_23","type":"book-chapter","created":{"date-parts":[[2026,5,8]],"date-time":"2026-05-08T19:58:41Z","timestamp":1778270321000},"page":"331-338","update-policy":"https:\/\/doi.org\/10.1007\/springer_crossmark_policy","source":"Crossref","is-referenced-by-count":0,"title":["The Effect of\u00a0Perceptual Metrics on\u00a0Music Representation Learning for\u00a0Genre Classification"],"prefix":"10.1007","author":[{"given":"Tashi","family":"Namgyal","sequence":"first","affiliation":[],"role":[{"role":"author","vocabulary":"crossref"}]},{"given":"Alexander","family":"Hepburn","sequence":"additional","affiliation":[],"role":[{"role":"author","vocabulary":"crossref"}]},{"given":"Raul","family":"Santos-Rodriguez","sequence":"additional","affiliation":[],"role":[{"role":"author","vocabulary":"crossref"}]},{"given":"Valero","family":"Laparra","sequence":"additional","affiliation":[],"role":[{"role":"author","vocabulary":"crossref"}]},{"given":"Jesus","family":"Malo","sequence":"additional","affiliation":[],"role":[{"role":"author","vocabulary":"crossref"}]}],"member":"297","published-online":{"date-parts":[[2026,5,9]]},"reference":[{"key":"23_CR1","unstructured":"Barlow, H.B.: Possible principles underlying the transformation of sensory messages. Sensory Communication, pp. 217\u2013234 (1961)"},{"issue":"4","key":"23_CR2","doi-asserted-by":"publisher","first-page":"532","DOI":"10.1109\/TCOM.1983.1095851","volume":"31","author":"P Burt","year":"1983","unstructured":"Burt, P., Adelson, E.: The laplacian pyramid as a compact image code. IEEE Trans. Commun. 31(4), 532\u2013540 (1983)","journal-title":"IEEE Trans. Commun."},{"key":"23_CR3","doi-asserted-by":"crossref","unstructured":"Chen, L., Zhou, X., Chen, H.: Audio scanning network: Bridging time and frequency domains for audio classification. In: Proceedings of the AAAI Conference on Artificial Intelligence 38(10), pp. 11355\u201311363 (2024)","DOI":"10.1609\/aaai.v38i10.29015"},{"key":"23_CR4","unstructured":"Clifford, M.: mattclifford1\/iqm-vis: Zenodo1. Zenodo (2024). https:\/\/doi.org\/10.5281\/zenodo.13759721"},{"key":"23_CR5","doi-asserted-by":"crossref","unstructured":"Hepburn, A., Laparra, V., McConville, R., Santos-Rodriguez, R.: Enforcing perceptual consistency on generative adversarial networks by using the normalised laplacian pyramid distance. In: Proc. Northern Lights Deep Learning Workshop (NLDL) (2020)","DOI":"10.7557\/18.5124"},{"key":"23_CR6","unstructured":"Hepburn, A., Laparra, V., Santos-Rodriguez, R., Ball\u00e9, J., Malo, J.: On the relation between statistical learning and perceptual distances. In: Proc. Int. Conf. Learning Representations (ICLR) (2022)"},{"issue":"16","key":"23_CR7","doi-asserted-by":"publisher","first-page":"1","DOI":"10.2352\/ISSN.2470-1173.2016.16.HVEI-103","volume":"2016","author":"V Laparra","year":"2016","unstructured":"Laparra, V., Ball\u00e9, J., Berardino, A., Simoncelli, E.P.: Perceptual image quality assessment using a normalized laplacian pyramid. Electronic Imaging 2016(16), 1\u20136 (2016)","journal-title":"Electronic Imaging"},{"issue":"12","key":"23_CR8","doi-asserted-by":"publisher","first-page":"3179","DOI":"10.1162\/NECO_a_00046","volume":"22","author":"J Malo","year":"2010","unstructured":"Malo, J., Laparra, V.: Psychophysically tuned divisive normalization approximately factorizes the pdf of natural images. Neural Comput. 22(12), 3179\u20133206 (2010)","journal-title":"Neural Comput."},{"key":"23_CR9","unstructured":"Namgyal, T., Hepburn, A., Santos-Rodriguez, R., Laparra, V., Malo, J.: What you hear is what you see: audio quality from image quality metrics. In: Proc. Int. Conf. Digital Audio Effects (DAFx) (2023)"},{"key":"23_CR10","unstructured":"Namgyal, T., Hepburn, A., Santos-Rodriguez, R., Laparra, V., Malo, J.: Data is overrated: perceptual metrics can lead learning in the absence of training data. arXiv preprint arXiv:2312.03455 (2023)"},{"issue":"8","key":"23_CR11","doi-asserted-by":"publisher","first-page":"819","DOI":"10.1038\/90526","volume":"4","author":"O Schwartz","year":"2001","unstructured":"Schwartz, O., Simoncelli, E.P.: Natural signal statistics and sensory gain control. Nat. Neurosci. 4(8), 819\u2013825 (2001)","journal-title":"Nat. Neurosci."},{"issue":"2","key":"23_CR12","doi-asserted-by":"publisher","first-page":"147","DOI":"10.1080\/09298215.2014.894533","volume":"43","author":"BL Sturm","year":"2014","unstructured":"Sturm, B.L.: The state of the art ten years after a state of the art: Future research in music information retrieval. J. New Music Res. 43(2), 147\u2013172 (2014)","journal-title":"J. New Music Res."},{"key":"23_CR13","unstructured":"Tzanetakis, G., Essl, G., Cook, P.: Automatic musical genre classification of audio signals. In: International Symposium on Music Information Retrieval (ISMIR) (2001)"},{"key":"23_CR14","unstructured":"Vinay, A., Lerch, A.: Evaluating generative audio systems and their metrics. In: Proc. Int. Soc. Music Information Retrieval (ISMIR) (2022)"},{"key":"23_CR15","unstructured":"Wang, Z., Simoncelli, E.P., Bovik, A.C.: Multiscale structural similarity for image quality assessment. In: Asilomar Conf. Signals, Systems & Computers (2003)"},{"issue":"4","key":"23_CR16","doi-asserted-by":"publisher","first-page":"600","DOI":"10.1109\/TIP.2003.819861","volume":"13","author":"Z Wang","year":"2004","unstructured":"Wang, Z., Bovik, A.C., Sheikh, H.R., Simoncelli, E.P.: Image quality assessment: from error visibility to structural similarity. IEEE Trans. Image Process. 13(4), 600\u2013612 (2004)","journal-title":"IEEE Trans. Image Process."},{"issue":"2","key":"23_CR17","doi-asserted-by":"publisher","first-page":"1025","DOI":"10.1152\/physrev.00011.2022","volume":"103","author":"BDB Willmore","year":"2023","unstructured":"Willmore, B.D.B., King, A.J.: Adaptation in auditory processing. Physiol. Rev. 103(2), 1025\u20131058 (2023)","journal-title":"Physiol. Rev."}],"container-title":["Communications in Computer and Information Science","Machine Learning and Principles and Practice of Knowledge Discovery in Databases"],"original-title":[],"language":"en","link":[{"URL":"https:\/\/link.springer.com\/content\/pdf\/10.1007\/978-3-032-25305-7_23","content-type":"unspecified","content-version":"vor","intended-application":"similarity-checking"}],"deposited":{"date-parts":[[2026,5,8]],"date-time":"2026-05-08T19:58:43Z","timestamp":1778270323000},"score":1,"resource":{"primary":{"URL":"https:\/\/link.springer.com\/10.1007\/978-3-032-25305-7_23"}},"subtitle":[],"short-title":[],"issued":{"date-parts":[[2026]]},"ISBN":["9783032253040","9783032253057"],"references-count":17,"URL":"https:\/\/doi.org\/10.1007\/978-3-032-25305-7_23","relation":{},"ISSN":["1865-0929","1865-0937"],"issn-type":[{"value":"1865-0929","type":"print"},{"value":"1865-0937","type":"electronic"}],"subject":[],"published":{"date-parts":[[2026]]},"assertion":[{"value":"9 May 2026","order":1,"name":"first_online","label":"First Online","group":{"name":"ChapterHistory","label":"Chapter History"}},{"value":"The authors have no competing interests to declare that are relevant to the content of this article.","order":1,"name":"Ethics","group":{"name":"EthicsHeading","label":"Disclosure of Funding"}},{"value":"ECML PKDD","order":1,"name":"conference_acronym","label":"Conference Acronym","group":{"name":"ConferenceInfo","label":"Conference Information"}},{"value":"Joint European Conference on Machine Learning and Knowledge Discovery in Databases","order":2,"name":"conference_name","label":"Conference Name","group":{"name":"ConferenceInfo","label":"Conference Information"}},{"value":"Vilnius","order":3,"name":"conference_city","label":"Conference City","group":{"name":"ConferenceInfo","label":"Conference Information"}},{"value":"Lithuania","order":4,"name":"conference_country","label":"Conference Country","group":{"name":"ConferenceInfo","label":"Conference Information"}},{"value":"2024","order":5,"name":"conference_year","label":"Conference Year","group":{"name":"ConferenceInfo","label":"Conference Information"}},{"value":"8 September 2024","order":7,"name":"conference_start_date","label":"Conference Start Date","group":{"name":"ConferenceInfo","label":"Conference Information"}},{"value":"12 September 2024","order":8,"name":"conference_end_date","label":"Conference End Date","group":{"name":"ConferenceInfo","label":"Conference Information"}},{"value":"24","order":9,"name":"conference_number","label":"Conference Number","group":{"name":"ConferenceInfo","label":"Conference Information"}},{"value":"ecml2024","order":10,"name":"conference_id","label":"Conference ID","group":{"name":"ConferenceInfo","label":"Conference Information"}},{"value":"https:\/\/2024.ecmlpkdd.org\/","order":11,"name":"conference_url","label":"Conference URL","group":{"name":"ConferenceInfo","label":"Conference Information"}}]}}