{"status":"ok","message-type":"work","message-version":"1.0.0","message":{"indexed":{"date-parts":[[2026,3,7]],"date-time":"2026-03-07T18:02:33Z","timestamp":1772906553080,"version":"3.50.1"},"reference-count":40,"publisher":"Institute of Electrical and Electronics Engineers (IEEE)","issue":"3","license":[{"start":{"date-parts":[[2010,3,1]],"date-time":"2010-03-01T00:00:00Z","timestamp":1267401600000},"content-version":"vor","delay-in-days":0,"URL":"https:\/\/ieeexplore.ieee.org\/Xplorehelp\/downloads\/license-information\/IEEE.html"}],"content-domain":{"domain":[],"crossmark-restriction":false},"short-container-title":["IEEE Trans. Audio Speech Lang. Process."],"published-print":{"date-parts":[[2010,3]]},"DOI":"10.1109\/tasl.2009.2025099","type":"journal-article","created":{"date-parts":[[2010,2,16]],"date-time":"2010-02-16T16:07:44Z","timestamp":1266336464000},"page":"434-446","source":"Crossref","is-referenced-by-count":24,"title":["Audio Signal Representations for Indexing in the Transform Domain"],"prefix":"10.1109","volume":"18","author":[{"given":"Emmanuel","family":"Ravelli","sequence":"first","affiliation":[],"role":[{"role":"author","vocabulary":"crossref"}]},{"given":"Ga\u00ebl","family":"Richard","sequence":"additional","affiliation":[],"role":[{"role":"author","vocabulary":"crossref"}]},{"given":"Laurent","family":"Daudet","sequence":"additional","affiliation":[],"role":[{"role":"author","vocabulary":"crossref"}]}],"member":"263","reference":[{"key":"ref39","author":"hainsworth","year":"2004","journal-title":"Techniques for the Automated Analysis of Musical Audio"},{"key":"ref38","year":"2008","journal-title":"FAAC and FAAD webpage"},{"key":"ref33","first-page":"92","article-title":"estimating the tonality of polyphonic audio files: cognitive versus machine learning modelling strategies","author":"gomez","year":"2004","journal-title":"Proc 5th ISMIR"},{"key":"ref32","first-page":"96","article-title":"musical key extraction from audio","author":"pauws","year":"2004","journal-title":"Proc 5th ISMIR"},{"key":"ref31","doi-asserted-by":"publisher","DOI":"10.1109\/LSP.2004.827951"},{"key":"ref30","year":"1995","journal-title":"Digital Audio Compression Standard (AC-3)"},{"key":"ref37","year":"2008","journal-title":"libMAD Mpeg audio decoder webpage"},{"key":"ref36","doi-asserted-by":"publisher","DOI":"10.1109\/TASL.2007.910786"},{"key":"ref35","first-page":"1","article-title":"improving timbre similarity: how high is the sky?","volume":"1","author":"pachet","year":"2004","journal-title":"J Negative Results Speech Audio Sci"},{"key":"ref34","doi-asserted-by":"publisher","DOI":"10.1109\/TASSP.1980.1163420"},{"key":"ref10","first-page":"185","article-title":"chord segmentation and recognition using em-trained hidden markov models","author":"sheh","year":"2003","journal-title":"Proc Int Conf Music Inf Retrieval"},{"key":"ref40","article-title":"automatic chord identification using a quantized chromagram","author":"harte","year":"2005","journal-title":"Proc 118th AES Conv"},{"key":"ref11","first-page":"304","article-title":"a robust mid-level representation for harmonic content in music signals","author":"bello","year":"2005","journal-title":"Proc Int Conf Music Inf Retrieval"},{"key":"ref12","doi-asserted-by":"publisher","DOI":"10.1109\/TASL.2007.914399"},{"key":"ref13","doi-asserted-by":"publisher","DOI":"10.1109\/TSA.2002.800560"},{"key":"ref14","doi-asserted-by":"publisher","DOI":"10.1007\/s10994-006-9019-7"},{"key":"ref15","doi-asserted-by":"publisher","DOI":"10.1109\/TASL.2007.909434"},{"key":"ref16","doi-asserted-by":"crossref","first-page":"373","DOI":"10.1117\/12.234776","article-title":"audio characterization for video indexing","author":"patel","year":"1996","journal-title":"Proc SPIE"},{"key":"ref17","doi-asserted-by":"publisher","DOI":"10.1109\/MMCS.1997.609787"},{"key":"ref18","doi-asserted-by":"publisher","DOI":"10.1109\/ICASSP.1999.757473"},{"key":"ref19","first-page":"2437","article-title":"content-based methods for the management of digital music","volume":"6","author":"pye","year":"2000","journal-title":"Proc IEEE Int Conf Acoust Speech Signal Process"},{"key":"ref28","year":"2008","journal-title":"Nero Aac Codec webpage"},{"key":"ref4","year":"1998","journal-title":"Report on the MPEG-2 AAC Stereo Verification Tests"},{"key":"ref27","year":"2008","journal-title":"LAME mp3 encoder webpage"},{"key":"ref3","year":"2001","journal-title":"Information technologyCoding of audio-visual objectsPart 3 Audio"},{"key":"ref6","doi-asserted-by":"publisher","DOI":"10.1076\/jnmr.30.1.39.7119"},{"key":"ref29","year":"2008","journal-title":"Apple iTunes 7 Webpage"},{"key":"ref5","doi-asserted-by":"publisher","DOI":"10.1121\/1.421129"},{"key":"ref8","doi-asserted-by":"publisher","DOI":"10.1109\/TASL.2006.885257"},{"key":"ref7","doi-asserted-by":"publisher","DOI":"10.1109\/TSA.2005.854090"},{"key":"ref2","year":"1998","journal-title":"Information TechnologyGeneric Coding of Moving Pictures and Associated Audio InformationPart 3 Audio"},{"key":"ref9","first-page":"464","article-title":"realtime chord recognition of musical sound: a system using common lisp music","author":"fujishima","year":"1999","journal-title":"Proc Int Comput Music Conf"},{"key":"ref1","year":"1992","journal-title":"Information TechnologyCoding of Moving Pictures and Associated Audio for Digital Storage Media at Up to About 1 5 Mbit\/sPart 3 Audio"},{"key":"ref20","first-page":"761","article-title":"sound analysis using mpeg compressed audio","volume":"2","author":"tzanetakis","year":"2000","journal-title":"Proc IEEE Int Conf Acoust Speech Signal Process"},{"key":"ref22","first-page":"261","article-title":"automatic music summarization in compressed domain","volume":"4","author":"shao","year":"2004","journal-title":"Proc IEEE Int Conf Acoust Speech Signal Process"},{"key":"ref21","doi-asserted-by":"publisher","DOI":"10.1145\/500170.500172"},{"key":"ref24","doi-asserted-by":"publisher","DOI":"10.1162\/comj.2008.32.1.71"},{"key":"ref23","doi-asserted-by":"publisher","DOI":"10.1109\/TSA.2005.857573"},{"key":"ref26","doi-asserted-by":"publisher","DOI":"10.1109\/TASL.2008.2004290"},{"key":"ref25","author":"pfeiffer","year":"2001","journal-title":"Formalization of MPEG-1 compressed domain audio features"}],"container-title":["IEEE Transactions on Audio, Speech, and Language Processing"],"original-title":[],"link":[{"URL":"http:\/\/xplorestaging.ieee.org\/ielx5\/10376\/5410050\/05410060.pdf?arnumber=5410060","content-type":"unspecified","content-version":"vor","intended-application":"similarity-checking"}],"deposited":{"date-parts":[[2021,10,10]],"date-time":"2021-10-10T23:51:17Z","timestamp":1633909877000},"score":1,"resource":{"primary":{"URL":"http:\/\/ieeexplore.ieee.org\/document\/5410060\/"}},"subtitle":[],"short-title":[],"issued":{"date-parts":[[2010,3]]},"references-count":40,"journal-issue":{"issue":"3"},"URL":"https:\/\/doi.org\/10.1109\/tasl.2009.2025099","relation":{},"ISSN":["1558-7916","1558-7924"],"issn-type":[{"value":"1558-7916","type":"print"},{"value":"1558-7924","type":"electronic"}],"subject":[],"published":{"date-parts":[[2010,3]]}}}