{"status":"ok","message-type":"work","message-version":"1.0.0","message":{"indexed":{"date-parts":[[2024,10,23]],"date-time":"2024-10-23T01:55:59Z","timestamp":1729648559780,"version":"3.28.0"},"reference-count":20,"publisher":"IEEE","license":[{"start":{"date-parts":[[2020,7,1]],"date-time":"2020-07-01T00:00:00Z","timestamp":1593561600000},"content-version":"vor","delay-in-days":0,"URL":"https:\/\/ieeexplore.ieee.org\/Xplorehelp\/downloads\/license-information\/IEEE.html"},{"start":{"date-parts":[[2020,7,1]],"date-time":"2020-07-01T00:00:00Z","timestamp":1593561600000},"content-version":"stm-asf","delay-in-days":0,"URL":"https:\/\/doi.org\/10.15223\/policy-029"},{"start":{"date-parts":[[2020,7,1]],"date-time":"2020-07-01T00:00:00Z","timestamp":1593561600000},"content-version":"stm-asf","delay-in-days":0,"URL":"https:\/\/doi.org\/10.15223\/policy-037"}],"content-domain":{"domain":[],"crossmark-restriction":false},"short-container-title":[],"published-print":{"date-parts":[[2020,7]]},"DOI":"10.1109\/spcom50965.2020.9179600","type":"proceedings-article","created":{"date-parts":[[2020,8,28]],"date-time":"2020-08-28T20:20:46Z","timestamp":1598646046000},"page":"1-5","source":"Crossref","is-referenced-by-count":5,"title":["End-to-end audio-scene classification from raw audio: Multi time-frequency resolution CNN architecture for efficient representation learning"],"prefix":"10.1109","author":[{"given":"T. Vijaya","family":"Kumar","sequence":"first","affiliation":[]},{"given":"R. Shunmuga","family":"Sundar","sequence":"additional","affiliation":[]},{"given":"Tilak","family":"Purohit","sequence":"additional","affiliation":[]},{"given":"V.","family":"Ramasubramanian","sequence":"additional","affiliation":[]}],"member":"263","reference":[{"key":"ref10","article-title":"Learning environmental sounds with end-toend convolutional neural network","author":"tokozume","year":"2017","journal-title":"Proc ICASSP &#x2019;17"},{"key":"ref11","first-page":"220","article-title":"Sample-level deep convolutional neural networks for music auto-tagging using raw waveforms","author":"lee","year":"2016","journal-title":"Proceedings of the Sound and Music Computing Conference"},{"key":"ref12","doi-asserted-by":"publisher","DOI":"10.3390\/app8010150"},{"key":"ref13","article-title":"Multi-temporal resolution convolutional neural networks for acoustic scene classification","author":"schindler","year":"2017","journal-title":"Detection and Classification of Acoustic Scenes and Events"},{"key":"ref14","doi-asserted-by":"publisher","DOI":"10.1109\/IJCNN.2018.8489641"},{"key":"ref15","doi-asserted-by":"publisher","DOI":"10.1007\/978-3-030-00767-6_49"},{"key":"ref16","article-title":"Going Deeper with Convolutions","author":"szegedy","year":"2014","journal-title":"Proc CVPR"},{"key":"ref17","article-title":"Acoustic scene classification by ensemble of spectrograms based on adaptive temporal divisions","author":"sakashita","year":"2018","journal-title":"2018 Detection and Classification of Acoustic Scenes and Events"},{"year":"0","key":"ref18"},{"journal-title":"Proceedings of the Detection and Classification of Acoustic Scenes and Events 2018 Workshop (DCASE2018)","year":"2018","author":"plumbley","key":"ref19"},{"key":"ref4","doi-asserted-by":"publisher","DOI":"10.1109\/TPAMI.2013.50"},{"key":"ref3","doi-asserted-by":"publisher","DOI":"10.1162\/neco.1989.1.4.541"},{"key":"ref6","doi-asserted-by":"publisher","DOI":"10.1109\/TASLP.2014.2339736"},{"key":"ref5","first-page":"8490","volume":"60","author":"krizhevsky","year":"2017","journal-title":"ImageNet Classification with Deep Convolutional Neural Networks"},{"key":"ref8","article-title":"Learning the speech front-end with raw waveform CLDNNs","author":"sainath","year":"2015","journal-title":"Proc of INTERSPEECH'15"},{"key":"ref7","doi-asserted-by":"crossref","DOI":"10.21437\/Interspeech.2015-3","article-title":"Analysis of CNN based speech recognition system using raw speech as input","author":"palaz","year":"2015","journal-title":"Proc Interspeech &#x2019;15"},{"year":"0","key":"ref2"},{"year":"0","key":"ref1"},{"key":"ref9","doi-asserted-by":"publisher","DOI":"10.1109\/ICASSP.2017.7952190"},{"journal-title":"Discrete Time Speech Signal Processing","year":"2002","author":"quatieri","key":"ref20"}],"event":{"name":"2020 International Conference on Signal Processing and Communications (SPCOM)","start":{"date-parts":[[2020,7,19]]},"location":"Bangalore, India","end":{"date-parts":[[2020,7,24]]}},"container-title":["2020 International Conference on Signal Processing and Communications (SPCOM)"],"original-title":[],"link":[{"URL":"http:\/\/xplorestaging.ieee.org\/ielx7\/9176988\/9179490\/09179600.pdf?arnumber=9179600","content-type":"unspecified","content-version":"vor","intended-application":"similarity-checking"}],"deposited":{"date-parts":[[2022,11,10]],"date-time":"2022-11-10T22:51:25Z","timestamp":1668120685000},"score":1,"resource":{"primary":{"URL":"https:\/\/ieeexplore.ieee.org\/document\/9179600\/"}},"subtitle":[],"short-title":[],"issued":{"date-parts":[[2020,7]]},"references-count":20,"URL":"https:\/\/doi.org\/10.1109\/spcom50965.2020.9179600","relation":{},"subject":[],"published":{"date-parts":[[2020,7]]}}}