{"status":"ok","message-type":"work","message-version":"1.0.0","message":{"indexed":{"date-parts":[[2024,10,30]],"date-time":"2024-10-30T16:02:16Z","timestamp":1730304136541,"version":"3.28.0"},"reference-count":32,"publisher":"IEEE","license":[{"start":{"date-parts":[[2021,10,17]],"date-time":"2021-10-17T00:00:00Z","timestamp":1634428800000},"content-version":"stm-asf","delay-in-days":0,"URL":"https:\/\/doi.org\/10.15223\/policy-029"},{"start":{"date-parts":[[2021,10,17]],"date-time":"2021-10-17T00:00:00Z","timestamp":1634428800000},"content-version":"stm-asf","delay-in-days":0,"URL":"https:\/\/doi.org\/10.15223\/policy-037"}],"content-domain":{"domain":[],"crossmark-restriction":false},"short-container-title":[],"published-print":{"date-parts":[[2021,10,17]]},"DOI":"10.1109\/waspaa52581.2021.9632708","type":"proceedings-article","created":{"date-parts":[[2021,12,13]],"date-time":"2021-12-13T16:12:28Z","timestamp":1639411948000},"page":"191-195","source":"Crossref","is-referenced-by-count":1,"title":["A Multi-Head Relevance Weighting Framework for Learning Raw Waveform Audio Representations"],"prefix":"10.1109","author":[{"given":"Debottam","family":"Dutta","sequence":"first","affiliation":[{"name":"Learning and Extraction of Acoustic Patterns (LEAP) Lab, Indian Institute of Science,Bangalore,560012"}]},{"given":"Purvi","family":"Agrawal","sequence":"additional","affiliation":[{"name":"Microsoft India Development Center,Hyderabad,India"}]},{"given":"Sriram","family":"Ganapathy","sequence":"additional","affiliation":[{"name":"Learning and Extraction of Acoustic Patterns (LEAP) Lab, Indian Institute of Science,Bangalore,560012"}]}],"member":"263","reference":[{"key":"ref32","first-page":"8024","article-title":"Pytorch: An imperative style, high-performance deep learning library","author":"paszke","year":"2019","journal-title":"Advances in neural information processing systems"},{"key":"ref31","article-title":"Very deep convolutional networks for large-scale image recognition","author":"simonyan","year":"0","journal-title":"Proc of ICLR"},{"key":"ref30","volume":"abs 2011 1447","author":"hu","year":"2020","journal-title":"A two-stage approach to device-robust acoustic scene classification"},{"key":"ref10","doi-asserted-by":"publisher","DOI":"10.21437\/Interspeech.2019-1873"},{"key":"ref11","doi-asserted-by":"publisher","DOI":"10.1109\/TASLP.2019.2915167"},{"key":"ref12","article-title":"Leaf: A learnable frontend for audio classification","author":"zeghidour","year":"0","journal-title":"ICLRE"},{"key":"ref13","doi-asserted-by":"publisher","DOI":"10.1109\/TASLP.2020.3030489"},{"key":"ref14","first-page":"3451","article-title":"Unsupervised raw waveform representation learning for ASR","year":"0","journal-title":"InterSpeech"},{"key":"ref15","doi-asserted-by":"publisher","DOI":"10.1109\/JSTSP.2019.2913965"},{"journal-title":"Neural representation learning for speech and audio signals","year":"2021","author":"agrawal","key":"ref16"},{"key":"ref17","first-page":"9","article-title":"A multi -device dataset for urban acoustic scene classification","author":"mesaros","year":"0","journal-title":"Proceedings of DCASE2018"},{"key":"ref18","doi-asserted-by":"publisher","DOI":"10.1145\/2647868.2655045"},{"key":"ref19","doi-asserted-by":"publisher","DOI":"10.1109\/SLT.2018.8639585"},{"key":"ref28","doi-asserted-by":"publisher","DOI":"10.1109\/ICASSP40776.2020.9053582"},{"key":"ref4","first-page":"1597","article-title":"A simple framework for contrastive learning of visual representations","author":"chen","year":"0","journal-title":"Proc of ICML"},{"key":"ref27","doi-asserted-by":"publisher","DOI":"10.21437\/Interspeech.2019-2680"},{"key":"ref3","article-title":"Efficient estimation of word representations in vector space","author":"mikolov","year":"2013","journal-title":"ArXiv Preprint"},{"key":"ref6","doi-asserted-by":"publisher","DOI":"10.2307\/1417526"},{"key":"ref29","volume":"abs 1710 9412","author":"zhang","year":"2017","journal-title":"mixup Beyond empirical risk minimization"},{"key":"ref5","doi-asserted-by":"publisher","DOI":"10.1109\/ASRU.2013.6707746"},{"key":"ref8","doi-asserted-by":"publisher","DOI":"10.21437\/Interspeech.2019-2652"},{"key":"ref7","article-title":"Acoustic modeling with deep neural networks using raw time signal for LVCSR","author":"t\u00fcske","year":"0","journal-title":"Proc of Interspeech"},{"key":"ref2","doi-asserted-by":"publisher","DOI":"10.1109\/TPAMI.2013.50"},{"key":"ref9","doi-asserted-by":"publisher","DOI":"10.1121\/1.5001926"},{"key":"ref1","doi-asserted-by":"crossref","first-page":"436","DOI":"10.1038\/nature14539","article-title":"Deep learning","volume":"521","author":"lecun","year":"2015","journal-title":"Nature"},{"key":"ref20","doi-asserted-by":"publisher","DOI":"10.1109\/ICASSP.2015.7178847"},{"key":"ref22","article-title":"Interpretable convolutional filters with SincNet","author":"ravanelli","year":"0","journal-title":"Proceedings of Neural Information Processing Systems (NIPS)"},{"key":"ref21","doi-asserted-by":"publisher","DOI":"10.1109\/ICASSP.2018.8462015"},{"key":"ref24","doi-asserted-by":"publisher","DOI":"10.1162\/neco.1994.6.2.181"},{"key":"ref23","doi-asserted-by":"publisher","DOI":"10.1162\/neco.1991.3.1.79"},{"key":"ref26","doi-asserted-by":"publisher","DOI":"10.1109\/ICASSP40776.2020.9053274"},{"key":"ref25","article-title":"Attention is all you need","volume":"abs 1706 3762","author":"vaswani","year":"2017","journal-title":"CoRR"}],"event":{"name":"2021 IEEE Workshop on Applications of Signal Processing to Audio and Acoustics (WASPAA)","start":{"date-parts":[[2021,10,17]]},"location":"New Paltz, NY, USA","end":{"date-parts":[[2021,10,20]]}},"container-title":["2021 IEEE Workshop on Applications of Signal Processing to Audio and Acoustics (WASPAA)"],"original-title":[],"link":[{"URL":"http:\/\/xplorestaging.ieee.org\/ielx7\/9632687\/9632666\/09632708.pdf?arnumber=9632708","content-type":"unspecified","content-version":"vor","intended-application":"similarity-checking"}],"deposited":{"date-parts":[[2022,8,2]],"date-time":"2022-08-02T19:57:43Z","timestamp":1659470263000},"score":1,"resource":{"primary":{"URL":"https:\/\/ieeexplore.ieee.org\/document\/9632708\/"}},"subtitle":[],"short-title":[],"issued":{"date-parts":[[2021,10,17]]},"references-count":32,"URL":"https:\/\/doi.org\/10.1109\/waspaa52581.2021.9632708","relation":{},"subject":[],"published":{"date-parts":[[2021,10,17]]}}}