{"status":"ok","message-type":"work","message-version":"1.0.0","message":{"indexed":{"date-parts":[[2025,10,27]],"date-time":"2025-10-27T20:43:49Z","timestamp":1761597829218,"version":"3.28.0"},"reference-count":34,"publisher":"IEEE","content-domain":{"domain":[],"crossmark-restriction":false},"short-container-title":[],"published-print":{"date-parts":[[2017,3]]},"DOI":"10.1109\/icassp.2017.7952133","type":"proceedings-article","created":{"date-parts":[[2017,6,20]],"date-time":"2017-06-20T17:35:36Z","timestamp":1497980136000},"page":"136-140","source":"Crossref","is-referenced-by-count":8,"title":["CNN-LTE: A class of 1-X pooling convolutional neural networks on label tree embeddings for audio scene classification"],"prefix":"10.1109","author":[{"given":"Huy","family":"Phan","sequence":"first","affiliation":[],"role":[{"role":"author","vocabulary":"crossref"}]},{"given":"Philipp","family":"Koch","sequence":"additional","affiliation":[],"role":[{"role":"author","vocabulary":"crossref"}]},{"given":"Lars","family":"Hertel","sequence":"additional","affiliation":[],"role":[{"role":"author","vocabulary":"crossref"}]},{"given":"Marco","family":"Maass","sequence":"additional","affiliation":[],"role":[{"role":"author","vocabulary":"crossref"}]},{"given":"Radoslaw","family":"Mazur","sequence":"additional","affiliation":[],"role":[{"role":"author","vocabulary":"crossref"}]},{"given":"Alfred","family":"Mertins","sequence":"additional","affiliation":[],"role":[{"role":"author","vocabulary":"crossref"}]}],"member":"263","reference":[{"key":"ref33","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR.2008.4587756"},{"year":"0","key":"ref32"},{"key":"ref31","first-page":"1","article-title":"Adam: a method for stochastic optimization","author":"kingma","year":"2015","journal-title":"Proc of the Int Conf on Learning Representations (ICLR)"},{"key":"ref30","first-page":"1929","article-title":"Dropout: A simple way to prevent neural networks from overfitting","volume":"15","author":"srivastava","year":"2014","journal-title":"Journal of Machine Learning Research (JMLR)"},{"key":"ref34","doi-asserted-by":"publisher","DOI":"10.1109\/EUSIPCO.2015.7362846"},{"key":"ref10","first-page":"142","article-title":"Histogram of gradients of time-frequency representations for audio scene classification","volume":"23","author":"rakotomamonjy","year":"2015","journal-title":"IEEE\/ACM Trans Audio Speech and Language Processing"},{"key":"ref11","first-page":"107","article-title":"Noise-robust environmental sound classification method based on combination of ICA and MP features","volume":"2","author":"mogi","year":"2013","journal-title":"Artificial Intelligence Research"},{"key":"ref12","doi-asserted-by":"publisher","DOI":"10.1121\/1.2750160"},{"key":"ref13","doi-asserted-by":"publisher","DOI":"10.1109\/WASPAA.2013.6701893"},{"key":"ref14","doi-asserted-by":"publisher","DOI":"10.1109\/ICASSP.2016.7472918"},{"key":"ref15","doi-asserted-by":"publisher","DOI":"10.1145\/2964284.2967268"},{"key":"ref16","doi-asserted-by":"publisher","DOI":"10.1109\/TSA.2005.854103"},{"key":"ref17","doi-asserted-by":"publisher","DOI":"10.1109\/EUSIPCO.2016.7760424"},{"key":"ref18","doi-asserted-by":"publisher","DOI":"10.1109\/TASL.2009.2017438"},{"key":"ref19","doi-asserted-by":"publisher","DOI":"10.1109\/EUSIPCO.2015.7362358"},{"key":"ref28","doi-asserted-by":"publisher","DOI":"10.1145\/2766462.2767830"},{"key":"ref4","first-page":"1272","article-title":"Audio context recognition using audio event histogram","author":"heittola","year":"2010","journal-title":"Proc EUSIPCO"},{"key":"ref27","doi-asserted-by":"publisher","DOI":"10.3115\/v1\/D14-1181"},{"key":"ref3","doi-asserted-by":"publisher","DOI":"10.1109\/MSP.2014.2326181"},{"key":"ref6","doi-asserted-by":"publisher","DOI":"10.1109\/ICASSP.2014.6855206"},{"key":"ref29","first-page":"111","article-title":"A theoretical analysis of feature pooling in visual recognition","author":"boureau","year":"2010","journal-title":"Proc ICML"},{"key":"ref5","doi-asserted-by":"publisher","DOI":"10.1109\/TMM.2008.921739"},{"key":"ref8","doi-asserted-by":"publisher","DOI":"10.1109\/WASPAA.2013.6701890"},{"key":"ref7","doi-asserted-by":"publisher","DOI":"10.1145\/2733373.2806389"},{"key":"ref2","doi-asserted-by":"publisher","DOI":"10.1109\/TMM.2015.2428998"},{"key":"ref9","doi-asserted-by":"publisher","DOI":"10.1109\/TMM.2012.2199972"},{"key":"ref1","doi-asserted-by":"publisher","DOI":"10.1109\/9780470043387"},{"key":"ref20","doi-asserted-by":"publisher","DOI":"10.1023\/A:1010933404324"},{"key":"ref22","first-page":"3441","article-title":"Representing nonspeech audio signals through speech classification models","author":"phan","year":"2015","journal-title":"Proc INTERSPEECH"},{"journal-title":"Gammatone-like Spectrograms","year":"2009","author":"ellis","key":"ref21"},{"key":"ref24","doi-asserted-by":"publisher","DOI":"10.1109\/89.928915"},{"key":"ref23","doi-asserted-by":"publisher","DOI":"10.1109\/TASLP.2014.2367814"},{"key":"ref26","doi-asserted-by":"publisher","DOI":"10.21437\/Interspeech.2016-123"},{"key":"ref25","first-page":"315","article-title":"Deep sparse rectifier neural networks","author":"glorot","year":"2011","journal-title":"Proc Int Conf Artificial Intelligence and Statistics (AISTATS)"}],"event":{"name":"2017 IEEE International Conference on Acoustics, Speech and Signal Processing (ICASSP)","start":{"date-parts":[[2017,3,5]]},"location":"New Orleans, LA","end":{"date-parts":[[2017,3,9]]}},"container-title":["2017 IEEE International Conference on Acoustics, Speech and Signal Processing (ICASSP)"],"original-title":[],"link":[{"URL":"http:\/\/xplorestaging.ieee.org\/ielx7\/7943262\/7951776\/07952133.pdf?arnumber=7952133","content-type":"unspecified","content-version":"vor","intended-application":"similarity-checking"}],"deposited":{"date-parts":[[2017,8,29]],"date-time":"2017-08-29T14:46:15Z","timestamp":1504017975000},"score":1,"resource":{"primary":{"URL":"http:\/\/ieeexplore.ieee.org\/document\/7952133\/"}},"subtitle":[],"short-title":[],"issued":{"date-parts":[[2017,3]]},"references-count":34,"URL":"https:\/\/doi.org\/10.1109\/icassp.2017.7952133","relation":{},"subject":[],"published":{"date-parts":[[2017,3]]}}}