{"status":"ok","message-type":"work","message-version":"1.0.0","message":{"indexed":{"date-parts":[[2025,10,25]],"date-time":"2025-10-25T12:29:15Z","timestamp":1761395355232,"version":"3.37.3"},"reference-count":55,"publisher":"Institute of Electrical and Electronics Engineers (IEEE)","issue":"6","license":[{"start":{"date-parts":[[2019,6,1]],"date-time":"2019-06-01T00:00:00Z","timestamp":1559347200000},"content-version":"vor","delay-in-days":0,"URL":"https:\/\/ieeexplore.ieee.org\/Xplorehelp\/downloads\/license-information\/IEEE.html"},{"start":{"date-parts":[[2019,6,1]],"date-time":"2019-06-01T00:00:00Z","timestamp":1559347200000},"content-version":"stm-asf","delay-in-days":0,"URL":"https:\/\/doi.org\/10.15223\/policy-029"},{"start":{"date-parts":[[2019,6,1]],"date-time":"2019-06-01T00:00:00Z","timestamp":1559347200000},"content-version":"stm-asf","delay-in-days":0,"URL":"https:\/\/doi.org\/10.15223\/policy-037"}],"funder":[{"name":"International Postgraduate Research Scholarship from the University of Western Australia"}],"content-domain":{"domain":[],"crossmark-restriction":false},"short-container-title":["IEEE Trans. Multimedia"],"published-print":{"date-parts":[[2019,6]]},"DOI":"10.1109\/tmm.2018.2879750","type":"journal-article","created":{"date-parts":[[2018,11,5]],"date-time":"2018-11-05T19:25:20Z","timestamp":1541445920000},"page":"1359-1371","source":"Crossref","is-referenced-by-count":38,"title":["Auxiliary Classifier Generative Adversarial Network With Soft Labels in Imbalanced Acoustic Event Detection"],"prefix":"10.1109","volume":"21","author":[{"ORCID":"https:\/\/orcid.org\/0000-0001-5277-6634","authenticated-orcid":false,"given":"Xianjun","family":"Xia","sequence":"first","affiliation":[]},{"ORCID":"https:\/\/orcid.org\/0000-0002-3778-4633","authenticated-orcid":false,"given":"Roberto","family":"Togneri","sequence":"additional","affiliation":[]},{"ORCID":"https:\/\/orcid.org\/0000-0003-1557-4907","authenticated-orcid":false,"given":"Ferdous","family":"Sohel","sequence":"additional","affiliation":[]},{"given":"Defeng","family":"Huang","sequence":"additional","affiliation":[]}],"member":"263","reference":[{"key":"ref39","doi-asserted-by":"publisher","DOI":"10.1109\/ICASSP.2018.8461845"},{"key":"ref38","first-page":"93","article-title":"Generative adversarial network based acoustic scene training set augmentation and selection using SVM hyper-plane","author":"mun","year":"0","journal-title":"Proc DCASE2017 Challenge"},{"article-title":"GANs trained by a two time-scale update rule converge to a Nash equilibrium","year":"2017","author":"heusel","key":"ref33"},{"key":"ref32","first-page":"2234","article-title":"Improved techniques for training GANs","author":"salimans","year":"0","journal-title":"Proc Int Conf Neural Inf Process"},{"key":"ref31","doi-asserted-by":"publisher","DOI":"10.1109\/WASPAA.2017.8170052"},{"key":"ref30","doi-asserted-by":"publisher","DOI":"10.1109\/LSP.2017.2657381"},{"article-title":"Data augmentation in classification using GaN","year":"2017","author":"zhu","key":"ref37"},{"article-title":"Data augmentation generative adversarial networks","year":"2017","author":"antoniou","key":"ref36"},{"article-title":"Unsupervised representation learning with deep convolutional generative adversarial networks","year":"2015","author":"radford","key":"ref35"},{"article-title":"Conditional image synthesis with auxiliary classifier GaNs","year":"2016","author":"odena","key":"ref34"},{"article-title":"Large-scale weakly supervised audio classification using gated convolutional neural network","year":"2017","author":"xu","key":"ref28"},{"key":"ref27","doi-asserted-by":"publisher","DOI":"10.1109\/TMM.2015.2482228"},{"article-title":"Deep convolutional neural networks and data augmentation for acoustic event detection","year":"2016","author":"takahashi","key":"ref29"},{"key":"ref2","doi-asserted-by":"publisher","DOI":"10.1109\/TMM.2014.2310706"},{"key":"ref1","doi-asserted-by":"publisher","DOI":"10.1109\/TMM.2014.2305632"},{"key":"ref20","first-page":"51","article-title":"Audio event detection using multiple-input convolutional neural network","author":"jeong","year":"0","journal-title":"Proc DCASE2017 Challenge"},{"key":"ref22","article-title":"A report on sound event detection with different binaural features","author":"adavanne","year":"0","journal-title":"Proc DCASE2017 Challenge"},{"key":"ref21","doi-asserted-by":"crossref","first-page":"1291","DOI":"10.1109\/TASLP.2017.2690575","article-title":"Convolutional recurrent neural networks for polyphonic sound event detection","volume":"25","author":"parascandolo","year":"2017","journal-title":"IEEE\/ACM Trans Audio Speech Lang Process"},{"key":"ref24","doi-asserted-by":"crossref","first-page":"354","DOI":"10.1016\/j.patcog.2017.10.013","article-title":"Recent advances in convolutional neural networks","volume":"77","author":"gu","year":"2017","journal-title":"Pattern Recognit"},{"key":"ref23","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR.2017.243"},{"article-title":"Google's neural machine translation system: Bridging the gap between human and machine translation","year":"2016","author":"wu","key":"ref26"},{"key":"ref25","doi-asserted-by":"publisher","DOI":"10.1109\/MSP.2012.2205597"},{"article-title":"Stochastic backpropagation and approximate inference in deep generative models","year":"2014","author":"rezende","key":"ref50"},{"article-title":"Improving variational inference with inverse autoregressive flow","year":"2016","author":"kingma","key":"ref51"},{"key":"ref55","article-title":"DCASE 2017 challenge setup: Tasks, datasets and baseline system","author":"heittola","year":"0","journal-title":"Proc DCASE2017 Challenge"},{"key":"ref54","doi-asserted-by":"publisher","DOI":"10.3390\/app6060162"},{"article-title":"Adam: A method for stochastic optimization","year":"2014","author":"kingma","key":"ref53"},{"key":"ref52","first-page":"807","article-title":"Rectified linear units improve restricted Boltzmann machines","author":"nair","year":"0","journal-title":"Proc 27th Int Conf Mach Learn"},{"key":"ref10","doi-asserted-by":"publisher","DOI":"10.1109\/WASPAA.2013.6701862"},{"key":"ref11","doi-asserted-by":"publisher","DOI":"10.1109\/ICASSP.2016.7472917"},{"article-title":"Conditional image synthesis with auxiliary classifier GANs","year":"2016","author":"odena","key":"ref40"},{"article-title":"Sound event detection in multichannel audio using spatial and harmonic features","year":"2017","author":"adavanne","key":"ref12"},{"key":"ref13","doi-asserted-by":"publisher","DOI":"10.1109\/ICASSP.2009.4959522"},{"key":"ref14","doi-asserted-by":"publisher","DOI":"10.1109\/TASLP.2014.2367814"},{"key":"ref15","doi-asserted-by":"publisher","DOI":"10.1109\/ICME.2017.8019418"},{"key":"ref16","doi-asserted-by":"publisher","DOI":"10.1109\/ICME.2017.8019452"},{"key":"ref17","article-title":"Acoustic event detection using signal enhancement and spectro-temporal feature extraction","author":"schr\u00f6der","year":"0","journal-title":"Proc IEEE Workshop Appl Signal Process Audio and Acoust"},{"key":"ref18","article-title":"Bidirectional GRU for sound event detection","author":"lu","year":"0","journal-title":"Proc DCASE2017 Challenge"},{"key":"ref19","doi-asserted-by":"publisher","DOI":"10.1109\/TMM.2016.2571999"},{"key":"ref4","doi-asserted-by":"publisher","DOI":"10.1109\/TMM.2015.2428998"},{"key":"ref3","doi-asserted-by":"publisher","DOI":"10.1007\/978-3-540-69568-4_29"},{"article-title":"A report on sound event detection with different binaural features","year":"2017","author":"adavanne","key":"ref6"},{"key":"ref5","article-title":"Proceedings of the detection and classification of acoustic scenes and events 2016 workshop","volume":"6","author":"virtanen","year":"0","journal-title":"Workshop on Detection and Classification of Acoustic Scenes and Events (DCASE)"},{"key":"ref8","doi-asserted-by":"publisher","DOI":"10.1109\/TMM.2015.2476658"},{"key":"ref7","doi-asserted-by":"publisher","DOI":"10.1109\/TMM.2016.2572000"},{"article-title":"Auto-encoding variational Bayes","year":"2013","author":"kingma","key":"ref49"},{"key":"ref9","doi-asserted-by":"publisher","DOI":"10.1109\/TMM.2018.2812605"},{"key":"ref46","first-page":"2672","article-title":"Generative adversarial nets","author":"goodfellow","year":"0","journal-title":"Proc Int Conf Neural Inf Process"},{"key":"ref45","doi-asserted-by":"publisher","DOI":"10.1007\/s10479-005-5724-z"},{"article-title":"Unsupervised representation learning with deep convolutional generative adversarial networks","year":"2015","author":"radford","key":"ref48"},{"key":"ref47","first-page":"1486","article-title":"Deep generative image models using a Laplacian pyramid of adversarial networks","author":"denton","year":"0","journal-title":"Proc Int Conf Neural Inf Process"},{"key":"ref42","doi-asserted-by":"publisher","DOI":"10.1016\/j.patcog.2018.03.025"},{"key":"ref41","first-page":"1","article-title":"Automatic event classification using front end single channel noise reduction, MFCC features and a support vector machine classifier","author":"nogueira","year":"0","journal-title":"IEEE AASP Challenge Detection and Classification of Acoustic Scenes and Events"},{"key":"ref44","first-page":"55","article-title":"FrameCNN: A weakly-supervised learning framework for frame-wise acoustic event detection and classification","volume":"14","author":"chou","year":"2017","journal-title":"ReCALL"},{"key":"ref43","doi-asserted-by":"publisher","DOI":"10.1109\/IJCNN.2015.7280624"}],"container-title":["IEEE Transactions on Multimedia"],"original-title":[],"link":[{"URL":"http:\/\/xplorestaging.ieee.org\/ielx7\/6046\/8720290\/08523637.pdf?arnumber=8523637","content-type":"unspecified","content-version":"vor","intended-application":"similarity-checking"}],"deposited":{"date-parts":[[2022,7,13]],"date-time":"2022-07-13T20:57:18Z","timestamp":1657745838000},"score":1,"resource":{"primary":{"URL":"https:\/\/ieeexplore.ieee.org\/document\/8523637\/"}},"subtitle":[],"short-title":[],"issued":{"date-parts":[[2019,6]]},"references-count":55,"journal-issue":{"issue":"6"},"URL":"https:\/\/doi.org\/10.1109\/tmm.2018.2879750","relation":{},"ISSN":["1520-9210","1941-0077"],"issn-type":[{"type":"print","value":"1520-9210"},{"type":"electronic","value":"1941-0077"}],"subject":[],"published":{"date-parts":[[2019,6]]}}}