{"status":"ok","message-type":"work","message-version":"1.0.0","message":{"indexed":{"date-parts":[[2026,3,5]],"date-time":"2026-03-05T16:08:01Z","timestamp":1772726881220,"version":"3.50.1"},"reference-count":19,"publisher":"IEEE","content-domain":{"domain":[],"crossmark-restriction":false},"short-container-title":[],"published-print":{"date-parts":[[2018,4]]},"DOI":"10.1109\/icassp.2018.8462062","type":"proceedings-article","created":{"date-parts":[[2018,9,21]],"date-time":"2018-09-21T22:24:48Z","timestamp":1537568688000},"page":"2491-2495","source":"Crossref","is-referenced-by-count":13,"title":["Eventness: Object Detection on Spectrograms for Temporal Localization of Audio Events"],"prefix":"10.1109","author":[{"given":"Phuong","family":"Pham","sequence":"first","affiliation":[]},{"given":"Juncheng","family":"Li","sequence":"additional","affiliation":[]},{"given":"Joseph","family":"Szurley","sequence":"additional","affiliation":[]},{"given":"Samarjit","family":"Das","sequence":"additional","affiliation":[]}],"member":"263","reference":[{"key":"ref10","first-page":"1","article-title":"An exemplar-based NMF approach to audio event detection","author":"gemmeke","year":"2013","journal-title":"Proc of the IEEE Workshop on Applications of Signal Process to Audio and Acoustics (WASPAA)"},{"key":"ref11","doi-asserted-by":"publisher","DOI":"10.1109\/TASLP.2014.2367814"},{"key":"ref12","article-title":"Learning environmental sounds with end-to-end convolutional neural network","author":"tokozume","year":"2017","journal-title":"IEEE SigPort"},{"key":"ref13","first-page":"1041","article-title":"A dataset and taxonomy for urban sound research","volume":"2014","author":"salamon","year":"0","journal-title":"Proc ACM Int Conf Multimedia (ACM MM)"},{"key":"ref14","article-title":"DCASE 2017 challenge setup: tasks, datasets and baseline system","author":"mesaros","year":"2017","journal-title":"Proc of the Detection and Classification of Acoustic Scenes and Events Workshop (DCASE)"},{"key":"ref15","doi-asserted-by":"publisher","DOI":"10.1109\/LSP.2010.2100380"},{"key":"ref16","article-title":"Fast R-CNN","author":"girshick","year":"2015","journal-title":"Proc of the Int Conf on Computer Vision (ICCV)"},{"key":"ref17","doi-asserted-by":"publisher","DOI":"10.1109\/EUSIPCO.2016.7760424"},{"key":"ref18","article-title":"Audio set: An ontology and human-labeled dataset for audio events","author":"gemmeke","year":"2017","journal-title":"Proc of the IEEE Int Conf on Acoustics Speech and Signal Process (ICASSP)"},{"key":"ref19","first-page":"2017","article-title":"Spatial transformer networks","author":"jaderberg","year":"2015","journal-title":"Advances in Neural Information Processing Systems (NIPS)"},{"key":"ref4","first-page":"779","article-title":"You only look once: Unified, real-time object detection","author":"redmon","year":"2016","journal-title":"Proc of the IEEE Conf on Computer Vision and Pattern Recognition (CVPR)"},{"key":"ref3","article-title":"Faster R-CNN: Towards real-time object detection with region proposal networks","author":"ren","year":"2015","journal-title":"Advances in Neural Information Processing Systems (NIPS)"},{"key":"ref6","first-page":"1","article-title":"Environmental sound classification with convolutional neural networks","author":"piczak","year":"2015","journal-title":"Proc of the IEEE Int Workshop on Machine Learning for Signal Process (MLSP)"},{"key":"ref5","doi-asserted-by":"publisher","DOI":"10.21437\/Interspeech.2016-805"},{"key":"ref8","first-page":"1","article-title":"Polyphonic sound event detection using multi label deep neural networks","author":"cakir","year":"2015","journal-title":"Proc of the IEEE Int Joint Conf on Neural Networks (IJCNN)"},{"key":"ref7","first-page":"3704","article-title":"A bag-of-features approach to acoustic event detection","author":"plinge","year":"2014","journal-title":"Proc of the IEEE Int Conf on Acoustics Speech and Signal Process (ICASSP)"},{"key":"ref2","article-title":"Scalable, high-quality object detection","author":"szegedy","year":"2015","journal-title":"Tech Rep"},{"key":"ref1","first-page":"580","article-title":"Rich feature hierarchies for accurate object detection and semantic segmentation","author":"girshick","year":"2014","journal-title":"Proc of the IEEE Conf on Computer Vision and Pattern Recognition (CVPR)"},{"key":"ref9","first-page":"1267","article-title":"Acoustic event detection in real life recordings","author":"mesaros","year":"2010","journal-title":"Proc of European Signal Process Conf"}],"event":{"name":"ICASSP 2018 - 2018 IEEE International Conference on Acoustics, Speech and Signal Processing (ICASSP)","location":"Calgary, AB","start":{"date-parts":[[2018,4,15]]},"end":{"date-parts":[[2018,4,20]]}},"container-title":["2018 IEEE International Conference on Acoustics, Speech and Signal Processing (ICASSP)"],"original-title":[],"link":[{"URL":"http:\/\/xplorestaging.ieee.org\/ielx7\/8450881\/8461260\/08462062.pdf?arnumber=8462062","content-type":"unspecified","content-version":"vor","intended-application":"similarity-checking"}],"deposited":{"date-parts":[[2020,8,24]],"date-time":"2020-08-24T05:31:46Z","timestamp":1598247106000},"score":1,"resource":{"primary":{"URL":"https:\/\/ieeexplore.ieee.org\/document\/8462062\/"}},"subtitle":[],"short-title":[],"issued":{"date-parts":[[2018,4]]},"references-count":19,"URL":"https:\/\/doi.org\/10.1109\/icassp.2018.8462062","relation":{},"subject":[],"published":{"date-parts":[[2018,4]]}}}