{"status":"ok","message-type":"work","message-version":"1.0.0","message":{"indexed":{"date-parts":[[2025,11,19]],"date-time":"2025-11-19T07:00:24Z","timestamp":1763535624106,"version":"3.28.0"},"reference-count":41,"publisher":"IEEE","content-domain":{"domain":[],"crossmark-restriction":false},"short-container-title":[],"published-print":{"date-parts":[[2019,4]]},"DOI":"10.23919\/fruct.2019.8711906","type":"proceedings-article","created":{"date-parts":[[2019,5,13]],"date-time":"2019-05-13T23:07:46Z","timestamp":1557788866000},"page":"533-539","source":"Crossref","is-referenced-by-count":24,"title":["End-to-end Convolutional Neural Networks for Sound Event Detection in Urban Environments"],"prefix":"10.23919","author":[{"given":"Pablo","family":"Zinemanas","sequence":"first","affiliation":[]},{"given":"Pablo","family":"Cancela","sequence":"additional","affiliation":[]},{"given":"Martin","family":"Rocamora","sequence":"additional","affiliation":[]}],"member":"263","reference":[{"journal-title":"Keras","year":"2015","author":"chollet","key":"ref39"},{"journal-title":"librosa 0 4 1","year":"2015","author":"mcfee","key":"ref38"},{"key":"ref33","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR.2015.7298594"},{"key":"ref32","article-title":"Very deep convolutional networks for large-scale image recognition","volume":"abs 1409 1556","author":"simonyan","year":"2014","journal-title":"CoRR"},{"key":"ref31","first-page":"1097","article-title":"Imagenet classification with deep convolutional neural networks","author":"krizhevsky","year":"2012","journal-title":"Advances in Neural Information Processing Systems 25"},{"key":"ref30","article-title":"Learning features of music from scratch","author":"thickstun","year":"2017","journal-title":"5th International Conference on Learning Representations - ICLR 2017"},{"key":"ref37","doi-asserted-by":"publisher","DOI":"10.1109\/IJCNN.2018.8489470"},{"key":"ref36","doi-asserted-by":"publisher","DOI":"10.1109\/LSP.2018.2878620"},{"key":"ref35","doi-asserted-by":"publisher","DOI":"10.1109\/ICASSP.2017.7953242"},{"key":"ref34","article-title":"Utilizing domain knowledge in end-to-end audio processing","author":"tax","year":"2017","journal-title":"Neural Information Processing Systems (NIPS) Conference"},{"key":"ref10","article-title":"Acoustic scene and event recognition using recurrent neural networks","author":"vu","year":"2016","journal-title":"Detection and Classification of Acoustic Scenes and Events 2016"},{"journal-title":"B-cnn Branch convolutional neural network for hierarchical classification","year":"2017","author":"zhu","key":"ref40"},{"key":"ref11","article-title":"Dease 2016 sound event detection system based on convolutional neural network","author":"gorin","year":"2016","journal-title":"Detection and Classification of Acoustic Scenes and Events 2016"},{"key":"ref12","article-title":"Sound event detection in multichannel audio LSTM network","author":"zhou","year":"2017","journal-title":"Tech Rep DCASE2016 Challenge"},{"key":"ref13","doi-asserted-by":"publisher","DOI":"10.1109\/WASPAA.2017.8170052"},{"key":"ref14","article-title":"Audio event detection using multiple-input convolutional neural network","author":"jeong","year":"2017","journal-title":"Tech Rep DCASE2016 Challenge"},{"key":"ref15","doi-asserted-by":"publisher","DOI":"10.1109\/TASLP.2017.2690575"},{"key":"ref16","article-title":"A report on sound event detection with different binaural features","author":"adavanne","year":"2017","journal-title":"Detection and Classification of Acoustic Scenes and Events 2017"},{"key":"ref17","doi-asserted-by":"publisher","DOI":"10.1109\/EUSIPCO.2016.7760424"},{"key":"ref18","article-title":"Experimentation on the dcase challenge 2016: Task 1 - acoustic scene classification and task 3 - sound event detection in real life audio","author":"elizalde","year":"2016","journal-title":"Detection and Classification of Acoustic Scenes and Events 2016"},{"key":"ref19","article-title":"Deep neural network baseline for dcase challenge 2016","author":"kong","year":"2016","journal-title":"Detection and Classification of Acoustic Scenes and Events 2016"},{"key":"ref28","doi-asserted-by":"publisher","DOI":"10.1109\/ICASSP.2014.6854950"},{"key":"ref4","article-title":"The implementation of mems microphones for urban sound sensing","author":"mydlarz","year":"2014","journal-title":"Audio Engineering Society Convention 137"},{"key":"ref27","doi-asserted-by":"publisher","DOI":"10.3390\/app8010150"},{"key":"ref3","first-page":"2345","article-title":"The design and calibration of low cost urban acoustic sensing devices","author":"charlie mydlarz","year":"2015","journal-title":"EuroNoise 2015 European Acoustics Association"},{"key":"ref6","doi-asserted-by":"publisher","DOI":"10.1145\/2647868.2655045"},{"key":"ref29","article-title":"End-to-end learning for music audio tagging at scale","author":"pons","year":"2018","journal-title":"19th ISMIR Conference"},{"key":"ref5","doi-asserted-by":"publisher","DOI":"10.1109\/ICASSP.2015.7177954"},{"journal-title":"Computational Analysis of Sound Scenes and Events","year":"2017","author":"virtanen","key":"ref8"},{"key":"ref7","doi-asserted-by":"publisher","DOI":"10.1109\/EUSIPCO.2015.7362478"},{"key":"ref2","first-page":"243","article-title":"The sensor city initiative: cognitive sensors for soundscape transformations","author":"daniel steele","year":"2013","journal-title":"Geoinformatics for City Transformations Technical University of Ostrava"},{"key":"ref9","article-title":"Sound event detection in multichannel audio using spatial and harmonic features","author":"adavanne","year":"2016","journal-title":"Detection and Classification of Acoustic Scenes and Events 2016"},{"journal-title":"Computational Analysis of Sound Scenes and Events","year":"2017","author":"bello","key":"ref1"},{"key":"ref20","article-title":"Sound Event Detection for Real Life Audio DCASE Challenge","author":"wei","year":"2016","journal-title":"Detection and Classification of Acoustic Scenes and Events 2016"},{"key":"ref22","article-title":"Bidirectional GRU for sound event detection","author":"lu","year":"2017","journal-title":"Tech Rep DCASE2016 Challenge"},{"key":"ref21","article-title":"Sound event detection from real-life audio by training a long short-term memory network with mono and stereo features","author":"wang","year":"2017","journal-title":"Tech Rep DCASE2016 Challenge"},{"key":"ref24","doi-asserted-by":"publisher","DOI":"10.21437\/Interspeech.2018-2414"},{"key":"ref41","doi-asserted-by":"publisher","DOI":"10.3390\/app6060162"},{"key":"ref23","article-title":"Acoustic modeling with deep neural networks using raw time signal for lvcsr","author":"tuske","year":"2014","journal-title":"INTER-SPEECH"},{"key":"ref26","doi-asserted-by":"publisher","DOI":"10.21437\/Odyssey.2018-47"},{"key":"ref25","doi-asserted-by":"publisher","DOI":"10.1007\/978-3-319-64680-0_5"}],"event":{"name":"2019 24th Conference of Open Innovations Association (FRUCT)","start":{"date-parts":[[2019,4,8]]},"location":"Moscow, Russia","end":{"date-parts":[[2019,4,12]]}},"container-title":["2019 24th Conference of Open Innovations Association (FRUCT)"],"original-title":[],"link":[{"URL":"http:\/\/xplorestaging.ieee.org\/ielx7\/8700165\/8711873\/08711906.pdf?arnumber=8711906","content-type":"unspecified","content-version":"vor","intended-application":"similarity-checking"}],"deposited":{"date-parts":[[2019,6,3]],"date-time":"2019-06-03T23:45:35Z","timestamp":1559605535000},"score":1,"resource":{"primary":{"URL":"https:\/\/ieeexplore.ieee.org\/document\/8711906\/"}},"subtitle":[],"short-title":[],"issued":{"date-parts":[[2019,4]]},"references-count":41,"URL":"https:\/\/doi.org\/10.23919\/fruct.2019.8711906","relation":{},"subject":[],"published":{"date-parts":[[2019,4]]}}}