{"status":"ok","message-type":"work","message-version":"1.0.0","message":{"indexed":{"date-parts":[[2024,10,29]],"date-time":"2024-10-29T19:42:39Z","timestamp":1730230959063,"version":"3.28.0"},"reference-count":20,"publisher":"IEEE","license":[{"start":{"date-parts":[[2020,5,1]],"date-time":"2020-05-01T00:00:00Z","timestamp":1588291200000},"content-version":"stm-asf","delay-in-days":0,"URL":"https:\/\/doi.org\/10.15223\/policy-029"},{"start":{"date-parts":[[2020,5,1]],"date-time":"2020-05-01T00:00:00Z","timestamp":1588291200000},"content-version":"stm-asf","delay-in-days":0,"URL":"https:\/\/doi.org\/10.15223\/policy-037"}],"content-domain":{"domain":[],"crossmark-restriction":false},"short-container-title":[],"published-print":{"date-parts":[[2020,5]]},"DOI":"10.1109\/icassp40776.2020.9053577","type":"proceedings-article","created":{"date-parts":[[2020,4,9]],"date-time":"2020-04-09T20:21:13Z","timestamp":1586463673000},"page":"7449-7453","source":"Crossref","is-referenced-by-count":6,"title":["Multi-Task Learning for Voice Trigger Detection"],"prefix":"10.1109","author":[{"given":"Siddharth","family":"Sigtia","sequence":"first","affiliation":[{"name":"Apple"}]},{"given":"Pascal","family":"Clark","sequence":"additional","affiliation":[{"name":"Apple"}]},{"given":"Rob","family":"Haynes","sequence":"additional","affiliation":[{"name":"Apple"}]},{"given":"Hywel","family":"Richards","sequence":"additional","affiliation":[{"name":"Apple"}]},{"given":"John","family":"Bridle","sequence":"additional","affiliation":[{"name":"Apple"}]}],"member":"263","reference":[{"key":"ref10","doi-asserted-by":"publisher","DOI":"10.21437\/Interspeech.2019-1662"},{"key":"ref11","article-title":"Convolutional Neural Networks for Small-Footprint Keyword Spotting","author":"sainath","year":"2015","journal-title":"Sixteenth Annual Conference of the International Speech Communication Association"},{"key":"ref12","article-title":"Convolutional Recurrent Neural Networks for Small-Footprint Keyword Spotting","author":"arik","year":"2017","journal-title":"TERSPEECH"},{"key":"ref13","doi-asserted-by":"publisher","DOI":"10.21437\/Interspeech.2019-1766"},{"key":"ref14","article-title":"A Cascade Architecture for Keyword Spotting on Mobile Devices","author":"gruenstein","year":"2017","journal-title":"arXiv preprint arXiv 1712 03603"},{"key":"ref15","doi-asserted-by":"publisher","DOI":"10.1109\/ICASSP.2018.8462227"},{"key":"ref16","doi-asserted-by":"publisher","DOI":"10.1145\/1143844.1143891"},{"key":"ref17","doi-asserted-by":"crossref","DOI":"10.23915\/distill.00008","article-title":"Sequence Modeling with CTC","author":"hannun","year":"2017","journal-title":"Distillation"},{"key":"ref18","article-title":"Online Keyword Spotting with a Character-level Recurrent Neural Network","author":"hwang","year":"2015","journal-title":"arXiv preprint arXiv 1512 00327"},{"key":"ref19","doi-asserted-by":"crossref","first-page":"41","DOI":"10.1023\/A:1007379606734","article-title":"Multitask Learning","volume":"28","author":"caruana","year":"1997","journal-title":"Machine Learning"},{"key":"ref4","doi-asserted-by":"publisher","DOI":"10.1109\/ICASSP.2014.6854370"},{"key":"ref3","doi-asserted-by":"publisher","DOI":"10.21437\/Interspeech.2018-2204"},{"key":"ref6","doi-asserted-by":"publisher","DOI":"10.21437\/Interspeech.2019-3006"},{"key":"ref5","doi-asserted-by":"crossref","first-page":"252","DOI":"10.1109\/ASRU.2017.8268943","article-title":"Direct Modeling of Raw Audio with DNNs for Wake Word Detection","author":"kumatani","year":"2017","journal-title":"Automatic Speech Recognition and Understanding (ASRU) 2017 IEEE Workshop on"},{"key":"ref8","first-page":"220","article-title":"An Application of Recurrent Neural Networks to Discriminative Keyword Spotting","author":"fern\u00e1ndez","year":"2007","journal-title":"International Conference on Artificial Neural Networks"},{"key":"ref7","doi-asserted-by":"publisher","DOI":"10.21437\/Interspeech.2019-1363"},{"year":"2017","key":"ref2","article-title":"Hey Siri: An On-device DNN-powered Voice Trigger for Apples Personal Assistant"},{"year":"2018","key":"ref1","article-title":"Optimizing Siri on HomePod in FarField Settings"},{"key":"ref9","article-title":"Streaming Small-Footprint Keyword Spotting using Sequence-to-Sequence Models","author":"he","year":"2017","journal-title":"Proc IEEE Workshop Automatic Speech Recognition and Understanding (ASRU)"},{"key":"ref20","first-page":"1223","article-title":"Large Scale Distributed Deep Networks","author":"dean","year":"2012","journal-title":"Advances in neural information processing systems"}],"event":{"name":"ICASSP 2020 - 2020 IEEE International Conference on Acoustics, Speech and Signal Processing (ICASSP)","start":{"date-parts":[[2020,5,4]]},"location":"Barcelona, Spain","end":{"date-parts":[[2020,5,8]]}},"container-title":["ICASSP 2020 - 2020 IEEE International Conference on Acoustics, Speech and Signal Processing (ICASSP)"],"original-title":[],"link":[{"URL":"http:\/\/xplorestaging.ieee.org\/ielx7\/9040208\/9052899\/09053577.pdf?arnumber=9053577","content-type":"unspecified","content-version":"vor","intended-application":"similarity-checking"}],"deposited":{"date-parts":[[2022,8,2]],"date-time":"2022-08-02T23:57:27Z","timestamp":1659484647000},"score":1,"resource":{"primary":{"URL":"https:\/\/ieeexplore.ieee.org\/document\/9053577\/"}},"subtitle":[],"short-title":[],"issued":{"date-parts":[[2020,5]]},"references-count":20,"URL":"https:\/\/doi.org\/10.1109\/icassp40776.2020.9053577","relation":{},"subject":[],"published":{"date-parts":[[2020,5]]}}}