{"status":"ok","message-type":"work","message-version":"1.0.0","message":{"indexed":{"date-parts":[[2025,3,25]],"date-time":"2025-03-25T14:42:51Z","timestamp":1742913771659,"version":"3.40.3"},"publisher-location":"Cham","reference-count":26,"publisher":"Springer International Publishing","isbn-type":[{"type":"print","value":"9783030200541"},{"type":"electronic","value":"9783030200558"}],"license":[{"start":{"date-parts":[[2019,5,1]],"date-time":"2019-05-01T00:00:00Z","timestamp":1556668800000},"content-version":"tdm","delay-in-days":0,"URL":"http:\/\/www.springer.com\/tdm"}],"content-domain":{"domain":["link.springer.com"],"crossmark-restriction":false},"short-container-title":[],"published-print":{"date-parts":[[2020]]},"DOI":"10.1007\/978-3-030-20055-8_26","type":"book-chapter","created":{"date-parts":[[2019,4,30]],"date-time":"2019-04-30T13:16:38Z","timestamp":1556630198000},"page":"273-280","update-policy":"https:\/\/doi.org\/10.1007\/springer_crossmark_policy","source":"Crossref","is-referenced-by-count":3,"title":["Prototypical Metric Transfer Learning for Continuous Speech Keyword Spotting with Limited Training Data"],"prefix":"10.1007","author":[{"given":"Harshita","family":"Seth","sequence":"first","affiliation":[]},{"given":"Pulkit","family":"Kumar","sequence":"additional","affiliation":[]},{"given":"Muktabh Mayank","family":"Srivastava","sequence":"additional","affiliation":[]}],"member":"297","published-online":{"date-parts":[[2019,5,1]]},"reference":[{"key":"26_CR1","doi-asserted-by":"crossref","unstructured":"Sainath, T.N., Parada, C.: Convolutional neural networks for small-footprint keyword spotting. In: Interspeech (2015)","DOI":"10.21437\/Interspeech.2015-352"},{"key":"26_CR2","unstructured":"Tang, R., Lin, J.: Honk: a PyTorch reimplementation of convolutional neural networks for keyword spotting. arXiv preprint arXiv:1710.06554 , 18 October 2017"},{"key":"26_CR3","unstructured":"Hannun, A., Case, C., Casper, J., Catanzaro, B., Diamos, G., Elsen, E., Prenger, R., Satheesh, S., Sengupta, S., Coates, A., Ng, A.Y.: Deep speech: scaling up end-to-end speech recognition. arXiv preprint arXiv:1412.5567 , 17 December 2014"},{"key":"26_CR4","unstructured":"Snell, J., Swersky, K., Zemel, R.: Prototypical networks for few-shot learning. In: Advances in Neural Information Processing Systems, pp. 4077\u20134087 (2017)"},{"key":"26_CR5","doi-asserted-by":"publisher","first-page":"84","DOI":"10.1007\/978-3-319-24261-3_7","volume-title":"Similarity-Based Pattern Recognition","author":"Elad Hoffer","year":"2015","unstructured":"Hoffer, E., Ailon, N.: Deep metric learning using triplet network. In: International Workshop on Similarity-Based Pattern Recognition, vol. 12, pp. 84\u201392. Springer, Cham (2015)"},{"key":"26_CR6","doi-asserted-by":"crossref","unstructured":"Weintraub, M.: Keyword-spotting using SRI\u2019s DECIPHER large-vocabulary speech-recognition system. In: 1993 IEEE International Conference on Acoustics, Speech, and Signal Processing 1993, ICASSP 1993, vol. 2, pp. 463\u2013466. IEEE, 27 April 1993","DOI":"10.1109\/ICASSP.1993.319341"},{"issue":"11","key":"26_CR7","doi-asserted-by":"publisher","first-page":"1870","DOI":"10.1109\/29.103088","volume":"38","author":"JG Wilpon","year":"1990","unstructured":"Wilpon, J.G., Rabiner, L.R., Lee, C.H., Goldman, E.R.: Automatic recognition of keywords in unconstrained speech using hidden Markov models. IEEE Transact. Acoust. Speech Sig. Proc. 38(11), 1870\u20131878 (1990)","journal-title":"IEEE Transact. Acoust. Speech Sig. Proc."},{"key":"26_CR8","unstructured":"Rose, R.C., Paul, D.B.: A hidden Markov model based keyword recognition system. In: 1990 International Conference on Acoustics, Speech, and Signal Processing 1990, ICASSP 1990, pp. 129\u2013132. IEEE, 3 April 1990"},{"issue":"4","key":"26_CR9","first-page":"665","volume":"18","author":"J Nouza","year":"2009","unstructured":"Nouza, J., Silovsky, J.: Fast keyword spotting in telephone speech. Radioengineering 18(4), 665\u201370 (2009)","journal-title":"Radioengineering"},{"key":"26_CR10","unstructured":"Lee, H., Pham, P., Largman, Y., Ng, A.Y.: Unsupervised feature learning for audio classification using convolutional deep belief networks. In: Advances in Neural Information Processing Systems, pp. 1096\u20131104 (2009)"},{"issue":"1","key":"26_CR11","doi-asserted-by":"publisher","first-page":"14","DOI":"10.1109\/TASL.2011.2109382","volume":"20","author":"AR Mohamed","year":"2012","unstructured":"Mohamed, A.R., Dahl, G.E., Hinton, G.: Acoustic modeling using deep belief networks. IEEE Trans. Audio Speech Lang. Process. 20(1), 14\u201322 (2012)","journal-title":"IEEE Trans. Audio Speech Lang. Process."},{"key":"26_CR12","unstructured":"Grosse, R., Raina, R., Kwong, H., Ng, A.Y.: Shift-invariance sparse coding for audio classification. arXiv preprint arXiv:1206.5241 , 20 June 2012"},{"issue":"6","key":"26_CR13","doi-asserted-by":"publisher","first-page":"82","DOI":"10.1109\/MSP.2012.2205597","volume":"29","author":"G Hinton","year":"2012","unstructured":"Hinton, G., Deng, L., Yu, D., Dahl, G.E., Mohamed, A.R., Jaitly, N., Senior, A., Vanhoucke, V., Nguyen, P., Sainath, T.N., Kingsbury, B.: Deep neural networks for acoustic modeling in speech recognition: the shared views of four research groups. IEEE Signal Process. Mag. 29(6), 82\u201397 (2012)","journal-title":"IEEE Signal Process. Mag."},{"issue":"1","key":"26_CR14","doi-asserted-by":"publisher","first-page":"30","DOI":"10.1109\/TASL.2011.2134090","volume":"20","author":"GE Dahl","year":"2012","unstructured":"Dahl, G.E., Yu, D., Deng, L., Acero, A.: Context-dependent pre-trained deep neural networks for large-vocabulary speech recognition. IEEE Transact. Audio Speech Lang. Process. 20(1), 30\u201342 (2012)","journal-title":"IEEE Transact. Audio Speech Lang. Process."},{"key":"26_CR15","doi-asserted-by":"crossref","unstructured":"Li, K.P., Naylor, J.A., Rossen, M.L.: A whole word recurrent neural network for keyword spotting. In: 1992 IEEE International Conference on Acoustics, Speech, and Signal Processing 1992, ICASSP 1992, vol. 2, pp. 81\u201384. IEEE, 23 March 1992","DOI":"10.1109\/ICASSP.1992.226115"},{"key":"26_CR16","first-page":"220","volume-title":"Lecture Notes in Computer Science","author":"Santiago Fern\u00e1ndez","year":"2007","unstructured":"Fern\u00e1ndez, S., Graves, A., Schmidhuber, J.: An application of recurrent neural networks to discriminative keyword spotting. In: International Conference on Artificial Neural Networks, vol. 9, pp. 220\u2013229. Springer, Heidelberg, September 2007"},{"key":"26_CR17","doi-asserted-by":"crossref","unstructured":"Chen, G., Parada, C., Heigold, G.: Small-footprint keyword spotting using deep neural networks. In: ICASSP, vol. 14, pp. 4087\u20134091, 4 May 2014","DOI":"10.1109\/ICASSP.2014.6854370"},{"key":"26_CR18","doi-asserted-by":"crossref","unstructured":"Pons, J., Serr\u00e1, J., Serra, X.: Training neural audio classifiers with few data. arXiv preprint arXiv:1810.10274 , 24 October 2018","DOI":"10.1109\/ICASSP.2019.8682591"},{"key":"26_CR19","unstructured":"Vinyals, O., Blundell, C., Lillicrap, T., Wierstra, D.: Matching networks for one shot learning. In: Advances in Neural Information Processing Systems, pp. 3630\u20133638 (2016)"},{"key":"26_CR20","doi-asserted-by":"crossref","unstructured":"Kunze, J., Kirsch, L., Kurenkov, I., Krug, A., Johannsmeier, J., Stober, S.: Transfer learning for speech recognition on a budget. arXiv preprint arXiv:1706.00290 , 1 June 2017","DOI":"10.18653\/v1\/W17-2620"},{"key":"26_CR21","unstructured":"Choi, K., Fazekas, G., Sandler, M., Cho, K.: Transfer learning for music classification and regression tasks. arXiv preprint arXiv:1703.09179 , 27 March 2017"},{"key":"26_CR22","doi-asserted-by":"crossref","unstructured":"He, K., Zhang, X., Ren, S., Sun, J.: Deep residual learning for image recognition. In: Proceedings of the IEEE Conference on Computer Vision and Pattern Recognition, pp. 770\u2013778 (2016)","DOI":"10.1109\/CVPR.2016.90"},{"key":"26_CR23","unstructured":"Honk: A PyTorch Reimplementation of Convolutional Neural Networks for Keyword Spotting. https:\/\/github.com\/castorini\/honk"},{"key":"26_CR24","unstructured":"Rohlicek, J.R., Russell, W., Roukos, S., Gish, H.: Continuous hidden Markov modeling for speaker-independent word spotting. In: 1989 International Conference on Acoustics, Speech, and Signal Processing 1989, ICASSP 1989, pp. 627\u2013630. IEEE, 23 May 1989"},{"key":"26_CR25","doi-asserted-by":"crossref","unstructured":"Wilpon, J.G., Miller, L.G., Modi, P.: Improvements and applications for key word recognition using hidden Markov modeling techniques. In: 1991 International Conference on Acoustics, Speech, and Signal Processing 1991, ICASSP 1991, pp. 309\u2013312. IEEE, 14 April 1991","DOI":"10.1109\/ICASSP.1991.150338"},{"key":"26_CR26","unstructured":"Silaghi, M.C., Bourlard, H.: Iterative posterior-based keyword spotting without filler models. In: Proceedings of the IEEE Automatic Speech Recognition and Understanding Workshop, pp. 213\u2013216, 12 December 1999"}],"container-title":["Advances in Intelligent Systems and Computing","14th International Conference on Soft Computing Models in Industrial and Environmental Applications (SOCO 2019)"],"original-title":[],"language":"en","link":[{"URL":"http:\/\/link.springer.com\/content\/pdf\/10.1007\/978-3-030-20055-8_26","content-type":"unspecified","content-version":"vor","intended-application":"similarity-checking"}],"deposited":{"date-parts":[[2022,9,17]],"date-time":"2022-09-17T04:50:51Z","timestamp":1663390251000},"score":1,"resource":{"primary":{"URL":"http:\/\/link.springer.com\/10.1007\/978-3-030-20055-8_26"}},"subtitle":[],"short-title":[],"issued":{"date-parts":[[2019,5,1]]},"ISBN":["9783030200541","9783030200558"],"references-count":26,"URL":"https:\/\/doi.org\/10.1007\/978-3-030-20055-8_26","relation":{},"ISSN":["2194-5357","2194-5365"],"issn-type":[{"type":"print","value":"2194-5357"},{"type":"electronic","value":"2194-5365"}],"subject":[],"published":{"date-parts":[[2019,5,1]]},"assertion":[{"value":"1 May 2019","order":1,"name":"first_online","label":"First Online","group":{"name":"ChapterHistory","label":"Chapter History"}},{"value":"SOCO","order":1,"name":"conference_acronym","label":"Conference Acronym","group":{"name":"ConferenceInfo","label":"Conference Information"}},{"value":"International Workshop on Soft Computing Models in Industrial and Environmental Applications","order":2,"name":"conference_name","label":"Conference Name","group":{"name":"ConferenceInfo","label":"Conference Information"}},{"value":"Seville","order":3,"name":"conference_city","label":"Conference City","group":{"name":"ConferenceInfo","label":"Conference Information"}},{"value":"Spain","order":4,"name":"conference_country","label":"Conference Country","group":{"name":"ConferenceInfo","label":"Conference Information"}},{"value":"2019","order":5,"name":"conference_year","label":"Conference Year","group":{"name":"ConferenceInfo","label":"Conference Information"}},{"value":"13 May 2019","order":7,"name":"conference_start_date","label":"Conference Start Date","group":{"name":"ConferenceInfo","label":"Conference Information"}},{"value":"15 May 2019","order":8,"name":"conference_end_date","label":"Conference End Date","group":{"name":"ConferenceInfo","label":"Conference Information"}},{"value":"14","order":9,"name":"conference_number","label":"Conference Number","group":{"name":"ConferenceInfo","label":"Conference Information"}},{"value":"socomoin2019","order":10,"name":"conference_id","label":"Conference ID","group":{"name":"ConferenceInfo","label":"Conference Information"}},{"value":"http:\/\/2019.sococonference.eu\/","order":11,"name":"conference_url","label":"Conference URL","group":{"name":"ConferenceInfo","label":"Conference Information"}}]}}