{"status":"ok","message-type":"work","message-version":"1.0.0","message":{"indexed":{"date-parts":[[2026,2,8]],"date-time":"2026-02-08T05:53:00Z","timestamp":1770529980656,"version":"3.49.0"},"reference-count":47,"publisher":"Institute of Electrical and Electronics Engineers (IEEE)","license":[{"start":{"date-parts":[[2023,1,1]],"date-time":"2023-01-01T00:00:00Z","timestamp":1672531200000},"content-version":"vor","delay-in-days":0,"URL":"https:\/\/ieeexplore.ieee.org\/Xplorehelp\/downloads\/license-information\/IEEE.html"},{"start":{"date-parts":[[2023,1,1]],"date-time":"2023-01-01T00:00:00Z","timestamp":1672531200000},"content-version":"stm-asf","delay-in-days":0,"URL":"https:\/\/doi.org\/10.15223\/policy-029"},{"start":{"date-parts":[[2023,1,1]],"date-time":"2023-01-01T00:00:00Z","timestamp":1672531200000},"content-version":"stm-asf","delay-in-days":0,"URL":"https:\/\/doi.org\/10.15223\/policy-037"}],"content-domain":{"domain":[],"crossmark-restriction":false},"short-container-title":["IEEE\/ACM Trans. Audio Speech Lang. Process."],"published-print":{"date-parts":[[2023]]},"DOI":"10.1109\/taslp.2023.3284523","type":"journal-article","created":{"date-parts":[[2023,6,13]],"date-time":"2023-06-13T17:21:10Z","timestamp":1686676870000},"page":"2437-2447","source":"Crossref","is-referenced-by-count":10,"title":["Multilingual Customized Keyword Spotting Using Similar-Pair Contrastive Learning"],"prefix":"10.1109","volume":"31","author":[{"ORCID":"https:\/\/orcid.org\/0000-0001-7456-6486","authenticated-orcid":false,"given":"Lei","family":"Lei","sequence":"first","affiliation":[{"name":"Institute of Microelectronics, Chinese Academy of Sciences, Beijing, China"}]},{"given":"Guoshun","family":"Yuan","sequence":"additional","affiliation":[{"name":"Institute of Microelectronics, Chinese Academy of Sciences, Beijing, China"}]},{"given":"Hongjiang","family":"Yu","sequence":"additional","affiliation":[{"name":"Institute of Microelectronics, Chinese Academy of Sciences, Beijing, China"}]},{"given":"Dewei","family":"Kong","sequence":"additional","affiliation":[{"name":"Institute of Microelectronics, Chinese Academy of Sciences, Beijing, China"}]},{"given":"Yuefeng","family":"He","sequence":"additional","affiliation":[{"name":"Institute of Microelectronics, Chinese Academy of Sciences, Beijing, China"}]}],"member":"263","reference":[{"key":"ref1","doi-asserted-by":"publisher","DOI":"10.21437\/Interspeech.2007-174"},{"key":"ref2","doi-asserted-by":"publisher","DOI":"10.1109\/ASRU.2009.5373341"},{"key":"ref3","doi-asserted-by":"publisher","DOI":"10.1109\/ASRU.2009.5372889"},{"key":"ref4","doi-asserted-by":"publisher","DOI":"10.1109\/ASRU.2009.5372931"},{"key":"ref5","doi-asserted-by":"publisher","DOI":"10.1109\/ICASSP.2015.7178970"},{"key":"ref6","article-title":"Donut: Ctc-based query-by-example keyword spotting","author":"Lugosch","year":"2018"},{"key":"ref7","doi-asserted-by":"publisher","DOI":"10.21437\/interspeech.2020-1186"},{"key":"ref8","doi-asserted-by":"publisher","DOI":"10.1109\/ICSP51882.2021.9408857"},{"key":"ref9","doi-asserted-by":"publisher","DOI":"10.21437\/Interspeech.2020-1242"},{"key":"ref10","article-title":"Self-supervised audio representation learning for mobile devices","author":"Tagliasacchi","year":"2022"},{"key":"ref11","doi-asserted-by":"publisher","DOI":"10.1109\/IJCNN52387.2021.9534474"},{"key":"ref12","doi-asserted-by":"publisher","DOI":"10.1109\/ICASSP39728.2021.9413528"},{"key":"ref13","doi-asserted-by":"publisher","DOI":"10.1109\/ICASSP.2018.8461684"},{"key":"ref14","doi-asserted-by":"publisher","DOI":"10.21437\/Interspeech.2019-1846"},{"key":"ref15","doi-asserted-by":"publisher","DOI":"10.1109\/JSTSP.2017.2759726"},{"key":"ref16","doi-asserted-by":"publisher","DOI":"10.1109\/ICASSP39728.2021.9414156"},{"key":"ref17","doi-asserted-by":"publisher","DOI":"10.48550\/arXiv.1310.4546"},{"key":"ref18","first-page":"9912","article-title":"Unsupervised learning of visual features by contrasting cluster assignments","volume-title":"Proc. Adv. Neural Inf. Process. Syst.","author":"Caron","year":"2020"},{"key":"ref19","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR42600.2020.00975"},{"key":"ref20","doi-asserted-by":"publisher","DOI":"10.5555\/3524938.3525087"},{"key":"ref21","doi-asserted-by":"publisher","DOI":"10.18653\/v1\/2021.naacl-main.280"},{"key":"ref22","article-title":"Cert: Contrastive self-supervised learning for language understanding","author":"Fang","year":"2020"},{"key":"ref23","doi-asserted-by":"publisher","DOI":"10.18653\/v1\/2021.acl-long.72"},{"key":"ref24","doi-asserted-by":"publisher","DOI":"10.1109\/ICASSP.2015.7179087"},{"issue":"1","key":"ref25","first-page":"1","article-title":"Mel frequency cepstral coefficients for music modeling","volume-title":"Proc. Int. Symp. Music Inf. Retrieval","volume":"270","author":"Logan","year":"2000"},{"key":"ref26","article-title":"Rigid-motion scattering for texture classification","author":"Sifre","year":"2014"},{"key":"ref27","doi-asserted-by":"publisher","DOI":"10.1109\/ICTA50426.2020.9332057"},{"key":"ref28","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR.2018.00745"},{"key":"ref29","doi-asserted-by":"publisher","DOI":"10.5555\/3045118.3045167"},{"key":"ref30","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR.2018.00474"},{"key":"ref31","doi-asserted-by":"publisher","DOI":"10.1109\/ICCV48922.2021.00009"},{"key":"ref32","doi-asserted-by":"publisher","DOI":"10.21437\/interspeech.2020-3015"},{"key":"ref33","article-title":"Rethinking attention with performers","volume-title":"Proc. Int. Conf. Learn. Representations","author":"Choromanski","year":"2021"},{"key":"ref34","article-title":"Speech commands: A dataset for limited-vocabulary speech recognition","author":"Warden","year":"2018"},{"key":"ref35","article-title":"Jakobovski\/free-spoken-digit-dataset: V1.0.8","author":"Jackson","year":"2018"},{"key":"ref36","article-title":"Digit spoken hindi indianenglish","author":"Aiswarya","year":"2021"},{"key":"ref37","article-title":"kadazan digits","author":"Humayun","year":"2018"},{"key":"ref38","doi-asserted-by":"publisher","DOI":"10.1109\/ICASSP.2015.7178964"},{"key":"ref39","doi-asserted-by":"publisher","DOI":"10.21437\/Interspeech.2019-1363"},{"key":"ref40","doi-asserted-by":"publisher","DOI":"10.1109\/LSP.2017.2657381"},{"key":"ref41","first-page":"8026","article-title":"Pytorch: An imperative style, high-performance deep learning library","volume-title":"Proc. Adv. Neural Inf. Process. Syst.","volume":"32","author":"Paszke","year":"2019"},{"key":"ref42","article-title":"Adam: A method for stochastic optimization","author":"Kingma","year":"2014"},{"key":"ref44","doi-asserted-by":"publisher","DOI":"10.21437\/Eurospeech.1997-504"},{"issue":"11","key":"ref45","article-title":"Visualizing data using t-sne journal of machine learning research","volume":"9","author":"Maaten","year":"2008","journal-title":"J. Mach. Learn. Res."},{"key":"ref46","first-page":"6105","article-title":"Efficientnet: Rethinking model scaling for convolutional neural networks","volume-title":"Proc. Int. Conf. Mach. Learn.","author":"Tan","year":"2019"},{"key":"ref47","doi-asserted-by":"publisher","DOI":"10.5555\/3495724.3497510"},{"key":"ref48","first-page":"9929","article-title":"Understanding contrastive representation learning through alignment and uniformity on the hypersphere","volume-title":"Proc. Int. Conf. Mach. Learn.","author":"Wang","year":"2020"}],"container-title":["IEEE\/ACM Transactions on Audio, Speech, and Language Processing"],"original-title":[],"link":[{"URL":"http:\/\/xplorestaging.ieee.org\/ielx7\/6570655\/9970249\/10149452.pdf?arnumber=10149452","content-type":"unspecified","content-version":"vor","intended-application":"similarity-checking"}],"deposited":{"date-parts":[[2024,4,12]],"date-time":"2024-04-12T06:37:24Z","timestamp":1712903844000},"score":1,"resource":{"primary":{"URL":"https:\/\/ieeexplore.ieee.org\/document\/10149452\/"}},"subtitle":[],"short-title":[],"issued":{"date-parts":[[2023]]},"references-count":47,"URL":"https:\/\/doi.org\/10.1109\/taslp.2023.3284523","relation":{},"ISSN":["2329-9290","2329-9304"],"issn-type":[{"value":"2329-9290","type":"print"},{"value":"2329-9304","type":"electronic"}],"subject":[],"published":{"date-parts":[[2023]]}}}