{"status":"ok","message-type":"work","message-version":"1.0.0","message":{"indexed":{"date-parts":[[2025,2,21]],"date-time":"2025-02-21T01:15:41Z","timestamp":1740100541731,"version":"3.37.3"},"reference-count":29,"publisher":"IEEE","license":[{"start":{"date-parts":[[2021,12,13]],"date-time":"2021-12-13T00:00:00Z","timestamp":1639353600000},"content-version":"stm-asf","delay-in-days":0,"URL":"https:\/\/doi.org\/10.15223\/policy-029"},{"start":{"date-parts":[[2021,12,13]],"date-time":"2021-12-13T00:00:00Z","timestamp":1639353600000},"content-version":"stm-asf","delay-in-days":0,"URL":"https:\/\/doi.org\/10.15223\/policy-037"}],"funder":[{"DOI":"10.13039\/501100003141","name":"CONACYT","doi-asserted-by":"publisher","award":["661687"],"award-info":[{"award-number":["661687"]}],"id":[{"id":"10.13039\/501100003141","id-type":"DOI","asserted-by":"publisher"}]},{"DOI":"10.13039\/501100000858","name":"University of Sheffield","doi-asserted-by":"publisher","id":[{"id":"10.13039\/501100000858","id-type":"DOI","asserted-by":"publisher"}]}],"content-domain":{"domain":[],"crossmark-restriction":false},"short-container-title":[],"published-print":{"date-parts":[[2021,12,13]]},"DOI":"10.1109\/asru51503.2021.9687993","type":"proceedings-article","created":{"date-parts":[[2022,2,3]],"date-time":"2022-02-03T20:31:00Z","timestamp":1643920260000},"page":"725-732","source":"Crossref","is-referenced-by-count":1,"title":["Attention Based Model for Segmental Pronunciation Error Detection"],"prefix":"10.1109","author":[{"given":"Jose Antonio Lopez","family":"Saenz","sequence":"first","affiliation":[{"name":"University of Sheffield,Speech and Hearing Research,Department of Computer Science,UK"}],"role":[{"role":"author","vocabulary":"crossref"}]},{"given":"Md Asif","family":"Jalal","sequence":"additional","affiliation":[{"name":"University of Sheffield,Speech and Hearing Research,Department of Computer 
Science,UK"}],"role":[{"role":"author","vocabulary":"crossref"}]},{"given":"Rosanna","family":"Milner","sequence":"additional","affiliation":[{"name":"University of Sheffield,Speech and Hearing Research,Department of Computer Science,UK"}],"role":[{"role":"author","vocabulary":"crossref"}]},{"given":"Thomas","family":"Hain","sequence":"additional","affiliation":[{"name":"University of Sheffield,Speech and Hearing Research,Department of Computer Science,UK"}],"role":[{"role":"author","vocabulary":"crossref"}]}],"member":"263","reference":[{"key":"ref10","doi-asserted-by":"publisher","DOI":"10.21437\/Interspeech.2020-2953"},{"key":"ref11","first-page":"598","article-title":"Lattice-based GOP in automatic pronunciation evaluation","volume":"3","author":"song","year":"0","journal-title":"2010 the 2nd International Conference on Computer and Automation Engineering ICCAE 2010"},{"key":"ref12","doi-asserted-by":"publisher","DOI":"10.1109\/ICCSN.2017.8230273"},{"key":"ref13","doi-asserted-by":"publisher","DOI":"10.1121\/1.5017834"},{"key":"ref14","first-page":"3062","article-title":"Recognize Mis-pronunciations to Improve Non-Native Acoustic Modeling Through a Phone Decoder Built from One Edit Distance Finite State Automaton","author":"chu","year":"0","journal-title":"Proc Interspeech 2020"},{"key":"ref15","doi-asserted-by":"publisher","DOI":"10.21437\/Interspeech.2016-513"},{"key":"ref16","doi-asserted-by":"publisher","DOI":"10.1109\/ICASSP.2018.8462562"},{"key":"ref17","doi-asserted-by":"publisher","DOI":"10.3390\/s20071809"},{"key":"ref18","first-page":"6234","article-title":"END-TO-END NEURAL NETWORK BASED AUTOMATED SPEECH SCORING Midea America Corporation, 250 W Tasman Dr, San Jose, CA 95134, USA Robert Bosch Corporation, 4005 Miranda Ave, Palo Alto, CA 94304, USA Educational Testing Service (ETS), 90 New Montgomer","author":"chen","year":"0","journal-title":"2018 IEEE 
International Conference on Acoustics Speech and Signal Processing (ICASSP)"},{"key":"ref19","first-page":"arxiv-2104","article-title":"A full text-dependent end to end mispronunciation detection and diagnosis with easy data augmentation techniques","author":"fu","year":"2021","journal-title":"ArXiv e-prints"},{"key":"ref28","doi-asserted-by":"publisher","DOI":"10.1109\/ICASSP.2015.7178993"},{"key":"ref4","doi-asserted-by":"publisher","DOI":"10.1016\/j.csl.2017.12.006"},{"key":"ref27","first-page":"5999","article-title":"Attention is all you need","volume":"2017 december","author":"vaswani","year":"2017","journal-title":"Advances in neural information processing systems"},{"key":"ref3","first-page":"259","article-title":"Second language pronunciation assessment: A look at the present and the future","author":"trofimovich","year":"2016","journal-title":"Second Language Pronunciation Assessment Interdisciplinary Perspectives"},{"key":"ref6","doi-asserted-by":"publisher","DOI":"10.1109\/PIC.2017.8359585"},{"key":"ref29","doi-asserted-by":"publisher","DOI":"10.1109\/ICASSP.1995.479278"},{"key":"ref5","doi-asserted-by":"publisher","DOI":"10.1016\/S0167-6393(99)00044-8"},{"key":"ref8","doi-asserted-by":"publisher","DOI":"10.21437\/SLaTE.2019-6"},{"key":"ref7","doi-asserted-by":"publisher","DOI":"10.21437\/Interspeech.2019-2363"},{"key":"ref2","doi-asserted-by":"publisher","DOI":"10.3758\/s13423-013-0519-8"},{"key":"ref9","doi-asserted-by":"publisher","DOI":"10.21437\/SLaTE.2019-13"},{"key":"ref1","doi-asserted-by":"publisher","DOI":"10.21437\/Interspeech.2019-2711"},{"key":"ref20","doi-asserted-by":"publisher","DOI":"10.21437\/Interspeech.2020-2623"},{"key":"ref22","doi-asserted-by":"publisher","DOI":"10.1109\/ICASSP.2017.7952599"},{"journal-title":"Long short-term memory recurrent neural network architectures for large scale acoustic 
modeling","year":"2014","author":"sak","key":"ref21"},{"key":"ref24","doi-asserted-by":"publisher","DOI":"10.1109\/ASRU46091.2019.9003838"},{"key":"ref23","first-page":"1","article-title":"Neural machine translation by jointly learning to align and translate","author":"bahdanau","year":"0","journal-title":"3rd International Conference on Learning Representations ICLR 2015 - Conference Track Proceedings"},{"key":"ref26","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR.2016.90"},{"key":"ref25","article-title":"Layer normalization","author":"ba","year":"2016","journal-title":"ArXiv Preprint"}],"event":{"name":"2021 IEEE Automatic Speech Recognition and Understanding Workshop (ASRU)","start":{"date-parts":[[2021,12,13]]},"location":"Cartagena, Colombia","end":{"date-parts":[[2021,12,17]]}},"container-title":["2021 IEEE Automatic Speech Recognition and Understanding Workshop (ASRU)"],"original-title":[],"link":[{"URL":"http:\/\/xplorestaging.ieee.org\/ielx7\/9687821\/9687855\/09687993.pdf?arnumber=9687993","content-type":"unspecified","content-version":"vor","intended-application":"similarity-checking"}],"deposited":{"date-parts":[[2022,5,16]],"date-time":"2022-05-16T20:42:18Z","timestamp":1652733738000},"score":1,"resource":{"primary":{"URL":"https:\/\/ieeexplore.ieee.org\/document\/9687993\/"}},"subtitle":[],"short-title":[],"issued":{"date-parts":[[2021,12,13]]},"references-count":29,"URL":"https:\/\/doi.org\/10.1109\/asru51503.2021.9687993","relation":{},"subject":[],"published":{"date-parts":[[2021,12,13]]}}}