{"status":"ok","message-type":"work","message-version":"1.0.0","message":{"indexed":{"date-parts":[[2026,3,30]],"date-time":"2026-03-30T19:24:58Z","timestamp":1774898698363,"version":"3.50.1"},"reference-count":20,"publisher":"IEEE","license":[{"start":{"date-parts":[[2020,5,1]],"date-time":"2020-05-01T00:00:00Z","timestamp":1588291200000},"content-version":"vor","delay-in-days":0,"URL":"https:\/\/ieeexplore.ieee.org\/Xplorehelp\/downloads\/license-information\/IEEE.html"},{"start":{"date-parts":[[2020,5,1]],"date-time":"2020-05-01T00:00:00Z","timestamp":1588291200000},"content-version":"stm-asf","delay-in-days":0,"URL":"https:\/\/doi.org\/10.15223\/policy-029"},{"start":{"date-parts":[[2020,5,1]],"date-time":"2020-05-01T00:00:00Z","timestamp":1588291200000},"content-version":"stm-asf","delay-in-days":0,"URL":"https:\/\/doi.org\/10.15223\/policy-037"}],"content-domain":{"domain":[],"crossmark-restriction":false},"short-container-title":[],"published-print":{"date-parts":[[2020,5]]},"DOI":"10.1109\/icassp40776.2020.9052975","type":"proceedings-article","created":{"date-parts":[[2020,4,9]],"date-time":"2020-04-09T16:21:13Z","timestamp":1586449273000},"page":"3492-3496","source":"Crossref","is-referenced-by-count":37,"title":["SED-MDD: Towards Sentence Dependent End-To-End Mispronunciation Detection and Diagnosis"],"prefix":"10.1109","author":[{"given":"Yiqing","family":"Feng","sequence":"first","affiliation":[]},{"given":"Guanyu","family":"Fu","sequence":"additional","affiliation":[]},{"given":"Qingcai","family":"Chen","sequence":"additional","affiliation":[]},{"given":"Kai","family":"Chen","sequence":"additional","affiliation":[]}],"member":"263","reference":[{"key":"ref10","article-title":"Darpa timit acoustic-phonetic continous speech corpus cd-rom. nist speech disc 1-1.1","volume":"93","author":"garofolo","year":"1993","journal-title":"NASA STI\/Recon Technical Report N"},{"key":"ref11","doi-asserted-by":"publisher","DOI":"10.21437\/Interspeech.2018-1110"},{"key":"ref12","doi-asserted-by":"publisher","DOI":"10.1016\/0022-2836(70)90057-4"},{"key":"ref13","first-page":"1097","article-title":"Imagenet classification with deep convolutional neural networks","author":"krizhevsky","year":"2012","journal-title":"Advances in neural information processing systems"},{"key":"ref14","first-page":"448","article-title":"Batch normalization: Accelerating deep network training by reducing internal covariate shift","author":"ioffe","year":"2015","journal-title":"International Conference on Machine Learning"},{"key":"ref15","author":"chung","year":"2014","journal-title":"arXiv preprint arXiv 1412 3555"},{"key":"ref16","article-title":"Tacotron: Towards end-to-end speech synthesis","author":"wang","year":"2017","journal-title":"arXiv preprint arXiv 1703 10593"},{"key":"ref17","first-page":"2773","article-title":"Grammar as a foreign language","author":"vinyals","year":"2015","journal-title":"Advances in neural information processing systems"},{"key":"ref18","doi-asserted-by":"publisher","DOI":"10.1109\/29.46546"},{"key":"ref19","doi-asserted-by":"publisher","DOI":"10.1109\/ICASSP.2018.8462635"},{"key":"ref4","article-title":"Discriminative acoustic model for improving mispronunciation detection and diagnosis in computer-aided pronunciation training (capt)","author":"qian","year":"2010","journal-title":"Eleventh Annual Conference of the International Speech Communication Association"},{"key":"ref3","article-title":"Implementation of an extended recognition network for mispronunciation detection and diagnosis in computer-assisted pronunciation training","author":"harrison","year":"2009","journal-title":"International Workshop on Speech and Language Technology in Education"},{"key":"ref6","doi-asserted-by":"publisher","DOI":"10.1109\/ICME.2018.8486462"},{"key":"ref5","doi-asserted-by":"publisher","DOI":"10.1109\/ICASSP.2018.8461841"},{"key":"ref8","doi-asserted-by":"publisher","DOI":"10.1109\/ICASSP.2019.8682654"},{"key":"ref7","doi-asserted-by":"publisher","DOI":"10.1109\/ICASSP.2018.8462562"},{"key":"ref2","article-title":"Automatic derivation of phonological rules for mispronunciation detection in a computer-assisted pronunciation training system effects with phonological rules","author":"lo","year":"2010","journal-title":"Eleventh Annual Conference of the International Speech Communication Association"},{"key":"ref1","doi-asserted-by":"publisher","DOI":"10.1109\/TASLP.2016.2621675"},{"key":"ref9","doi-asserted-by":"publisher","DOI":"10.1109\/ASRU.2007.4430152"},{"key":"ref20","first-page":"2554","article-title":"Unsupervised discovery of nonnative phonetic patterns in l2 english speech for mispronunciation detection and diagnosis","author":"li","year":"2018","journal-title":"Proceedings of the Annual Conference of the International Speech Communication Association INTERSPEECH"}],"event":{"name":"ICASSP 2020 - 2020 IEEE International Conference on Acoustics, Speech and Signal Processing (ICASSP)","location":"Barcelona, Spain","start":{"date-parts":[[2020,5,4]]},"end":{"date-parts":[[2020,5,8]]}},"container-title":["ICASSP 2020 - 2020 IEEE International Conference on Acoustics, Speech and Signal Processing (ICASSP)"],"original-title":[],"link":[{"URL":"http:\/\/xplorestaging.ieee.org\/ielx7\/9040208\/9052899\/09052975.pdf?arnumber=9052975","content-type":"unspecified","content-version":"vor","intended-application":"similarity-checking"}],"deposited":{"date-parts":[[2022,6,27]],"date-time":"2022-06-27T20:18:54Z","timestamp":1656361134000},"score":1,"resource":{"primary":{"URL":"https:\/\/ieeexplore.ieee.org\/document\/9052975\/"}},"subtitle":[],"short-title":[],"issued":{"date-parts":[[2020,5]]},"references-count":20,"URL":"https:\/\/doi.org\/10.1109\/icassp40776.2020.9052975","relation":{},"subject":[],"published":{"date-parts":[[2020,5]]}}}