{"status":"ok","message-type":"work","message-version":"1.0.0","message":{"indexed":{"date-parts":[[2026,4,4]],"date-time":"2026-04-04T19:05:45Z","timestamp":1775329545855,"version":"3.50.1"},"publisher-location":"Singapore","reference-count":16,"publisher":"Springer Nature Singapore","isbn-type":[{"value":"9789819604333","type":"print"},{"value":"9789819604340","type":"electronic"}],"license":[{"start":{"date-parts":[[2024,1,1]],"date-time":"2024-01-01T00:00:00Z","timestamp":1704067200000},"content-version":"tdm","delay-in-days":0,"URL":"https:\/\/www.springernature.com\/gp\/researchers\/text-and-data-mining"},{"start":{"date-parts":[[2024,1,1]],"date-time":"2024-01-01T00:00:00Z","timestamp":1704067200000},"content-version":"vor","delay-in-days":0,"URL":"https:\/\/www.springernature.com\/gp\/researchers\/text-and-data-mining"}],"content-domain":{"domain":["link.springer.com"],"crossmark-restriction":false},"short-container-title":[],"published-print":{"date-parts":[[2024]]},"DOI":"10.1007\/978-981-96-0434-0_23","type":"book-chapter","created":{"date-parts":[[2024,11,26]],"date-time":"2024-11-26T06:50:04Z","timestamp":1732603804000},"page":"325-332","update-policy":"https:\/\/doi.org\/10.1007\/springer_crossmark_policy","source":"Crossref","is-referenced-by-count":4,"title":["A Pronunciation Practice System Based on\u00a0Pre-trained Deep Learning Models"],"prefix":"10.1007","author":[{"ORCID":"https:\/\/orcid.org\/0000-0002-6801-1123","authenticated-orcid":false,"given":"Trang","family":"Phung","sequence":"first","affiliation":[],"role":[{"role":"author","vocabulary":"crossref"}]},{"ORCID":"https:\/\/orcid.org\/0009-0000-8317-2454","authenticated-orcid":false,"given":"Viet Dung","family":"Vu","sequence":"additional","affiliation":[],"role":[{"role":"author","vocabulary":"crossref"}]},{"ORCID":"https:\/\/orcid.org\/0000-0003-4429-2343","authenticated-orcid":false,"given":"Tan-Ha","family":"Mai","sequence":"additional","affiliation":[],"role":[{"role":"author","vocabulary":"crossref"}]}],"member":"297","published-online":{"date-parts":[[2024,11,24]]},"reference":[{"key":"23_CR1","series-title":"CCIS","doi-asserted-by":"publisher","first-page":"75","DOI":"10.1007\/978-981-97-1711-8_6","volume-title":"TAAI 2023","author":"WC Cheng","year":"2024","unstructured":"Cheng, W.C., Mai, T.H., Lin, H.T.: From SMOTE to mixup for deep imbalanced classification. In: Lee, C.Y., Lin, C.L., Chang, H.T. (eds.) TAAI 2023. CCIS, vol. 2074, pp. 75\u201396. Springer, Singapore (2024). https:\/\/doi.org\/10.1007\/978-981-97-1711-8_6"},{"issue":"1","key":"23_CR2","first-page":"6884637","volume":"2022","author":"Z Cheng","year":"2022","unstructured":"Cheng, Z., Wang, Z.: Automatic scoring of spoken language based on basic deep learning. Sci. Program. 2022(1), 6884637 (2022)","journal-title":"Sci. Program."},{"key":"23_CR3","unstructured":"Devlin, J.: BERT: pre-training of deep bidirectional transformers for language understanding. arXiv preprint arXiv:1810.04805 (2018)"},{"issue":"10","key":"23_CR4","doi-asserted-by":"publisher","first-page":"832","DOI":"10.1016\/j.specom.2009.04.005","volume":"51","author":"M Eskenazi","year":"2009","unstructured":"Eskenazi, M.: An overview of spoken language technology for education. Speech Commun. 51(10), 832\u2013844 (2009)","journal-title":"Speech Commun."},{"key":"23_CR5","doi-asserted-by":"crossref","unstructured":"Gulati, A., et\u00a0al.: Conformer: convolution-augmented transformer for speech recognition. arXiv preprint arXiv:2005.08100 (2020)","DOI":"10.21437\/Interspeech.2020-3015"},{"key":"23_CR6","doi-asserted-by":"crossref","unstructured":"Jiao, X., et al.: TinyBERT: distilling BERT for natural language understanding. arXiv preprint arXiv:1909.10351 (2019)","DOI":"10.18653\/v1\/2020.findings-emnlp.372"},{"key":"23_CR7","doi-asserted-by":"crossref","unstructured":"Nga, C.H., et\u00a0al.: Cyclic transfer learning for Mandarin-English code-switching speech recognition. IEEE Signal Process. Lett. (2023)","DOI":"10.1109\/LSP.2023.3307350"},{"key":"23_CR8","series-title":"LNDECT","doi-asserted-by":"publisher","first-page":"395","DOI":"10.1007\/978-3-030-97610-1_31","volume-title":"ICABDE 2021","author":"T Phung","year":"2022","unstructured":"Phung, T., Nguyen, V.T., Ma, T.H.T., Duc, Q.V.: A (2+1)D attention convolutional neural network for video prediction. In: Dang, N.H.T., Zhang, Y.D., Tavares, J.M.R.S., Chen, B.H. (eds.) ICABDE 2021. LNDECT, vol. 124, pp. 395\u2013406. Springer, Cham (2022). https:\/\/doi.org\/10.1007\/978-3-030-97610-1_31"},{"key":"23_CR9","series-title":"CCIS","doi-asserted-by":"publisher","first-page":"682","DOI":"10.1007\/978-981-19-8069-5_48","volume-title":"FDSE 2022","author":"T Phung","year":"2022","unstructured":"Phung, T., Vu, D.Q., Mai-Tan, H., Nhung, L.T.: Deep models for mispronounce prediction for Vietnamese learners of English. In: Dang, T.K., K\u00fcng, J., Chung, T.M. (eds.) FDSE 2022. CCIS, vol. 1688, pp. 682\u2013689. Springer, Singapore (2022). https:\/\/doi.org\/10.1007\/978-981-19-8069-5_48"},{"key":"23_CR10","doi-asserted-by":"crossref","unstructured":"Tan, H.M., Vu, D.Q., Wang, J.C.: Selinet: a lightweight model for single channel speech separation. In: 2023 IEEE International Conference on Acoustics, Speech and Signal Processing (ICASSP), ICASSP 2023, pp.\u00a01\u20135. IEEE (2023)","DOI":"10.1109\/ICASSP49357.2023.10097121"},{"key":"23_CR11","series-title":"LNNS","doi-asserted-by":"publisher","first-page":"327","DOI":"10.1007\/978-3-031-50818-9_36","volume-title":"ICTA 2023","author":"HM Tan","year":"2024","unstructured":"Tan, H.M., Vu, D.Q., Thi, D.N., Thu, T.P.T.: Voice separation using multi learning on squash-norm embedding matrix and mask. In: Nghia, P.T., Thai, V.D., Thuy, N.T., Son, L.H., Huynh, V.N. (eds.) ICTA 2023. LNNS, vol. 848, pp. 327\u2013333. Springer, Cham (2024). https:\/\/doi.org\/10.1007\/978-3-031-50818-9_36"},{"key":"23_CR12","unstructured":"Vu, D.Q., Le, N.T., Wang, J.C.: Self-supervised learning via multi-transformation classification for action recognition. arXiv preprint arXiv:2102.10378 (2021)"},{"key":"23_CR13","doi-asserted-by":"crossref","unstructured":"Vu, D.Q., Phung, T.T., Wang, J.C., Mai, S.T.: LCSL: long-tailed classification via self-labeling. IEEE TCSVT (2024)","DOI":"10.1109\/TCSVT.2024.3421942"},{"issue":"8","key":"23_CR14","doi-asserted-by":"publisher","first-page":"3933","DOI":"10.1007\/s11760-023-02623-x","volume":"17","author":"DQ Vu","year":"2023","unstructured":"Vu, D.Q., Thu, T.P.T.: Simultaneous context and motion learning in video prediction. SIViP 17(8), 3933\u20133942 (2023)","journal-title":"SIViP"},{"key":"23_CR15","doi-asserted-by":"crossref","unstructured":"Vu, D.Q., Thu, T.P.T., Le, N., Wang, J.C., et\u00a0al.: Deep learning for human action recognition: a comprehensive review. APSIPA Trans. Signal Inf. Process. 12(2)","DOI":"10.1561\/116.00000068"},{"issue":"1","key":"23_CR16","first-page":"7186375","volume":"2022","author":"Y Xu","year":"2022","unstructured":"Xu, Y.: English speech recognition and evaluation of pronunciation quality using deep learning. Mob. Inf. Syst. 2022(1), 7186375 (2022)","journal-title":"Mob. Inf. Syst."}],"container-title":["Communications in Computer and Information Science","Future Data and Security Engineering. Big Data, Security and Privacy, Smart City and Industry 4.0 Applications"],"original-title":[],"language":"en","link":[{"URL":"https:\/\/link.springer.com\/content\/pdf\/10.1007\/978-981-96-0434-0_23","content-type":"unspecified","content-version":"vor","intended-application":"similarity-checking"}],"deposited":{"date-parts":[[2024,11,26]],"date-time":"2024-11-26T08:15:00Z","timestamp":1732608900000},"score":1,"resource":{"primary":{"URL":"https:\/\/link.springer.com\/10.1007\/978-981-96-0434-0_23"}},"subtitle":[],"short-title":[],"issued":{"date-parts":[[2024]]},"ISBN":["9789819604333","9789819604340"],"references-count":16,"URL":"https:\/\/doi.org\/10.1007\/978-981-96-0434-0_23","relation":{},"ISSN":["1865-0929","1865-0937"],"issn-type":[{"value":"1865-0929","type":"print"},{"value":"1865-0937","type":"electronic"}],"subject":[],"published":{"date-parts":[[2024]]},"assertion":[{"value":"24 November 2024","order":1,"name":"first_online","label":"First Online","group":{"name":"ChapterHistory","label":"Chapter History"}},{"value":"FDSE","order":1,"name":"conference_acronym","label":"Conference Acronym","group":{"name":"ConferenceInfo","label":"Conference Information"}},{"value":"International Conference on Future Data and Security Engineering","order":2,"name":"conference_name","label":"Conference Name","group":{"name":"ConferenceInfo","label":"Conference Information"}},{"value":"Binh Duong","order":3,"name":"conference_city","label":"Conference City","group":{"name":"ConferenceInfo","label":"Conference Information"}},{"value":"Vietnam","order":4,"name":"conference_country","label":"Conference Country","group":{"name":"ConferenceInfo","label":"Conference Information"}},{"value":"2024","order":5,"name":"conference_year","label":"Conference Year","group":{"name":"ConferenceInfo","label":"Conference Information"}},{"value":"27 November 2024","order":7,"name":"conference_start_date","label":"Conference Start Date","group":{"name":"ConferenceInfo","label":"Conference Information"}},{"value":"29 November 2024","order":8,"name":"conference_end_date","label":"Conference End Date","group":{"name":"ConferenceInfo","label":"Conference Information"}},{"value":"11","order":9,"name":"conference_number","label":"Conference Number","group":{"name":"ConferenceInfo","label":"Conference Information"}},{"value":"fdse2024","order":10,"name":"conference_id","label":"Conference ID","group":{"name":"ConferenceInfo","label":"Conference Information"}},{"value":"https:\/\/thefdse.org\/","order":11,"name":"conference_url","label":"Conference URL","group":{"name":"ConferenceInfo","label":"Conference Information"}}]}}