{"status":"ok","message-type":"work","message-version":"1.0.0","message":{"indexed":{"date-parts":[[2025,10,8]],"date-time":"2025-10-08T22:23:22Z","timestamp":1759962202186,"version":"3.40.3"},"publisher-location":"Cham","reference-count":17,"publisher":"Springer International Publishing","isbn-type":[{"type":"print","value":"9783030602758"},{"type":"electronic","value":"9783030602765"}],"license":[{"start":{"date-parts":[[2020,1,1]],"date-time":"2020-01-01T00:00:00Z","timestamp":1577836800000},"content-version":"tdm","delay-in-days":0,"URL":"http:\/\/www.springer.com\/tdm"},{"start":{"date-parts":[[2020,1,1]],"date-time":"2020-01-01T00:00:00Z","timestamp":1577836800000},"content-version":"vor","delay-in-days":0,"URL":"http:\/\/www.springer.com\/tdm"}],"content-domain":{"domain":["link.springer.com"],"crossmark-restriction":false},"short-container-title":[],"published-print":{"date-parts":[[2020]]},"DOI":"10.1007\/978-3-030-60276-5_50","type":"book-chapter","created":{"date-parts":[[2020,10,4]],"date-time":"2020-10-04T07:02:44Z","timestamp":1601794964000},"page":"520-529","update-policy":"https:\/\/doi.org\/10.1007\/springer_crossmark_policy","source":"Crossref","is-referenced-by-count":5,"title":["Recognition Performance of Selected Speech Recognition APIs \u2013 A Longitudinal Study"],"prefix":"10.1007","author":[{"given":"Ingo","family":"Siegert","sequence":"first","affiliation":[]},{"given":"Yamini","family":"Sinha","sequence":"additional","affiliation":[]},{"given":"Oliver","family":"Jokisch","sequence":"additional","affiliation":[]},{"given":"Andreas","family":"Wendemuth","sequence":"additional","affiliation":[]}],"member":"297","published-online":{"date-parts":[[2020,9,29]]},"reference":[{"doi-asserted-by":"crossref","unstructured":"Chiu, C., et al.: State-of-the-art speech recognition with sequence-to-sequence models. In: Proceedings IEEE ICASSP-2018, Calgary, Kanada, April 2018, pp. 4774\u20134778 (2018)","key":"50_CR1","DOI":"10.1109\/ICASSP.2018.8462105"},{"doi-asserted-by":"publisher","unstructured":"Egorow, O., Lotz, A., Siegert, I., B\u00f6ck, R., Kr\u00fcger, J., Wendemuth, A.: Accelerating manual annotation of filled pauses by automatic pre-selection. In: 2017 International Conference on Companion Technology (ICCT), September 2017, pp. 1\u20136 (2017). \nhttps:\/\/doi.org\/10.1109\/COMPANION.2017.8287079","key":"50_CR2","DOI":"10.1109\/COMPANION.2017.8287079"},{"doi-asserted-by":"crossref","unstructured":"Godfrey, J.J., Holliman, E.C., McDaniel, J.: SWITCHBOARD: telephone speech corpus for research and development. In: Proceedings of the IEEE ICASSP-1992, San Francisco, CA, USA, March 1992, vol. 1, pp. 517\u2013520 (1992)","key":"50_CR3","DOI":"10.1109\/ICASSP.1992.225858"},{"key":"50_CR4","doi-asserted-by":"publisher","first-page":"17","DOI":"10.12948\/issn14531305\/23.1.2019.02","volume":"23","author":"B Iancu","year":"2019","unstructured":"Iancu, B.: Evaluating Google speech-to-text API\u2019s performance for Romanian e-Learning resources. Informatica Economica 23, 17\u201325 (2019). \nhttps:\/\/doi.org\/10.12948\/issn14531305\/23.1.2019.02","journal-title":"Informatica Economica"},{"unstructured":"Kim, J.Y., et al.: A comparison of online automatic speech recognition systems and the nonverbal responses to unintelligible speech. CoRR abs\/1904.12403 (2019). \nhttp:\/\/arxiv.org\/abs\/1904.12403","key":"50_CR5"},{"key":"50_CR6","series-title":"Smart Innovation, Systems and Technologies","doi-asserted-by":"publisher","first-page":"109","DOI":"10.1007\/978-3-030-03748-2_13","volume-title":"Recent Advances in Intelligent Information Hiding and Multimedia Signal Processing","author":"T Kimura","year":"2019","unstructured":"Kimura, T., Nose, T., Hirooka, S., Chiba, Y., Ito, A.: Comparison of speech recognition performance between Kaldi and Google cloud speech API. In: Pan, J.-S., Ito, A., Tsai, P.-W., Jain, L.C. (eds.) IIH-MSP 2018. SIST, vol. 110, pp. 109\u2013115. Springer, Cham (2019). \nhttps:\/\/doi.org\/10.1007\/978-3-030-03748-2_13"},{"doi-asserted-by":"publisher","unstructured":"Kurata, G., Ramabhadran, B., Saon, G., Sethy, A.: Language modeling with highway LSTM. In: Proceedings of the IEEE ASRU, Okinana, Japan, pp. 244\u2013251 (2017). \nhttps:\/\/doi.org\/10.1109\/ASRU.2017.8268942","key":"50_CR7","DOI":"10.1109\/ASRU.2017.8268942"},{"doi-asserted-by":"publisher","unstructured":"K\u00ebpuska, V., Bohouta, G.: Comparing speech recognition systems (Microsoft API, Google API and CMU Sphinx). Int. J. Eng. Res. Appl. 20\u201324 (2017). \nhttps:\/\/doi.org\/10.9790\/9622-0703022024","key":"50_CR8","DOI":"10.9790\/9622-0703022024"},{"doi-asserted-by":"publisher","unstructured":"Och, F.J.: Minimum error rate training in statistical machine translation. In: Proceedings of the 41st Annual Meeting on Association for Computational Linguistics, pp. 160\u2013167. Association for Computational Linguistics, USA (2003). \nhttps:\/\/doi.org\/10.3115\/1075096.1075117","key":"50_CR9","DOI":"10.3115\/1075096.1075117"},{"unstructured":"Petrock, V.: US Voice Assistant Users 2019 - Who, What, Where and Why. eMarketer (2019). Accessed 15 July 2019","key":"50_CR10"},{"unstructured":"Roberts, M.: OK Google, Siri, Alexa, Cortana; can you tell me some stats on voice search? The edit blog (2018). Accessed 8 Jan 2018","key":"50_CR11"},{"doi-asserted-by":"publisher","unstructured":"Saon, G., et al.: English conversational telephone speech recognition by humans and machines. In: Proceedings of the INTERSPEECH-2017, Stockholm, Sweden, pp. 132\u2013136 (2017). \nhttps:\/\/doi.org\/10.21437\/Interspeech.2017-405","key":"50_CR12","DOI":"10.21437\/Interspeech.2017-405"},{"key":"50_CR13","first-page":"1693","volume":"6","author":"PA Sawakare","year":"2015","unstructured":"Sawakare, P.A., Deshmukh, R.R., Shrishrimal, P.P.: Speech recognition techniques: a review. Int. J. Sci. Eng. Res. 6, 1693\u20131698 (2015)","journal-title":"Int. J. Sci. Eng. Res."},{"unstructured":"Siegert, I.: \u201cAlexa in the wild\u201d - collecting unconstrained conversations with a modern voice assistant in a public environment. In: Proceedings of the 12th LREC, pp. 608\u2013612. ELRA, Marseille, France (2020). \nhttps:\/\/www.aclweb.org\/anthology\/2020.lrec-1.77","key":"50_CR14"},{"unstructured":"Siegert, I., Kr\u00fcger, J., Egorow, O., Nietzold, J., Heinemann, R., Lotz, A.: Voice Assistant Conversation Corpus (VACC): a multi-scenario dataset for addressee detection in human-computer-interaction using Amazon\u2019s ALEXA. In: Proceedings of the 11th LREC. ELRA, Paris, France (2018)","key":"50_CR15"},{"doi-asserted-by":"crossref","unstructured":"Xiong, W., Wu, L., Droppo, J., Huang, X., Stolcke, A.: The Microsoft 2017 conversational speech recognition system. In: Proceedings of the IEEE ICASSP-2018, Calgary, Kanada, April 2018, pp. 5934\u20135938 (2018)","key":"50_CR16","DOI":"10.1109\/ICASSP.2018.8461870"},{"doi-asserted-by":"crossref","unstructured":"Yurtcan, Y.: Performance evaluation of real-time noisy speech recognition for mobile devices. Master\u2019s thesis. Middle East Technical University, Turkey (2019)","key":"50_CR17","DOI":"10.1109\/SIU.2018.8404709"}],"container-title":["Lecture Notes in Computer Science","Speech and Computer"],"original-title":[],"language":"en","link":[{"URL":"http:\/\/link.springer.com\/content\/pdf\/10.1007\/978-3-030-60276-5_50","content-type":"unspecified","content-version":"vor","intended-application":"similarity-checking"}],"deposited":{"date-parts":[[2020,10,4]],"date-time":"2020-10-04T07:13:31Z","timestamp":1601795611000},"score":1,"resource":{"primary":{"URL":"http:\/\/link.springer.com\/10.1007\/978-3-030-60276-5_50"}},"subtitle":[],"short-title":[],"issued":{"date-parts":[[2020]]},"ISBN":["9783030602758","9783030602765"],"references-count":17,"URL":"https:\/\/doi.org\/10.1007\/978-3-030-60276-5_50","relation":{},"ISSN":["0302-9743","1611-3349"],"issn-type":[{"type":"print","value":"0302-9743"},{"type":"electronic","value":"1611-3349"}],"subject":[],"published":{"date-parts":[[2020]]},"assertion":[{"value":"29 September 2020","order":1,"name":"first_online","label":"First Online","group":{"name":"ChapterHistory","label":"Chapter History"}},{"value":"SPECOM","order":1,"name":"conference_acronym","label":"Conference Acronym","group":{"name":"ConferenceInfo","label":"Conference Information"}},{"value":"International Conference on Speech and Computer","order":2,"name":"conference_name","label":"Conference Name","group":{"name":"ConferenceInfo","label":"Conference Information"}},{"value":"St. Petersburg","order":3,"name":"conference_city","label":"Conference City","group":{"name":"ConferenceInfo","label":"Conference Information"}},{"value":"Russia","order":4,"name":"conference_country","label":"Conference Country","group":{"name":"ConferenceInfo","label":"Conference Information"}},{"value":"2020","order":5,"name":"conference_year","label":"Conference Year","group":{"name":"ConferenceInfo","label":"Conference Information"}},{"value":"7 October 2020","order":7,"name":"conference_start_date","label":"Conference Start Date","group":{"name":"ConferenceInfo","label":"Conference Information"}},{"value":"9 October 2020","order":8,"name":"conference_end_date","label":"Conference End Date","group":{"name":"ConferenceInfo","label":"Conference Information"}},{"value":"22","order":9,"name":"conference_number","label":"Conference Number","group":{"name":"ConferenceInfo","label":"Conference Information"}},{"value":"specom2020","order":10,"name":"conference_id","label":"Conference ID","group":{"name":"ConferenceInfo","label":"Conference Information"}},{"value":"http:\/\/specom.nw.ru\/2020\/","order":11,"name":"conference_url","label":"Conference URL","group":{"name":"ConferenceInfo","label":"Conference Information"}},{"value":"Single-blind","order":1,"name":"type","label":"Type","group":{"name":"ConfEventPeerReviewInformation","label":"Peer Review Information (provided by the conference organizers)"}},{"value":"easychair","order":2,"name":"conference_management_system","label":"Conference Management System","group":{"name":"ConfEventPeerReviewInformation","label":"Peer Review Information (provided by the conference organizers)"}},{"value":"160","order":3,"name":"number_of_submissions_sent_for_review","label":"Number of Submissions Sent for Review","group":{"name":"ConfEventPeerReviewInformation","label":"Peer Review Information (provided by the conference organizers)"}},{"value":"65","order":4,"name":"number_of_full_papers_accepted","label":"Number of Full Papers Accepted","group":{"name":"ConfEventPeerReviewInformation","label":"Peer Review Information (provided by the conference organizers)"}},{"value":"0","order":5,"name":"number_of_short_papers_accepted","label":"Number of Short Papers Accepted","group":{"name":"ConfEventPeerReviewInformation","label":"Peer Review Information (provided by the conference organizers)"}},{"value":"41% - The value is computed by the equation \"Number of Full Papers Accepted \/ Number of Submissions Sent for Review * 100\" and then rounded to a whole number.","order":6,"name":"acceptance_rate_of_full_papers","label":"Acceptance Rate of Full Papers","group":{"name":"ConfEventPeerReviewInformation","label":"Peer Review Information (provided by the conference organizers)"}},{"value":"3","order":7,"name":"average_number_of_reviews_per_paper","label":"Average Number of Reviews per Paper","group":{"name":"ConfEventPeerReviewInformation","label":"Peer Review Information (provided by the conference organizers)"}},{"value":"5","order":8,"name":"average_number_of_papers_per_reviewer","label":"Average Number of Papers per Reviewer","group":{"name":"ConfEventPeerReviewInformation","label":"Peer Review Information (provided by the conference organizers)"}},{"value":"Yes","order":9,"name":"external_reviewers_involved","label":"External Reviewers Involved","group":{"name":"ConfEventPeerReviewInformation","label":"Peer Review Information (provided by the conference organizers)"}},{"value":"Due to the Corona pandemic SPECOM 2020 was held as a virtual event","order":10,"name":"additional_info_on_review_process","label":"Additional Info on Review Process","group":{"name":"ConfEventPeerReviewInformation","label":"Peer Review Information (provided by the conference organizers)"}}]}}