{"status":"ok","message-type":"work","message-version":"1.0.0","message":{"indexed":{"date-parts":[[2026,4,3]],"date-time":"2026-04-03T15:26:55Z","timestamp":1775230015842,"version":"3.50.1"},"reference-count":20,"publisher":"IEEE","license":[{"start":{"date-parts":[[2023,12,16]],"date-time":"2023-12-16T00:00:00Z","timestamp":1702684800000},"content-version":"stm-asf","delay-in-days":0,"URL":"https:\/\/doi.org\/10.15223\/policy-029"},{"start":{"date-parts":[[2023,12,16]],"date-time":"2023-12-16T00:00:00Z","timestamp":1702684800000},"content-version":"stm-asf","delay-in-days":0,"URL":"https:\/\/doi.org\/10.15223\/policy-037"}],"content-domain":{"domain":[],"crossmark-restriction":false},"short-container-title":[],"published-print":{"date-parts":[[2023,12,16]]},"DOI":"10.1109\/asru57964.2023.10389666","type":"proceedings-article","created":{"date-parts":[[2024,1,19]],"date-time":"2024-01-19T13:38:40Z","timestamp":1705671520000},"page":"1-7","source":"Crossref","is-referenced-by-count":8,"title":["LibriSpeech-PC: Benchmark for Evaluation of Punctuation and Capitalization Capabilities of End-to-End ASR Models"],"prefix":"10.1109","author":[{"given":"Aleksandr","family":"Meister","sequence":"first","affiliation":[{"name":"NVIDIA,Yerevan,Armenia"}]},{"given":"Matvei","family":"Novikov","sequence":"additional","affiliation":[{"name":"NVIDIA,Yerevan,Armenia"}]},{"given":"Nikolay","family":"Karpov","sequence":"additional","affiliation":[{"name":"NVIDIA,Yerevan,Armenia"}]},{"given":"Evelina","family":"Bakhturina","sequence":"additional","affiliation":[{"name":"NVIDIA,Santa Clara,USA"}]},{"given":"Vitaly","family":"Lavrukhin","sequence":"additional","affiliation":[{"name":"NVIDIA,Santa Clara,USA"}]},{"given":"Boris","family":"Ginsburg","sequence":"additional","affiliation":[{"name":"NVIDIA,Santa Clara,USA"}]}],"member":"263","reference":[{"key":"ref1","doi-asserted-by":"publisher","DOI":"10.18653\/v1\/2022.iwslt-1.18"},{"key":"ref2","doi-asserted-by":"publisher","DOI":"10.1007\/s10462-021-10051-x"},{"key":"ref3","article-title":"Robust speech recognition via large-scale weak supervision","author":"Radford","year":"2022","journal-title":"arXiv:2212.04356"},{"key":"ref4","doi-asserted-by":"publisher","DOI":"10.1109\/ICASSP.2015.7178964"},{"key":"ref5","article-title":"Can prosody aid the automatic processing of multiparty meetings? Evidence from predicting punctuation, disfluencies, and overlapping speech","volume-title":"Proceedings of the ITRW on Prosody in Speech Recognition and Understanding","author":"Shriberg"},{"key":"ref6","article-title":"Punctuation annotation using statistical prosody models","volume-title":"Proceedings of the ITRW on Prosody in Speech Recognition and Understanding","author":"Christensen"},{"key":"ref7","doi-asserted-by":"publisher","DOI":"10.21437\/Interspeech.2015-240"},{"key":"ref8","doi-asserted-by":"publisher","DOI":"10.21437\/Interspeech.2018-1096"},{"key":"ref9","doi-asserted-by":"publisher","DOI":"10.1109\/O-COCOSDA46868.2019.9041202"},{"key":"ref10","doi-asserted-by":"publisher","DOI":"10.21437\/Interspeech.2020-3074"},{"key":"ref11","article-title":"End to end ASR system with automatic punctuation insertion","author":"Guan","year":"2020","journal-title":"arXiv:2012.02012"},{"key":"ref12","doi-asserted-by":"publisher","DOI":"10.21437\/Interspeech.2022-5"},{"key":"ref13","doi-asserted-by":"publisher","DOI":"10.1109\/ICASSP43922.2022.9746366"},{"key":"ref14","doi-asserted-by":"publisher","DOI":"10.21437\/interspeech.2020-3015"},{"key":"ref15","doi-asserted-by":"publisher","DOI":"10.18653\/vl\/N19-142"},{"key":"ref16","article-title":"Adam: A method for stochastic optimization","author":"Kingma","year":"2015","journal-title":"ICLR"},{"key":"ref17","article-title":"Decoupled weight decay regularization","author":"Loshchilov","year":"2019","journal-title":"ICLR"},{"key":"ref18","doi-asserted-by":"publisher","DOI":"10.18653\/v1\/p18-1007"},{"key":"ref19","doi-asserted-by":"publisher","DOI":"10.21437\/Interspeech.2021-462"},{"key":"ref20","doi-asserted-by":"publisher","DOI":"10.18653\/v1\/2021.acl-short.24"}],"event":{"name":"2023 IEEE Automatic Speech Recognition and Understanding Workshop (ASRU)","location":"Taipei, Taiwan","start":{"date-parts":[[2023,12,16]]},"end":{"date-parts":[[2023,12,20]]}},"container-title":["2023 IEEE Automatic Speech Recognition and Understanding Workshop (ASRU)"],"original-title":[],"link":[{"URL":"http:\/\/xplorestaging.ieee.org\/ielx7\/10388490\/10389614\/10389666.pdf?arnumber=10389666","content-type":"unspecified","content-version":"vor","intended-application":"similarity-checking"}],"deposited":{"date-parts":[[2024,1,23]],"date-time":"2024-01-23T11:42:29Z","timestamp":1706010149000},"score":1,"resource":{"primary":{"URL":"https:\/\/ieeexplore.ieee.org\/document\/10389666\/"}},"subtitle":[],"short-title":[],"issued":{"date-parts":[[2023,12,16]]},"references-count":20,"URL":"https:\/\/doi.org\/10.1109\/asru57964.2023.10389666","relation":{},"subject":[],"published":{"date-parts":[[2023,12,16]]}}}