{"status":"ok","message-type":"work","message-version":"1.0.0","message":{"indexed":{"date-parts":[[2026,5,14]],"date-time":"2026-05-14T21:43:16Z","timestamp":1778794996152,"version":"3.51.4"},"reference-count":39,"publisher":"Institute of Electrical and Electronics Engineers (IEEE)","issue":"9","license":[{"start":{"date-parts":[[2015,9,1]],"date-time":"2015-09-01T00:00:00Z","timestamp":1441065600000},"content-version":"vor","delay-in-days":0,"URL":"https:\/\/ieeexplore.ieee.org\/Xplorehelp\/downloads\/license-information\/IEEE.html"}],"funder":[{"DOI":"10.13039\/100000002","name":"National Institutes of Health and National Institute on Deafness and Other Communicative Disorders","doi-asserted-by":"publisher","award":["1R21DC012558"],"award-info":[{"award-number":["1R21DC012558"]}],"id":[{"id":"10.13039\/100000002","id-type":"DOI","asserted-by":"publisher"}]},{"DOI":"10.13039\/100000002","name":"National Institutes of Health and National Institute on Deafness and Other Communicative Disorders","doi-asserted-by":"publisher","award":["2R01DC006859"],"award-info":[{"award-number":["2R01DC006859"]}],"id":[{"id":"10.13039\/100000002","id-type":"DOI","asserted-by":"publisher"}]},{"DOI":"10.13039\/100000006","name":"Office of Naval Research","doi-asserted-by":"publisher","award":["N000141410722"],"award-info":[{"award-number":["N000141410722"]}],"id":[{"id":"10.13039\/100000006","id-type":"DOI","asserted-by":"publisher"}]}],"content-domain":{"domain":[],"crossmark-restriction":false},"short-container-title":["IEEE\/ACM Trans. Audio Speech Lang. Process."],"published-print":{"date-parts":[[2015,9]]},"DOI":"10.1109\/taslp.2015.2434213","type":"journal-article","created":{"date-parts":[[2015,5,15]],"date-time":"2015-05-15T18:58:25Z","timestamp":1431716305000},"page":"1421-1430","source":"Crossref","is-referenced-by-count":17,"title":["Convex Weighting Criteria for Speaking Rate Estimation"],"prefix":"10.1109","volume":"23","author":[{"family":"Yishan Jiao","sequence":"first","affiliation":[],"role":[{"role":"author","vocabulary":"crossref"}]},{"given":"Visar","family":"Berisha","sequence":"additional","affiliation":[],"role":[{"role":"author","vocabulary":"crossref"}]},{"family":"Ming Tu","sequence":"additional","affiliation":[],"role":[{"role":"author","vocabulary":"crossref"}]},{"given":"Julie","family":"Liss","sequence":"additional","affiliation":[],"role":[{"role":"author","vocabulary":"crossref"}]}],"member":"263","reference":[{"key":"ref39","doi-asserted-by":"publisher","DOI":"10.1044\/1092-4388(2010\/09-0121)"},{"key":"ref38","first-page":"39","author":"miller","year":"1981","journal-title":"Perspectives on the Study of Speech"},{"key":"ref33","doi-asserted-by":"publisher","DOI":"10.1049\/ip-f-1.1980.0010"},{"key":"ref32","doi-asserted-by":"publisher","DOI":"10.1109\/ICASSP.1992.225858"},{"key":"ref31","doi-asserted-by":"publisher","DOI":"10.1080\/10556789908805766"},{"key":"ref30","doi-asserted-by":"publisher","DOI":"10.1007\/978-1-84800-155-8_7"},{"key":"ref37","article-title":"Towards improving statistical model based voice activity detection","author":"tu","year":"2014","journal-title":"Proc Annu Conf Int Speech Commun Assoc"},{"key":"ref36","doi-asserted-by":"publisher","DOI":"10.1109\/9780470043387"},{"key":"ref35","doi-asserted-by":"publisher","DOI":"10.1007\/BF02943243"},{"key":"ref34","doi-asserted-by":"publisher","DOI":"10.1109\/ICASSP.1998.675368"},{"key":"ref10","doi-asserted-by":"publisher","DOI":"10.1016\/j.wocn.2008.08.003"},{"key":"ref11","doi-asserted-by":"publisher","DOI":"10.1044\/2014_JSLHR-S-13-0149"},{"key":"ref12","doi-asserted-by":"publisher","DOI":"10.1007\/s10772-005-4760-z"},{"key":"ref13","doi-asserted-by":"publisher","DOI":"10.1016\/S0167-6393(00)00028-5"},{"key":"ref14","article-title":"Local speaking rate as a combination of syllable and phone rate","author":"pfitzinger","year":"1998","journal-title":"Proc ICSLP"},{"key":"ref15","doi-asserted-by":"publisher","DOI":"10.1109\/ICSLP.1996.607256"},{"key":"ref16","doi-asserted-by":"publisher","DOI":"10.1109\/ICASSP.1998.675422"},{"key":"ref17","doi-asserted-by":"publisher","DOI":"10.1121\/1.380738"},{"key":"ref18","doi-asserted-by":"publisher","DOI":"10.1109\/TASL.2007.905178"},{"key":"ref19","doi-asserted-by":"publisher","DOI":"10.3758\/BRM.41.2.385"},{"key":"ref28","article-title":"Statistical learning theory. 1998","author":"vapnik","year":"1998"},{"key":"ref4","doi-asserted-by":"publisher","DOI":"10.3758\/BF03208147"},{"key":"ref27","author":"garofolo","year":"1993","journal-title":"TIMIT Acoustic-Phonetic Continuous Speech Corpus"},{"key":"ref3","doi-asserted-by":"publisher","DOI":"10.1044\/jshr.3601.41"},{"key":"ref6","doi-asserted-by":"publisher","DOI":"10.1044\/jshr.3805.1001"},{"key":"ref29","article-title":"CVX: Matlab software for disciplined convex programming, version 2.1","author":"grant","year":"2014"},{"key":"ref5","doi-asserted-by":"publisher","DOI":"10.1016\/0093-934X(90)90106-Q"},{"key":"ref8","doi-asserted-by":"publisher","DOI":"10.1044\/1092-4388(2009\/08-0208)"},{"key":"ref7","doi-asserted-by":"publisher","DOI":"10.1016\/j.specom.2007.02.006"},{"key":"ref2","doi-asserted-by":"publisher","DOI":"10.1109\/5.628714"},{"key":"ref1","doi-asserted-by":"crossref","first-page":"2079","DOI":"10.21437\/Eurospeech.1997-550","article-title":"Speech recognition using on-line estimation of speaking rate","volume":"97","author":"morgan","year":"1997","journal-title":"Eurospeech"},{"key":"ref9","doi-asserted-by":"publisher","DOI":"10.1016\/j.jcomdis.2004.12.001"},{"key":"ref20","doi-asserted-by":"publisher","DOI":"10.1109\/ICASSP.2009.4960454"},{"key":"ref22","author":"mujumdar","year":"2006","journal-title":"Estimation of the Number of Syllables Using Hidden Markov Models and Design of A Dysarthria Classifier Using Global Statistics of Speech"},{"key":"ref21","doi-asserted-by":"publisher","DOI":"10.1109\/ICASSP.2000.861830"},{"key":"ref24","doi-asserted-by":"publisher","DOI":"10.1109\/ICASSP.2013.6638958"},{"key":"ref23","first-page":"145","article-title":"A new hybrid approach for automatic speech signal segmentation using silence signal detection, energy convex hull, and spectral variation","author":"zhao","year":"2008","journal-title":"Proc Conf Electr Comput Eng (CCECE)"},{"key":"ref26","first-page":"1324","article-title":"Learning to count objects in images","author":"lempitsky","year":"2010","journal-title":"Adv Neural Inf Process Syst"},{"key":"ref25","first-page":"1721","article-title":"Syllable detection and segmentation using temporal flow neural networks","author":"shastri","year":"1999","journal-title":"Proc 14th Int Congr Phon Sci"}],"container-title":["IEEE\/ACM Transactions on Audio, Speech, and Language Processing"],"original-title":[],"link":[{"URL":"http:\/\/xplorestaging.ieee.org\/ielx7\/6570655\/7118277\/07109110.pdf?arnumber=7109110","content-type":"unspecified","content-version":"vor","intended-application":"similarity-checking"}],"deposited":{"date-parts":[[2023,8,10]],"date-time":"2023-08-10T16:02:48Z","timestamp":1691683368000},"score":1,"resource":{"primary":{"URL":"http:\/\/ieeexplore.ieee.org\/document\/7109110\/"}},"subtitle":[],"short-title":[],"issued":{"date-parts":[[2015,9]]},"references-count":39,"journal-issue":{"issue":"9"},"URL":"https:\/\/doi.org\/10.1109\/taslp.2015.2434213","relation":{},"ISSN":["2329-9290","2329-9304"],"issn-type":[{"value":"2329-9290","type":"print"},{"value":"2329-9304","type":"electronic"}],"subject":[],"published":{"date-parts":[[2015,9]]}}}