{"status":"ok","message-type":"work","message-version":"1.0.0","message":{"indexed":{"date-parts":[[2026,4,14]],"date-time":"2026-04-14T07:35:53Z","timestamp":1776152153803,"version":"3.50.1"},"reference-count":40,"publisher":"Institute of Electrical and Electronics Engineers (IEEE)","issue":"1","license":[{"start":{"date-parts":[[2009,1,1]],"date-time":"2009-01-01T00:00:00Z","timestamp":1230768000000},"content-version":"vor","delay-in-days":0,"URL":"https:\/\/ieeexplore.ieee.org\/Xplorehelp\/downloads\/license-information\/IEEE.html"}],"content-domain":{"domain":[],"crossmark-restriction":false},"short-container-title":["IEEE Trans. Audio Speech Lang. Process."],"published-print":{"date-parts":[[2009,1]]},"DOI":"10.1109\/tasl.2008.2006728","type":"journal-article","created":{"date-parts":[[2009,1,14]],"date-time":"2009-01-14T22:35:19Z","timestamp":1231972519000},"page":"2-12","source":"Crossref","is-referenced-by-count":17,"title":["Automatic Detection of Disfluency Boundaries in Spontaneous Speech of Children Using Audio&amp;#x2013;Visual Information"],"prefix":"10.1109","volume":"17","author":[{"given":"Serdar","family":"Yildirim","sequence":"first","affiliation":[]},{"given":"Shrikanth","family":"Narayanan","sequence":"additional","affiliation":[]}],"member":"263","reference":[{"key":"ref39","doi-asserted-by":"publisher","DOI":"10.1016\/S0031-3203(99)00138-7"},{"key":"ref38","author":"duda","year":"2001","journal-title":"Pattern Classification"},{"key":"ref33","first-page":"11","article-title":"disfluencies in switchboard","author":"shriberg","year":"1996","journal-title":"Proc ICSLP"},{"key":"ref32","doi-asserted-by":"publisher","DOI":"10.1006\/csla.1995.0002"},{"key":"ref31","first-page":"1841","article-title":"reference marking in childrens computer-directed speech: an integrated analysis of discourse and gesture","author":"montanari","year":"2004","journal-title":"Proc ICSLP"},{"key":"ref30","article-title":"analyzing the interplay between spoken language and gestural cues in conversational childmachine interactions in pre\/early literate age group","author":"montanari","year":"2004","journal-title":"Proc InStil"},{"key":"ref37","doi-asserted-by":"publisher","DOI":"10.1006\/anbe.2002.3015"},{"key":"ref36","doi-asserted-by":"publisher","DOI":"10.1109\/34.368151"},{"key":"ref35","doi-asserted-by":"publisher","DOI":"10.1007\/BF01420984"},{"key":"ref34","first-page":"901","article-title":"srilman extensible language modeling toolkit","volume":"2","author":"stolcke","year":"2002","journal-title":"Proc ICSLP"},{"key":"ref10","doi-asserted-by":"publisher","DOI":"10.1109\/89.985544"},{"key":"ref40","doi-asserted-by":"publisher","DOI":"10.1023\/A:1022859003006"},{"key":"ref11","doi-asserted-by":"publisher","DOI":"10.1109\/ICASSP.1996.541104"},{"key":"ref12","doi-asserted-by":"publisher","DOI":"10.1109\/ICASSP.1998.674460"},{"key":"ref13","article-title":"childrens speech recognition with application to interactive books and tutors","author":"hagen","year":"2003","journal-title":"Proc IEEE ASRU Workshop"},{"key":"ref14","first-page":"2337","article-title":"an analysis of the causes of increased error rated in children's speech recognition","author":"li","year":"2002","journal-title":"Proc ICSLP"},{"key":"ref15","doi-asserted-by":"crossref","first-page":"319","DOI":"10.7551\/mitpress\/2697.003.0014","author":"oviatt","year":"2000","journal-title":"Embodied Conversational Agents"},{"key":"ref16","first-page":"525","article-title":"a multi-pass linear fold algorithm for sentence boundary detection using prosodic cues","volume":"1","author":"wang","year":"2004","journal-title":"Proc ICASSP"},{"key":"ref17","doi-asserted-by":"publisher","DOI":"10.1075\/gest.1.1.03mcn"},{"key":"ref18","doi-asserted-by":"publisher","DOI":"10.1145\/568513.568514"},{"key":"ref19","doi-asserted-by":"publisher","DOI":"10.1109\/TASL.2007.905145"},{"key":"ref28","author":"boersma","year":"2005","journal-title":"?Praat Doing Phonetics by Computer ?"},{"key":"ref4","author":"shriberg","year":"1994","journal-title":"Preliminaries to a theory of speech disfluencies"},{"key":"ref27","first-page":"197","article-title":"cu animate tools for enabling conversations with animated characters","volume":"1","author":"ma","year":"2002","journal-title":"Proc ICSLP"},{"key":"ref3","first-page":"206","article-title":"automatic detection and classification of disfluent reading miscues in young childrens speech for the purpose of assessment","author":"black","year":"2007","journal-title":"Proc InterSpeech ICSLP"},{"key":"ref6","doi-asserted-by":"crossref","first-page":"2383","DOI":"10.21437\/Eurospeech.1997-626","article-title":"a prosody-only decision-tree model for disfluency detection","author":"shriberg","year":"1997","journal-title":"Proc EUROSPEECH"},{"key":"ref29","doi-asserted-by":"crossref","first-page":"1367","DOI":"10.21437\/Eurospeech.2001-354","article-title":"anvila generic annotation tool for multimodal dialogue","author":"kipp","year":"2001","journal-title":"Proc EUROSPEECH"},{"key":"ref5","doi-asserted-by":"publisher","DOI":"10.1109\/ICASSP.1996.541118"},{"key":"ref8","doi-asserted-by":"crossref","first-page":"957","DOI":"10.21437\/Eurospeech.2003-332","article-title":"automatic disfluency identification in conversational speech using multiple knowledge source","author":"liu","year":"2003","journal-title":"Proc EUROSPEECH"},{"key":"ref7","first-page":"2247","article-title":"automatic detection of sentence boundaries and disfluencies based on recognized words","author":"stolcke","year":"1998","journal-title":"Proc ICSLP"},{"key":"ref2","doi-asserted-by":"publisher","DOI":"10.3115\/1220355.1220537"},{"key":"ref9","doi-asserted-by":"publisher","DOI":"10.1121\/1.426686"},{"key":"ref1","doi-asserted-by":"crossref","first-page":"3165","DOI":"10.21437\/Eurospeech.2003-791","article-title":"evaluating the effect of predicting oral reading miscues","author":"banerjee","year":"2003","journal-title":"Proc EUROSPEECH"},{"key":"ref20","doi-asserted-by":"publisher","DOI":"10.1109\/TASL.2006.885910"},{"key":"ref22","doi-asserted-by":"publisher","DOI":"10.3115\/1073012.1073028"},{"key":"ref21","article-title":"analysis of speech and gesture frequency during fluent and hesitant phases in speech","author":"valbonesi","year":"2002","journal-title":"Proc 6th Multi-Conf Syst Cybern Inf (SCI 2002)"},{"key":"ref24","doi-asserted-by":"publisher","DOI":"10.1109\/TMM.2004.840590"},{"key":"ref23","doi-asserted-by":"publisher","DOI":"10.1109\/ICMI.2002.1166985"},{"key":"ref26","doi-asserted-by":"publisher","DOI":"10.1007\/s10994-005-0466-3"},{"key":"ref25","first-page":"121","article-title":"multimodal model integration for sentence unit detection","author":"chen","year":"2004","journal-title":"Proc ICMI"}],"container-title":["IEEE Transactions on Audio, Speech, and Language Processing"],"original-title":[],"link":[{"URL":"http:\/\/xplorestaging.ieee.org\/ielx5\/10376\/4740138\/04740159.pdf?arnumber=4740159","content-type":"unspecified","content-version":"vor","intended-application":"similarity-checking"}],"deposited":{"date-parts":[[2024,3,9]],"date-time":"2024-03-09T01:48:29Z","timestamp":1709948909000},"score":1,"resource":{"primary":{"URL":"http:\/\/ieeexplore.ieee.org\/document\/4740159\/"}},"subtitle":[],"short-title":[],"issued":{"date-parts":[[2009,1]]},"references-count":40,"journal-issue":{"issue":"1"},"URL":"https:\/\/doi.org\/10.1109\/tasl.2008.2006728","relation":{},"ISSN":["1558-7916"],"issn-type":[{"value":"1558-7916","type":"print"}],"subject":[],"published":{"date-parts":[[2009,1]]}}}