{"status":"ok","message-type":"work","message-version":"1.0.0","message":{"indexed":{"date-parts":[[2026,4,22]],"date-time":"2026-04-22T20:05:48Z","timestamp":1776888348409,"version":"3.51.2"},"reference-count":47,"publisher":"Institute of Electrical and Electronics Engineers (IEEE)","issue":"5","license":[{"start":{"date-parts":[[2011,7,1]],"date-time":"2011-07-01T00:00:00Z","timestamp":1309478400000},"content-version":"vor","delay-in-days":0,"URL":"https:\/\/ieeexplore.ieee.org\/Xplorehelp\/downloads\/license-information\/IEEE.html"}],"content-domain":{"domain":[],"crossmark-restriction":false},"short-container-title":["IEEE Trans. Audio Speech Lang. Process."],"published-print":{"date-parts":[[2011,7]]},"DOI":"10.1109\/tasl.2010.2090144","type":"journal-article","created":{"date-parts":[[2010,11,9]],"date-time":"2010-11-09T19:11:16Z","timestamp":1289329876000},"page":"1289-1300","source":"Crossref","is-referenced-by-count":7,"title":["Speaker Clustering Using Decision Tree-Based Phone Cluster Models With Multi-Space Probability Distributions"],"prefix":"10.1109","volume":"19","author":[{"given":"Han-Ping","family":"Shen","sequence":"first","affiliation":[],"role":[{"role":"author","vocabulary":"crossref"}]},{"given":"Jui-Feng","family":"Yeh","sequence":"additional","affiliation":[],"role":[{"role":"author","vocabulary":"crossref"}]},{"given":"Chung-Hsien","family":"Wu","sequence":"additional","affiliation":[],"role":[{"role":"author","vocabulary":"crossref"}]}],"member":"263","reference":[{"key":"ref39","article-title":"A comparative study of methods for phonetic decision-tree state clustering","author":"nock","year":"1998","journal-title":"Proc ICASSP'98"},{"key":"ref38","doi-asserted-by":"publisher","DOI":"10.1006\/csla.1995.0010"},{"key":"ref33","doi-asserted-by":"publisher","DOI":"10.1109\/TSA.2005.857809"},{"key":"ref32","doi-asserted-by":"publisher","DOI":"10.1109\/TASL.2009.2015089"},{"key":"ref31","doi-asserted-by":"publisher","DOI":"10.1155\/S1110865704408026"},{"key":"ref30","first-page":"1","article-title":"Modelling pitch range variation within and across speakers: Predicting F0 targets when 'Speaking up'","author":"shriberg","year":"1996","journal-title":"Proc Int Conf Speech Lang Process"},{"key":"ref37","doi-asserted-by":"publisher","DOI":"10.1109\/ODYSSEY.2006.248109"},{"key":"ref36","doi-asserted-by":"publisher","DOI":"10.1109\/TSA.2005.852988"},{"key":"ref35","article-title":"Multi-space probability distribution HMM","volume":"e85 d","author":"tokuda","year":"2002","journal-title":"IEICE Trans Inf Syst"},{"key":"ref34","doi-asserted-by":"publisher","DOI":"10.1109\/ICASSP.2003.1202760"},{"key":"ref10","doi-asserted-by":"publisher","DOI":"10.3115\/1620853.1620871"},{"key":"ref40","first-page":"2099","article-title":"Simultaneous modeling of spectrum, pitch and state duration in HMM-based speech synthesis","volume":"j83 d ii","author":"yoshimura","year":"2000","journal-title":"IEICE Trans Inf Syst"},{"key":"ref11","doi-asserted-by":"publisher","DOI":"10.1109\/ICASSP.2009.4960527"},{"key":"ref12","doi-asserted-by":"publisher","DOI":"10.1109\/ICASSP.2008.4518624"},{"key":"ref13","first-page":"4369","article-title":"A novel speaker clustering algorithm via supervised affinity propagation","author":"zhang","year":"2008","journal-title":"Proc ICASSP'08"},{"key":"ref14","first-page":"305","article-title":"Segmental K-means initialization for SOM-based speaker clustering","author":"ben-harush","year":"2008","journal-title":"Proc 50th Int Symp ELMAR"},{"key":"ref15","doi-asserted-by":"publisher","DOI":"10.1109\/MMSP.2008.4665062"},{"key":"ref16","doi-asserted-by":"publisher","DOI":"10.1109\/ISPACS.2006.364902"},{"key":"ref17","doi-asserted-by":"publisher","DOI":"10.1109\/ICME.2008.4607737"},{"key":"ref18","doi-asserted-by":"publisher","DOI":"10.1007\/978-3-540-72847-4_71"},{"key":"ref19","doi-asserted-by":"crossref","DOI":"10.21437\/Interspeech.2008-3","article-title":"Agglomerative hierarchical speaker clustering using incremental Gaussian mixture cluster modeling","author":"han","year":"2008","journal-title":"Proc INTERSPEECH"},{"key":"ref28","first-page":"573","article-title":"Unknown-multiple speaker clustering using HMM","author":"ajmera","year":"2002","journal-title":"Proc Int Conf Spoken Lang Process (ICSLP)"},{"key":"ref4","doi-asserted-by":"publisher","DOI":"10.1109\/ICASSP.2004.1325995"},{"key":"ref27","doi-asserted-by":"publisher","DOI":"10.1016\/j.csl.2008.05.004"},{"key":"ref3","doi-asserted-by":"publisher","DOI":"10.1109\/ICASSP.2006.1660194"},{"key":"ref6","doi-asserted-by":"publisher","DOI":"10.1109\/ICASSP.1993.319322"},{"key":"ref29","doi-asserted-by":"publisher","DOI":"10.1109\/HIS.2009.14"},{"key":"ref5","article-title":"The Cambridge university March 2005 speaker diarisation system","author":"singha","year":"2005","journal-title":"Proc EUROSPEECH'05"},{"key":"ref8","first-page":"108","article-title":"Automatic speaker clustering","author":"jin","year":"1997","journal-title":"Proc DARPA Speech Recognition Workshop"},{"key":"ref7","article-title":"A robust unsupervised speaker clustering of speech utterances","author":"zhang","year":"2005","journal-title":"Proc NLP-KE"},{"key":"ref2","article-title":"Speaker diarization using bottom-up clustering based on a parameter-derived distance between adapted GMMs","author":"ben","year":"2004","journal-title":"Proc ICSLP'04"},{"key":"ref9","doi-asserted-by":"publisher","DOI":"10.1109\/TASL.2006.878256"},{"key":"ref1","doi-asserted-by":"publisher","DOI":"10.1109\/TASL.2006.878261"},{"key":"ref46","year":"2009","journal-title":"The 2009 (RT-09) Rich Transcription Meeting Recognition Evaluation Plan"},{"key":"ref20","doi-asserted-by":"publisher","DOI":"10.1109\/ASRU.2007.4430121"},{"key":"ref45","doi-asserted-by":"crossref","first-page":"330","DOI":"10.1109\/TSA.2005.845820","article-title":"Speech act modeling and verification of spontaneous speech with disfluency in a spoken dialogue system","volume":"13","author":"wu","year":"2005","journal-title":"IEEE Trans Audio Speech Lang Process"},{"key":"ref22","doi-asserted-by":"publisher","DOI":"10.1109\/TASL.2007.894525"},{"key":"ref47","article-title":"The LIA-EURECOM RT'09 speaker diarization system","author":"fredouille","year":"2009","journal-title":"NIST Rich Transcription Workshop RT04"},{"key":"ref21","doi-asserted-by":"crossref","DOI":"10.21437\/Interspeech.2006-164","article-title":"Speaker cluster based GMM tokenization for speaker recognition","author":"ma","year":"2006","journal-title":"Proc INTERSPEECH"},{"key":"ref42","doi-asserted-by":"crossref","first-page":"36","DOI":"10.21437\/Interspeech.2008-7","article-title":"T-Test distance and clustering criterion for speaker diarization","author":"nguyen","year":"2008","journal-title":"Proc Interspeech'08"},{"key":"ref24","author":"benzeghiba","year":"2005","journal-title":"Speech and Speaker Recognition"},{"key":"ref41","first-page":"523","author":"rissanen","year":"1987","journal-title":"Encyclopedia of Statistical Sciences"},{"key":"ref23","doi-asserted-by":"publisher","DOI":"10.3115\/1620853.1620871"},{"key":"ref44","first-page":"1025","article-title":"Purity algorithms for speaker diarization of meetings data","author":"wooters","year":"2006","journal-title":"Proc ICASSP '06"},{"key":"ref26","first-page":"-149i","article-title":"Gender-dependent phonetic refraction for speaker recognition","volume":"1","author":"andrews","year":"2003","journal-title":"Proc IEEE Int Conf Acoust Speech Signal Process (ICASSP'03)"},{"key":"ref43","first-page":"219","article-title":"MATBN&#x2014;A Mandarin Chinese broadcast news corpus","volume":"10","author":"wang","year":"2005","journal-title":"Comput Linguist Chinese Lang Process"},{"key":"ref25","doi-asserted-by":"publisher","DOI":"10.1109\/ICASSP.1990.115560"}],"container-title":["IEEE Transactions on Audio, Speech, and Language Processing"],"original-title":[],"link":[{"URL":"http:\/\/xplorestaging.ieee.org\/ielx5\/10376\/5762410\/05613154.pdf?arnumber=5613154","content-type":"unspecified","content-version":"vor","intended-application":"similarity-checking"}],"deposited":{"date-parts":[[2021,11,13]],"date-time":"2021-11-13T08:56:46Z","timestamp":1636793806000},"score":1,"resource":{"primary":{"URL":"http:\/\/ieeexplore.ieee.org\/document\/5613154\/"}},"subtitle":[],"short-title":[],"issued":{"date-parts":[[2011,7]]},"references-count":47,"journal-issue":{"issue":"5"},"URL":"https:\/\/doi.org\/10.1109\/tasl.2010.2090144","relation":{},"ISSN":["1558-7916","1558-7924"],"issn-type":[{"value":"1558-7916","type":"print"},{"value":"1558-7924","type":"electronic"}],"subject":[],"published":{"date-parts":[[2011,7]]}}}