{"status":"ok","message-type":"work","message-version":"1.0.0","message":{"indexed":{"date-parts":[[2025,3,26]],"date-time":"2025-03-26T22:11:45Z","timestamp":1743027105266,"version":"3.40.3"},"publisher-location":"Berlin, Heidelberg","reference-count":16,"publisher":"Springer Berlin Heidelberg","isbn-type":[{"type":"print","value":"9783642250842"},{"type":"electronic","value":"9783642250859"}],"license":[{"start":{"date-parts":[[2011,1,1]],"date-time":"2011-01-01T00:00:00Z","timestamp":1293840000000},"content-version":"unspecified","delay-in-days":0,"URL":"http:\/\/www.springer.com\/tdm"}],"content-domain":{"domain":[],"crossmark-restriction":false},"short-container-title":[],"published-print":{"date-parts":[[2011]]},"DOI":"10.1007\/978-3-642-25085-9_66","type":"book-chapter","created":{"date-parts":[[2011,11,11]],"date-time":"2011-11-11T15:03:34Z","timestamp":1321023814000},"page":"557-564","source":"Crossref","is-referenced-by-count":3,"title":["Improvements on Automatic Speech Segmentation at the Phonetic Level"],"prefix":"10.1007","author":[{"given":"Jon Ander","family":"G\u00f3mez","sequence":"first","affiliation":[]},{"given":"Marcos","family":"Calvo","sequence":"additional","affiliation":[]}],"member":"297","reference":[{"issue":"6","key":"66_CR1","doi-asserted-by":"publisher","first-page":"617","DOI":"10.1109\/TSA.2003.813579","volume":"11","author":"D.T. Toledano","year":"2003","unstructured":"Toledano, D.T., Hern\u00e1ndez G\u00f3mez, L., Villarrubia Grande, L.: Automatic Phonetic Segmentation. IEEE Transactions on Speech and Audio Processing\u00a011(6), 617\u2013625 (2003)","journal-title":"IEEE Transactions on Speech and Audio Processing"},{"key":"66_CR2","doi-asserted-by":"crossref","unstructured":"Kipp, A., Wesenick, M.B., Schiel, F.: Pronunciation modelling applied to automatic segmentation of spontaneous speech. In: Proceedings of Eurospeech, Rhodes, Greece, pp. 2013\u20132026 (1997)","DOI":"10.21437\/Eurospeech.1997-358"},{"key":"66_CR3","doi-asserted-by":"crossref","unstructured":"Sethy, A., Narayanan, S.: Refined Speech Segmentation for Concatenative Speech Synthesis. In: Proceedings of ICSLP, Denver, Colorado, USA, pp. 149\u2013152 (2002)","DOI":"10.21437\/ICSLP.2002-89"},{"key":"66_CR4","doi-asserted-by":"crossref","unstructured":"Jarify, S., Pastor, D., Rosec, O.: Cooperation between global and local methods for the automatic segmentation of speech synthesis corpora. In: Proceedings of Interspeech, Pittsburgh, Pennsylvania, USA, pp. 1666\u20131669 (2006)","DOI":"10.21437\/Interspeech.2006-464"},{"key":"66_CR5","doi-asserted-by":"crossref","unstructured":"Romsdorfer, H., Pfister, B.: Phonetic Labeling and Segmentation of Mixed-Lingual Prosody Databases. In: Proceedings of Interspeech, Lisbon, Portual, pp. 3281\u20133284 (2005)","DOI":"10.21437\/Interspeech.2005-572"},{"key":"66_CR6","doi-asserted-by":"crossref","unstructured":"Paulo, S., Oliveira, L.C.: DTW-based Phonetic Alignment Using Multiple Acoustic Features. In: Proceedings of Eurospeech, Geneva, Switzerland, pp. 309\u2013312 (2003)","DOI":"10.21437\/Eurospeech.2003-126"},{"key":"66_CR7","doi-asserted-by":"crossref","unstructured":"Park, S.S., Shin, J.W., Kim, N.S.: Automatic Speech Segmentation with Multiple Statistical Models. In: Proceedings of Interspeech, Pittsburgh, Pennsylvania, USA, pp. 2066\u20132069 (2006)","DOI":"10.21437\/Interspeech.2006-406"},{"key":"66_CR8","doi-asserted-by":"publisher","first-page":"273","DOI":"10.1016\/j.csl.2009.04.004","volume":"24","author":"I. Mporas","year":"2010","unstructured":"Mporas, I., Ganchev, T., Fakotakis, N.: Speech segmentation using regression fusion of boundary predictions. Computer Speech and Language\u00a024, 273\u2013288 (2010)","journal-title":"Computer Speech and Language"},{"key":"66_CR9","doi-asserted-by":"crossref","unstructured":"Povey, D., Woodland, P.C.: Minimum Phone Error and I-smoothing for improved discriminative training. In: Proceedings of ICASSP, Orlando, Florida, USA, pp. 105\u2013108 (2002)","DOI":"10.1109\/ICASSP.2002.1005687"},{"key":"66_CR10","doi-asserted-by":"crossref","unstructured":"Kuo, J.W., Wang, H.M.: Minimum Boundary Error Training for Automatic Phonetic Segmentation. In: Proceedings of Interspeech, Pittsburgh, Pennsylvania, USA, pp. 1217\u20131220 (2006)","DOI":"10.1007\/11939993_43"},{"key":"66_CR11","doi-asserted-by":"crossref","unstructured":"Huggins-Daines, D., Rudnicky, A.I.: A Constrained Baum-Welch Algorithm for Improved Phoneme Segmentation and Efficient Training. In: Proceedings of Interspeech, Pittsburgh, Pennsylvania, USA, pp. 1205\u20131208 (2006)","DOI":"10.21437\/Interspeech.2006-364"},{"key":"66_CR12","doi-asserted-by":"crossref","unstructured":"Ogbureke, K.U., Carson-Berndsen, J.: Improving initial boundary estimation for HMM-based automatic phonetic segmentation. In: Proceedings of Interspeech, Brighton, UK, pp. 884\u2013887 (2009)","DOI":"10.1109\/ICASSP.2010.5494978"},{"key":"66_CR13","series-title":"Lecture Notes in Computer Science","doi-asserted-by":"publisher","first-page":"672","DOI":"10.1007\/3-540-70659-3_70","volume-title":"Structural, Syntactic, and Statistical Pattern Recognition","author":"J.A. G\u00f3mez","year":"2002","unstructured":"G\u00f3mez, J.A., Castro, M.J.: Automatic Segmentation of Speech at the Phonetic Level. In: Caelli, T.M., Amin, A., Duin, R.P.W., Kamel, M.S., de Ridder, D. (eds.) SPR 2002 and SSPR 2002. LNCS, vol.\u00a02396, pp. 672\u2013680. Springer, Heidelberg (2002)"},{"key":"66_CR14","series-title":"Lecture Notes in Computer Science","doi-asserted-by":"publisher","first-page":"540","DOI":"10.1007\/978-3-642-14980-1_53","volume-title":"Structural, Syntactic, and Statistical Pattern Recognition","author":"J.A. G\u00f3mez","year":"2010","unstructured":"G\u00f3mez, J.A., Sanchis, E., Castro-Bleda, M.J.: Automatic Speech Segmentation Based on Acoustical Clustering. In: Hancock, E.R., Wilson, R.C., Windeatt, T., Ulusoy, I., Escolano, F. (eds.) SSPR&SPR 2010. LNCS, vol.\u00a06218, pp. 540\u2013548. Springer, Heidelberg (2010)"},{"key":"66_CR15","doi-asserted-by":"crossref","unstructured":"Moreno, A., Poch, D., Bonafonte, A., Lleida, E., Llisterri, J., Mari\u00f1o, J.B., Nadeu, C.: Albayzin Speech Database: Design of the Phonetic Corpus. In: Proceedings of Eurospeech, Berlin, Germany, vol.\u00a01, pp. 653\u2013656 (September 1993)","DOI":"10.21437\/Eurospeech.1993-66"},{"key":"66_CR16","unstructured":"TIMIT Acoustic-Phonetic Continuous Speech Corpus, National Institute of Standards and Technology Speech Disc 1-1.1, NTIS Order No. PB91-5050651996 (October 1990)"}],"container-title":["Lecture Notes in Computer Science","Progress in Pattern Recognition, Image Analysis, Computer Vision, and Applications"],"original-title":[],"link":[{"URL":"http:\/\/link.springer.com\/content\/pdf\/10.1007\/978-3-642-25085-9_66","content-type":"unspecified","content-version":"vor","intended-application":"similarity-checking"}],"deposited":{"date-parts":[[2023,6,11]],"date-time":"2023-06-11T02:25:34Z","timestamp":1686450334000},"score":1,"resource":{"primary":{"URL":"http:\/\/link.springer.com\/10.1007\/978-3-642-25085-9_66"}},"subtitle":[],"short-title":[],"issued":{"date-parts":[[2011]]},"ISBN":["9783642250842","9783642250859"],"references-count":16,"URL":"https:\/\/doi.org\/10.1007\/978-3-642-25085-9_66","relation":{},"ISSN":["0302-9743","1611-3349"],"issn-type":[{"type":"print","value":"0302-9743"},{"type":"electronic","value":"1611-3349"}],"subject":[],"published":{"date-parts":[[2011]]}}}