{"status":"ok","message-type":"work","message-version":"1.0.0","message":{"indexed":{"date-parts":[[2025,12,21]],"date-time":"2025-12-21T06:25:55Z","timestamp":1766298355197},"reference-count":46,"publisher":"Institute of Electrical and Electronics Engineers (IEEE)","issue":"8","license":[{"start":{"date-parts":[[2013,8,1]],"date-time":"2013-08-01T00:00:00Z","timestamp":1375315200000},"content-version":"vor","delay-in-days":0,"URL":"https:\/\/ieeexplore.ieee.org\/Xplorehelp\/downloads\/license-information\/IEEE.html"}],"content-domain":{"domain":[],"crossmark-restriction":false},"short-container-title":["IEEE Trans. Audio Speech Lang. Process."],"published-print":{"date-parts":[[2013,8]]},"DOI":"10.1109\/tasl.2013.2260744","type":"journal-article","created":{"date-parts":[[2013,5,1]],"date-time":"2013-05-01T11:57:19Z","timestamp":1367409439000},"page":"1742-1754","source":"Crossref","is-referenced-by-count":9,"title":["Model-Based Multiple Pitch Tracking Using Factorial HMMs: Model Adaptation and Inference"],"prefix":"10.1109","volume":"21","author":[{"given":"Michael","family":"Wohlmayr","sequence":"first","affiliation":[]},{"given":"Franz","family":"Pernkopf","sequence":"additional","affiliation":[]}],"member":"263","reference":[{"key":"ref39","doi-asserted-by":"publisher","DOI":"10.1017\/CBO9780511804441"},{"key":"ref38","doi-asserted-by":"publisher","DOI":"10.1007\/978-0-387-45528-0"},{"key":"ref33","doi-asserted-by":"publisher","DOI":"10.1109\/ICASSP.2009.4959533"},{"key":"ref32","doi-asserted-by":"publisher","DOI":"10.1109\/89.279273"},{"key":"ref31","doi-asserted-by":"publisher","DOI":"10.1109\/89.876308"},{"key":"ref30","doi-asserted-by":"publisher","DOI":"10.1109\/89.279278"},{"key":"ref37","first-page":"1969","article-title":"EM-based gain adaptation for probabilistic multipitch tracking","author":"wohlmayr","year":"2011","journal-title":"Proc Int Conf Spoken Lang Process"},{"key":"ref36","first-page":"24","article-title":"The Iroquois model: Using temporal dynamics to separate speakers","author":"rennie","year":"2006","journal-title":"Proc Workshop Statist Percept Audition"},{"key":"ref35","doi-asserted-by":"publisher","DOI":"10.1109\/ICASSP.2010.5495323"},{"key":"ref34","first-page":"89","article-title":"Speech recognition using factorial hidden Markov models for separation in the feature space","author":"virtanen","year":"2006","journal-title":"Proc Int Conf Spoken Lang Process"},{"key":"ref10","doi-asserted-by":"crossref","first-page":"788","DOI":"10.1038\/44565","article-title":"Learning the parts of objects by nonnegative matrix factorization","volume":"401","author":"lee","year":"1999","journal-title":"Nature"},{"key":"ref40","author":"petersen","year":"2008","journal-title":"The Matrix Cookbook"},{"key":"ref11","doi-asserted-by":"publisher","DOI":"10.1109\/TASL.2006.876726"},{"key":"ref12","doi-asserted-by":"publisher","DOI":"10.1109\/TASL.2006.885253"},{"key":"ref13","doi-asserted-by":"publisher","DOI":"10.1016\/j.csl.2009.02.006"},{"key":"ref14","doi-asserted-by":"publisher","DOI":"10.1109\/MSP.2010.938081"},{"key":"ref15","doi-asserted-by":"publisher","DOI":"10.1016\/j.csl.2008.11.001"},{"key":"ref16","doi-asserted-by":"publisher","DOI":"10.1109\/TASL.2010.2064309"},{"key":"ref17","doi-asserted-by":"publisher","DOI":"10.1121\/1.405712"},{"key":"ref18","doi-asserted-by":"publisher","DOI":"10.1109\/TNN.2004.832812"},{"key":"ref19","author":"christensen","year":"2008","journal-title":"Multi-Pitch Estimation"},{"key":"ref28","doi-asserted-by":"publisher","DOI":"10.1006\/csla.1995.0010"},{"key":"ref4","year":"2006","journal-title":"Computational Auditory Scene Analysis Principles Algorithms and Applications"},{"key":"ref27","doi-asserted-by":"publisher","DOI":"10.1109\/ASRU.2009.5373446"},{"key":"ref3","doi-asserted-by":"crossref","DOI":"10.1201\/9781420015836","author":"loizou","year":"2007","journal-title":"Speech Enhancement Theory and Practice"},{"key":"ref6","author":"roweis","year":"2000","journal-title":"Advances in Neural Information Processing Systems (NIPS'00)"},{"key":"ref29","doi-asserted-by":"publisher","DOI":"10.1006\/csla.1996.0013"},{"key":"ref5","doi-asserted-by":"crossref","first-page":"1009","DOI":"10.21437\/Eurospeech.2003-345","article-title":"Factorial models and refiltering for speech separation and denoising","author":"roweis","year":"2003","journal-title":"Proc 8th Eur Conf Speech Commun Technol (Eurospeech)"},{"key":"ref8","doi-asserted-by":"crossref","first-page":"140","DOI":"10.1007\/978-3-642-15995-4_18","volume":"6365","author":"mysore","year":"2010","journal-title":"Latent Variable Analysis and Signal Separation"},{"key":"ref7","doi-asserted-by":"publisher","DOI":"10.1109\/ASPAA.2011.6082324"},{"key":"ref2","author":"benesty","year":"2007","journal-title":"Springer Handbook of Speech Processing"},{"key":"ref1","doi-asserted-by":"publisher","DOI":"10.1121\/1.1907229"},{"key":"ref9","doi-asserted-by":"publisher","DOI":"10.1109\/ASPAA.2009.5346527"},{"key":"ref46","doi-asserted-by":"publisher","DOI":"10.1109\/TSA.2003.811539"},{"key":"ref20","doi-asserted-by":"crossref","DOI":"10.1007\/978-3-642-81926-1","author":"hess","year":"1983","journal-title":"Pitch Determination of Speech Signals Algorithms and Devices"},{"key":"ref45","first-page":"495","article-title":"A robust algorithm for pitch tracking (RAPT)","author":"talkin","year":"1995","journal-title":"Speech Coding and Synthesis Elsevier"},{"key":"ref22","doi-asserted-by":"publisher","DOI":"10.1109\/ICASSP.1990.115970"},{"key":"ref21","doi-asserted-by":"publisher","DOI":"10.1023\/A:1007425814087"},{"key":"ref24","author":"wohlmayr","year":"2012","journal-title":"Probabilistic model-based multiple pitch tracking of speech"},{"key":"ref42","doi-asserted-by":"publisher","DOI":"10.1007\/978-94-011-5014-9_12"},{"key":"ref23","doi-asserted-by":"publisher","DOI":"10.1109\/29.35387"},{"key":"ref41","author":"moon","year":"2000","journal-title":"Mathematical Methods and Algorithms for Signal Processing"},{"key":"ref44","doi-asserted-by":"publisher","DOI":"10.1121\/1.2229005"},{"key":"ref26","author":"mclachlan","year":"1988","journal-title":"Mixture Models Inference and Applications to Clustering"},{"key":"ref43","first-page":"1509","article-title":"A pitch tracking corpus with evaluation on multipitch tracking scenario","author":"pirker","year":"2011","journal-title":"Proc Int Conf Spoken Lang Process"},{"key":"ref25","first-page":"1","article-title":"Maximum likelihood from incomplete data via the EM algorithm","volume":"b30","author":"dempster","year":"1977","journal-title":"J Roy Statist Soc"}],"container-title":["IEEE Transactions on Audio, Speech, and Language Processing"],"original-title":[],"link":[{"URL":"http:\/\/xplorestaging.ieee.org\/ielx7\/10376\/6508879\/06510492.pdf?arnumber=6510492","content-type":"unspecified","content-version":"vor","intended-application":"similarity-checking"}],"deposited":{"date-parts":[[2024,5,9]],"date-time":"2024-05-09T22:37:36Z","timestamp":1715294256000},"score":1,"resource":{"primary":{"URL":"http:\/\/ieeexplore.ieee.org\/document\/6510492\/"}},"subtitle":[],"short-title":[],"issued":{"date-parts":[[2013,8]]},"references-count":46,"journal-issue":{"issue":"8"},"URL":"https:\/\/doi.org\/10.1109\/tasl.2013.2260744","relation":{},"ISSN":["1558-7916","1558-7924"],"issn-type":[{"value":"1558-7916","type":"print"},{"value":"1558-7924","type":"electronic"}],"subject":[],"published":{"date-parts":[[2013,8]]}}}