{"status":"ok","message-type":"work","message-version":"1.0.0","message":{"indexed":{"date-parts":[[2025,10,14]],"date-time":"2025-10-14T01:09:04Z","timestamp":1760404144879},"reference-count":62,"publisher":"Springer Science and Business Media LLC","issue":"2","license":[{"start":{"date-parts":[[2014,2,15]],"date-time":"2014-02-15T00:00:00Z","timestamp":1392422400000},"content-version":"unspecified","delay-in-days":0,"URL":"http:\/\/creativecommons.org\/licenses\/by\/2.0"}],"content-domain":{"domain":[],"crossmark-restriction":false},"short-container-title":["Data Min Knowl Disc"],"published-print":{"date-parts":[[2015,3]]},"DOI":"10.1007\/s10618-014-0345-2","type":"journal-article","created":{"date-parts":[[2014,2,17]],"date-time":"2014-02-17T16:53:08Z","timestamp":1392655988000},"page":"358-399","source":"Crossref","is-referenced-by-count":17,"title":["Using the minimum description length to discover the intrinsic cardinality and dimensionality of time series"],"prefix":"10.1007","volume":"29","author":[{"given":"Bing","family":"Hu","sequence":"first","affiliation":[]},{"given":"Thanawin","family":"Rakthanmanon","sequence":"additional","affiliation":[]},{"given":"Yuan","family":"Hao","sequence":"additional","affiliation":[]},{"given":"Scott","family":"Evans","sequence":"additional","affiliation":[]},{"given":"Stefano","family":"Lonardi","sequence":"additional","affiliation":[]},{"given":"Eamonn","family":"Keogh","sequence":"additional","affiliation":[]}],"member":"297","published-online":{"date-parts":[[2014,2,15]]},"reference":[{"key":"345_CR1","doi-asserted-by":"crossref","unstructured":"Assent I, Krieger R, Afschari F, Seidl T (2008) The TS-Tree: Efficient Time Series Search and Retrieval. In: EDBT. ACM, New York","DOI":"10.1145\/1353343.1353376"},{"key":"345_CR2","doi-asserted-by":"crossref","first-page":"3196","DOI":"10.1016\/j.bpj.2009.09.031","volume":"97","author":"JE Bronson","year":"2009","unstructured":"Bronson JE, Fei J, Hofman JM, Gonzalez RL, Wiggins CH (2009) Learning rates and states from biophysical time series: a Bayesian approach to model selection and single-molecule FRET data. Biophys J 97:3196\u20133205","journal-title":"Biophys J"},{"key":"345_CR3","doi-asserted-by":"crossref","unstructured":"Camerra A, Palpanas T, Shieh J, Keogh E (2010) $$i$$ i SAX 2.0: indexing and mining one billion time series. In: International conference on data mining","DOI":"10.1109\/ICDM.2010.124"},{"key":"345_CR4","doi-asserted-by":"crossref","first-page":"3","DOI":"10.1145\/1541880.1541882","volume":"41","author":"V Chandola","year":"2009","unstructured":"Chandola V, Banerjee A, Kumar V (2009) Anomaly detection: a survey. ACM Comput Surv 41:3","journal-title":"ACM Comput Surv"},{"key":"345_CR5","doi-asserted-by":"crossref","first-page":"834","DOI":"10.1111\/j.1467-9892.2008.00585.x","volume":"29","author":"RA Davis","year":"2008","unstructured":"Davis RA, Lee TCM, Rodriguez-Yam G (2008) Break detection for a class of nonlinear time series models. J Time Ser Anal 29:834\u2013867","journal-title":"J Time Ser Anal"},{"key":"345_CR6","doi-asserted-by":"crossref","unstructured":"De Rooij S, Vit\u00e1nyi P (2012) Approximating rate-distortion graphs of individual data: experiments in Lossy compression and denoising. IEEE Trans Comput 61(3):395\u2013407","DOI":"10.1109\/TC.2011.25"},{"key":"345_CR7","doi-asserted-by":"crossref","unstructured":"Ding H, Trajcevski G, Scheuermann P, Wang X, Keogh E (2008) Querying and mining of time series data: experimental comparison of representations and distance measures. In: VLDB, Auckland, pp 1542\u20131552","DOI":"10.14778\/1454159.1454226"},{"key":"345_CR8","doi-asserted-by":"crossref","first-page":"425","DOI":"10.1093\/biomet\/81.3.425","volume":"81","author":"DL Donoho","year":"1994","unstructured":"Donoho DL, Johnstone IM (1994) Ideal spatial adaptation via wavelet shrinkage. J Biometrika 81:425\u2013455","journal-title":"J Biometrika"},{"key":"345_CR9","doi-asserted-by":"crossref","unstructured":"Evans SC et al (2007) Microrna target detection and analysis for genes related to breast cancer using MDL compress. EURASIP J Bioinform Syst Biol 1\u201316","DOI":"10.1155\/2007\/43670"},{"key":"345_CR10","unstructured":"Firoiu L, Cohen PR (2002) Segmenting time series with a hybrid neural networks hidden Markov model. In: Proceedings of 8th national conference on artificial Intelligence, p 247"},{"key":"345_CR11","doi-asserted-by":"crossref","unstructured":"Garc\u00eda-L\u00f3pez D, Acosta-Mesa H (2009) Discretization of time series dataset with a genetic search. In: MICAI. Springer, Berlin, pp 201\u2013212","DOI":"10.1007\/978-3-642-05258-3_18"},{"key":"345_CR12","unstructured":"Goebel K, Saha B, Saxena A (2008) A comparsion of three data-driven techniques for prognostics. In: Failure prevention for system availability, 62th meeting of the MFPT Society, pp 119\u2013131"},{"key":"345_CR13","doi-asserted-by":"crossref","DOI":"10.7551\/mitpress\/1114.001.0001","volume-title":"Advances in minimum description length: theory and applications","author":"PD Gr\u00fcnwald","year":"2005","unstructured":"Gr\u00fcnwald PD, Myung IJ, Pitt MA (2005) Advances in minimum description length: theory and applications. MIT, Cambridge"},{"key":"345_CR14","doi-asserted-by":"crossref","unstructured":"Heimes FO, BAE Systems (2008) Recurrent neural networks for remaining useful life estimation. In: International conference on prognostics and health management","DOI":"10.1109\/PHM.2008.4711422"},{"key":"345_CR15","doi-asserted-by":"crossref","unstructured":"Hu B, Rakthanmanon T, Hao Y, Evans S, Lonardi S, Keogh E (2011) Discovering the intrinsic cardinality and dimensionality of time series using MDL. In: ICDM","DOI":"10.1109\/ICDM.2011.54"},{"key":"345_CR16","unstructured":"International Business Machiness (IBM) (2012) Harness the power of big data. www.public.dhe.ibm.com\/common\/ssi\/ecm\/en\/imm14100usen\/IMM14100USEN.PDF . Accessed 7 Nov 2012"},{"key":"345_CR17","unstructured":"Jonyer I, Holder LB, Cook DJ (2004) Attribute-value selection based on minimum description length. In: International conference on artificial intelligence"},{"key":"345_CR18","doi-asserted-by":"crossref","unstructured":"Kehagias Ath (2004) A hidden Markov model segmentation procedure for hydrological and enviromental time series. Stoch Environ Res Risk Assess 18:117\u2013130","DOI":"10.1007\/s00477-003-0145-5"},{"key":"345_CR19","unstructured":"Keogh E, Chu S, Hart D, Pazzani M (2011) An online algorithm for segmenting time series. In: KDD"},{"key":"345_CR20","doi-asserted-by":"crossref","unstructured":"Keogh E, Kasetty S (2003) On the need for time series data mining benchmarks: a survey and empirical demonstration. J Data Min Knowl Discov 7(4):349\u2013371","DOI":"10.1023\/A:1024988512476"},{"key":"345_CR21","doi-asserted-by":"crossref","unstructured":"Keogh E, Pazzani MJ (2000) A simple dimensionality reduction technique for fast similarity search in large time series databases. In: PAKDD, pp 122\u2013133","DOI":"10.1007\/3-540-45571-X_14"},{"key":"345_CR22","unstructured":"Keogh E, Zhu Q, Hu B, Hao Y, Xi X, Wei L, Ratanamahatana CA (2006) The UCR time series classification \/clustering. www.cs.ucr.edu\/~eamonn\/time_series_data\/"},{"key":"345_CR23","unstructured":"Kontkanen P, Myllym P (2007) \u201cMDL histogram density estimation. In: Proceedings of the eleventh international workshop on artificial intelligence and statistics"},{"key":"345_CR24","doi-asserted-by":"crossref","unstructured":"Lemire D (2007) A better alternative to piecewise linear time series segmentation. In: SDM","DOI":"10.1137\/1.9781611972771.59"},{"key":"345_CR25","doi-asserted-by":"crossref","DOI":"10.1007\/978-1-4757-2606-0","volume-title":"An introduction to Kolmogorov complexity and its applications","author":"M Li","year":"1997","unstructured":"Li M (1997) An introduction to Kolmogorov complexity and its applications, 2nd edn. Springer, Berlin","edition":"2"},{"key":"345_CR26","unstructured":"Lin J, Keogh E, Lonardi S, Patel P (2002) Finding motifs in time series. In: Proceedings of 2nd workshop on temporal data mining"},{"issue":"2","key":"345_CR27","first-page":"107","volume":"15","author":"J Lin","year":"2007","unstructured":"Lin J, Keogh E, Wei L, Lonardi S (2007) Experiencing SAX: a novel symbolic representation of time series. J DMKD 15(2):107\u2013144","journal-title":"J DMKD"},{"key":"345_CR28","unstructured":"Linacre E, Geerts B (2011) Resources in atmospheric science, 2002. http:\/\/www-das.uwyo.edu\/~geerts\/cwx\/notes\/chap15\/global_temp.html . Accessed 1 Dec 2011"},{"key":"345_CR29","first-page":"31","volume":"78","author":"K Malatesta","year":"2005","unstructured":"Malatesta K, Beck S, Menali G, Waagen E (2005) The AAVSO data validation project. J Am Assoc Variable Star Observ (JAAVSO) 78:31\u201344","journal-title":"J Am Assoc Variable Star Observ (JAAVSO)"},{"key":"345_CR30","doi-asserted-by":"crossref","first-page":"046207","DOI":"10.1103\/PhysRevE.80.046207","volume":"80","author":"YI Molkov","year":"2009","unstructured":"Molkov YI, Mukhin DN, Loskutov EM, Feigin AM (2009) Using the minimum description length principle for global reconstruction of dynamic systems from noisy time series. Phys Rev E 80:046207","journal-title":"Phys Rev E"},{"key":"345_CR31","doi-asserted-by":"crossref","unstructured":"M\u00f6rchen F, Ultsch A (2005) Optimizing time series discretization for knowledge discovery. In: KDD","DOI":"10.1145\/1081870.1081953"},{"key":"345_CR32","unstructured":"National Aeronautics and Space Administration (2011) GISS surface temperature analysis. http:\/\/data.giss.nasa.gov\/gistemp\/ . Accessed 1 Dec 2011"},{"issue":"7","key":"345_CR33","doi-asserted-by":"crossref","first-page":"992","DOI":"10.1109\/TKDE.2007.190737","volume":"20","author":"T Palpanas","year":"2008","unstructured":"Palpanas T, Vlachos M, Keogh E, Gunopulos D (2008) Streaming time series summarization using user-defined amnesic functions. IEEE Trans Knowl Data Eng 20(7):992\u20131006","journal-title":"IEEE Trans Knowl Data Eng"},{"key":"345_CR34","doi-asserted-by":"crossref","unstructured":"Papadimitriou S, Gionis A, Tsaparas P, V\u00e4is\u00e4nen A, Mannila H, Faloutsos C (2005) Parameter-free spatial data mining using MDL. In: ICDM","DOI":"10.1109\/ICDM.2005.117"},{"key":"345_CR35","unstructured":"Pednault EPD (1989) Some experiments in applying inductive inference principles to surface reconstruction. In: IJCAI, pp 1603\u20131609"},{"key":"345_CR36","unstructured":"PHM Data Challenge Competition (2008). phmconf.orgjOCS\/index.php\/phm\/2008\/challenge"},{"key":"345_CR37","doi-asserted-by":"crossref","first-page":"29","DOI":"10.3189\/172756407782871684","volume":"47","author":"G Picard","year":"2007","unstructured":"Picard G, Fily M, Gallee H (2007) Surface melting derived from microwave radiometers: a climatic indicator in Antarctica. Ann Glaciol 47:29\u201334","journal-title":"Ann Glaciol"},{"key":"345_CR38","doi-asserted-by":"crossref","first-page":"677","DOI":"10.1111\/j.1365-2966.2006.10327.x","volume":"369","author":"P Protopapas","year":"2006","unstructured":"Protopapas P, Giammarco JM, Faccioli L, Struble MF, Dave R, Alcock C (2006) Finding outlier light-curves in catalogs of periodic variable stars. Monthly Not R Astron Soc 369:677\u2013696","journal-title":"Monthly Not R Astron Soc"},{"key":"345_CR39","unstructured":"Prognostics Center of Excellence, National Aeronautics and Space Administration (NASA) (2012). ti.arc.nasa.gov\/tech\/dash\/pcoe\/prognostic-data-repository\/. Accessed 7 Nov 2012"},{"key":"345_CR40","unstructured":"Project URL. www.cs.ucr.edu\/~bhu002\/MDL\/MDL.html . This URL contains all data and code used in this paper, as well as many additional experiments omitted for brevity"},{"issue":"2","key":"345_CR41","doi-asserted-by":"crossref","first-page":"371","DOI":"10.1007\/s10115-012-0508-7","volume":"33","author":"T Rakthanmanon","year":"2012","unstructured":"Rakthanmanon T, Keogh E, Lonardi S, Evans S (2012) MDL-based time series clustering. Knowl Inf Syst 33(2):371\u2013399","journal-title":"Knowl Inf Syst"},{"issue":"3","key":"345_CR42","doi-asserted-by":"crossref","first-page":"281","DOI":"10.1007\/s10994-008-5093-3","volume":"74","author":"U Rebbapragada","year":"2009","unstructured":"Rebbapragada U, Protopapas P, Brodley CE, Alcock CR (2009) Finding anomalous periodic time series. Mach Learn 74(3):281\u2013313","journal-title":"Mach Learn"},{"key":"345_CR43","volume-title":"Stochastic complexity in statistical inquiry","author":"J Rissanen","year":"1989","unstructured":"Rissanen J (1989) Stochastic complexity in statistical inquiry. World Scientific, Singapore"},{"key":"345_CR44","doi-asserted-by":"crossref","first-page":"315","DOI":"10.1109\/18.119689","volume":"38","author":"J Rissanen","year":"1992","unstructured":"Rissanen J, Speed T, Yu B (1992) Density estimation by stochastic complexity. IEEE Trans Inf Theory 38:315\u2013323","journal-title":"IEEE Trans Inf Theory"},{"key":"345_CR45","doi-asserted-by":"crossref","unstructured":"Salvador S, Chan P (2004) Determining the number of clusters\/segments in hierarchical clustering\/segmentation algorithms. In: International conference on tools with artificial intelligence, pp 576\u2013584","DOI":"10.1109\/ICTAI.2004.50"},{"key":"345_CR46","unstructured":"Sarle W (1999) Donoho\u2013Johnstone benchmarks: neural net results. ftp.sas.com\/pub\/neural\/dojo\/dojo.html"},{"key":"345_CR47","doi-asserted-by":"crossref","unstructured":"Sart D, Mueen A, Najjar W, Niennattrakul V, Keogh E (2010) Accelerating dynamic time warping subsequence search with GPUs and FPGAs. In: IEEE international conference on data mining, pp 1001\u20131006","DOI":"10.1109\/ICDM.2010.21"},{"key":"345_CR48","unstructured":"Signal to Noise Ratio. http:\/\/en.wikipedia.org\/wiki\/Signal-to-noise_ratio"},{"key":"345_CR49","unstructured":"US Environmental Protection Agency (2011) Climate Change Science. www.epa.gov\/climatechange\/science\/recenttc.html . Accessed 6 Dec 2011"},{"key":"345_CR50","doi-asserted-by":"crossref","unstructured":"Vachtsevanos G, Lewis FL, Roemer M, Hess A, Wu B (2006) Intelligent fault diagnosis and prognosis for engineering systems, 1st edn. Wiley, Hoboken","DOI":"10.1002\/9780470117842"},{"key":"345_CR51","doi-asserted-by":"crossref","unstructured":"Vahdatpour A, Sarrafzadeh M (2010) Unsupervised discovery of abnormal activity occurrences in multi-dimensional time series, with applications in wearable systems. In: SIAM international conference on data mining","DOI":"10.1137\/1.9781611972801.56"},{"key":"345_CR52","doi-asserted-by":"crossref","unstructured":"Vatauv R (2012) The impact of motion dimensionality and bit cardinality on the design of 3D gesture recognizers. Int J Hum\u2013Comput Stud 71(4):387\u2013409","DOI":"10.1016\/j.ijhcs.2012.11.005"},{"key":"345_CR53","unstructured":"vbFRET Toolbox (2012) www.vbFRET.sourceforge.net . Accessed 8 Nov 2012"},{"issue":"7","key":"345_CR54","doi-asserted-by":"crossref","first-page":"3438","DOI":"10.1109\/TIT.2010.2048491","volume":"56","author":"N Vereshchagin","year":"2010","unstructured":"Vereshchagin N, Vitanyi P (2010) Rate distortion and denoising of individual data using Kolmogorov complexity. IEEE Trans Inf Theory 56(7):3438\u20133454","journal-title":"IEEE Trans Inf Theory"},{"key":"345_CR55","doi-asserted-by":"crossref","unstructured":"Vespier U, Knobbe A, Nijssen S, Vanschoren J (2012) MDL-based analysis of time series at multiple time-scales. Lecture notes in computer science (LNCS), vol 7524. Springer, Berlin","DOI":"10.1007\/978-3-642-33486-3_24"},{"issue":"2","key":"345_CR56","doi-asserted-by":"crossref","first-page":"185","DOI":"10.1093\/comjnl\/11.2.185","volume":"11","author":"CS Wallace","year":"1968","unstructured":"Wallace CS, Boulton DM (1968) An information measure for classification. Comput J 11(2):185\u2013194","journal-title":"Comput J"},{"key":"345_CR57","unstructured":"Wang T, Lee J (2006) On performance evaluation of prognostics algorithms. In: Proceedings of MFPT, pp 219\u2013226"},{"key":"345_CR58","doi-asserted-by":"crossref","unstructured":"Wang T, Yu J, Siegel D, Lee J (2008) A similarity-based prognostics approach for remaining useful life estimation of engineered systems. In: International conference on prognostics and health management","DOI":"10.1109\/PHM.2008.4711421"},{"key":"345_CR59","volume-title":"Managing gigabytes compressing and indexing documents and images","author":"H Witten","year":"1999","unstructured":"Witten H, Moffat A, Bell TC (1999) Managing gigabytes compressing and indexing documents and images. Morgan Kaufmann, San Francisco"},{"issue":"2","key":"345_CR60","doi-asserted-by":"crossref","first-page":"241","DOI":"10.1007\/s10115-008-0131-9","volume":"17","author":"D Yankov","year":"2008","unstructured":"Yankov D, Keogh E, Rebbapragada U (2008) Disk aware discord discovery: finding unusual time series in terabyte sized datasets. Knowl Inf Syst 17(2):241\u2013262","journal-title":"Knowl Inf Syst"},{"key":"345_CR61","doi-asserted-by":"crossref","unstructured":"Zhao Q, Hautamaki V, Franti P (2008) Knee point detection in BIC for detecting the number of clusters. In: ACIVS, vol 5259, pp 664\u2013673","DOI":"10.1007\/978-3-540-88458-3_60"},{"key":"345_CR62","doi-asserted-by":"crossref","unstructured":"Zwally HJ, Gloersen P (1977) Passive microwave images of the polar regions and research applications. Polar Rec 18:431\u2013450","DOI":"10.1017\/S0032247400000930"}],"container-title":["Data Mining and Knowledge Discovery"],"original-title":[],"language":"en","link":[{"URL":"http:\/\/link.springer.com\/content\/pdf\/10.1007\/s10618-014-0345-2.pdf","content-type":"application\/pdf","content-version":"vor","intended-application":"text-mining"},{"URL":"http:\/\/link.springer.com\/article\/10.1007\/s10618-014-0345-2\/fulltext.html","content-type":"text\/html","content-version":"vor","intended-application":"text-mining"},{"URL":"http:\/\/link.springer.com\/content\/pdf\/10.1007\/s10618-014-0345-2","content-type":"unspecified","content-version":"vor","intended-application":"similarity-checking"}],"deposited":{"date-parts":[[2019,8,7]],"date-time":"2019-08-07T18:08:06Z","timestamp":1565201286000},"score":1,"resource":{"primary":{"URL":"http:\/\/link.springer.com\/10.1007\/s10618-014-0345-2"}},"subtitle":[],"short-title":[],"issued":{"date-parts":[[2014,2,15]]},"references-count":62,"journal-issue":{"issue":"2","published-print":{"date-parts":[[2015,3]]}},"alternative-id":["345"],"URL":"https:\/\/doi.org\/10.1007\/s10618-014-0345-2","relation":{},"ISSN":["1384-5810","1573-756X"],"issn-type":[{"value":"1384-5810","type":"print"},{"value":"1573-756X","type":"electronic"}],"subject":[],"published":{"date-parts":[[2014,2,15]]}}}