{"status":"ok","message-type":"work","message-version":"1.0.0","message":{"indexed":{"date-parts":[[2025,2,21]],"date-time":"2025-02-21T07:39:38Z","timestamp":1740123578896,"version":"3.37.3"},"reference-count":15,"publisher":"Springer Science and Business Media LLC","issue":"2","license":[{"start":{"date-parts":[[2012,12,5]],"date-time":"2012-12-05T00:00:00Z","timestamp":1354665600000},"content-version":"tdm","delay-in-days":0,"URL":"http:\/\/www.springer.com\/tdm"}],"content-domain":{"domain":[],"crossmark-restriction":false},"short-container-title":["Artif Intell Rev"],"published-print":{"date-parts":[[2015,2]]},"DOI":"10.1007\/s10462-012-9374-7","type":"journal-article","created":{"date-parts":[[2012,12,4]],"date-time":"2012-12-04T14:45:48Z","timestamp":1354632348000},"page":"301-310","source":"Crossref","is-referenced-by-count":3,"title":["The number of classes as a source for instability of decision tree algorithms in high dimensional datasets"],"prefix":"10.1007","volume":"43","author":[{"given":"Jos\u00e9 Augusto","family":"Baranauskas","sequence":"first","affiliation":[]}],"member":"297","published-online":{"date-parts":[[2012,12,5]]},"reference":[{"issue":"1","key":"9374_CR1","doi-asserted-by":"crossref","first-page":"20","DOI":"10.1145\/1007730.1007735","volume":"6","author":"GEAPA Batista","year":"2004","unstructured":"Batista GEAPA, Prati RC, Monard MC (2004) A study of the behavior of several methods for balancing machine learning training data. SIGKDD Explor Newsl 6(1):20\u201329","journal-title":"SIGKDD Explor Newsl"},{"key":"9374_CR2","first-page":"499","volume":"2","author":"O Bousquet","year":"2002","unstructured":"Bousquet O, Elisseeff A (2002) Stability and generalization. J Mach Learn Res 2:499\u2013526","journal-title":"J Mach Learn Res"},{"issue":"6","key":"9374_CR3","doi-asserted-by":"crossref","first-page":"2350","DOI":"10.1214\/aos\/1032181158","volume":"24","author":"L Breiman","year":"1996","unstructured":"Breiman L (1996a) Heuristics of instability and stabilization in model selection. Ann Stat 24(6):2350\u20132383","journal-title":"Ann Stat"},{"key":"9374_CR4","doi-asserted-by":"crossref","unstructured":"Breiman L (1996b) Technical note: some properties of splitting criteria. Mach Learn 24(1):41\u201347. doi: 10.1023\/A:1018094028462","DOI":"10.1023\/A:1018094028462"},{"key":"9374_CR5","volume-title":"Classification and regression tress","author":"L Breiman","year":"1984","unstructured":"Breiman L, Friedman J, Olshen R, Stone C (1984) Classification and regression tress. Wadsworth & Books, Pacific Grove, CA"},{"key":"9374_CR6","doi-asserted-by":"crossref","DOI":"10.1145\/312129.312220","volume-title":"MetaCost: a general method for making classifiers cost-sensitive","author":"P Domingos","year":"1999","unstructured":"Domingos P (1999) MetaCost: a general method for making classifiers cost-sensitive. ACM, San Diego, CA"},{"issue":"4","key":"9374_CR7","doi-asserted-by":"crossref","first-page":"269","DOI":"10.1016\/j.jbi.2004.07.007","volume":"37","author":"D Gamberger","year":"2004","unstructured":"Gamberger D, Lavra\u010d N, Zelezn\u00fd F, Tolar J (2004) Induction of comprehensible models for gene expression datasets by subgroup discovery methodology. J Biomed Inform 37(4):269\u2013284","journal-title":"J Biomed Inform"},{"key":"9374_CR8","doi-asserted-by":"crossref","unstructured":"Li RH, Belford GG (2002) Instability of decision tree classification algorithms. In: Proceedings of the eighth ACM SIGKDD international conference on knowledge discovery and data mining, pp 570\u2013575. ACM, New York, NY, USA, KDD \u201902. doi: 10.1145\/775047.775131 . http:\/\/doi.acm.org\/10.1145\/775047.775131","DOI":"10.1145\/775047.775131"},{"key":"9374_CR9","unstructured":"Perez PS, Baranauskas JA (2011) Analysis of decision tree pruning using windowing in medical datasets with different class distributions. In: Proceedings of the ECML PKDD workshop on knowledge discovery in health care and medicine (European conference on machine learning and principles and practice of knowledge discovery in databases), pp 28\u201339. Athens, Greece, ECML PKDD KD-HCM 2011. http:\/\/www.cs.gmu.edu\/~hrangwal\/kd-hcm\/proc\/papers\/3-Perez-Baranauskas.pdf"},{"key":"9374_CR10","doi-asserted-by":"crossref","unstructured":"Polo JL, Berzal F, Cubero JC (2008) Class-oriented reduction of decision tree complexity. In: Proceedings of the 17th international conference on foundations of intelligent systems, pp 48\u201357. Springer, Berlin, Heidelberg, ISMIS\u201908. http:\/\/portal.acm.org\/citation.cfm?id=1786474.1786481","DOI":"10.1007\/978-3-540-68123-6_5"},{"key":"9374_CR11","volume-title":"C4.5: programs for machine learning","author":"JR Quinlan","year":"1993","unstructured":"Quinlan JR (1993) C4.5: programs for machine learning. Morgan Kaufmann, San Francisco, CA"},{"issue":"4","key":"9374_CR12","doi-asserted-by":"crossref","first-page":"462","DOI":"10.1038\/nbt1392","volume":"26","author":"N Rosenfeld","year":"2008","unstructured":"Rosenfeld N, Aharonov R, Meiri E, Rosenwald S, Spector Y, Zepeniuk M, Benjamin H, Shabes N, Tabak S, Levy A et al (2008) Micrornas accurately identify cancer tissue origin. Nat Biotechnol 26(4):462\u2013469","journal-title":"Nat Biotechnol"},{"key":"9374_CR13","doi-asserted-by":"crossref","unstructured":"Souto M, Bittencourt V, Costa J (2006) An empirical analysis of under-sampling techniques to balance a protein structural class dataset. In: King I, Wang J, Chan L, Wang D (eds) Neural information processing, Lecture notes in computer science, vol 4234, pp 21\u201329. Springer, Berlin. http:\/\/dx.doi.org\/10.1007\/11893295_3","DOI":"10.1007\/11893295_3"},{"key":"9374_CR14","doi-asserted-by":"crossref","first-page":"315","DOI":"10.1613\/jair.1199","volume":"19","author":"GM Weiss","year":"2003","unstructured":"Weiss GM, Provost F (2003) Learning when training data are costly: the effect of class distribution on tree induction. J Artif Intell Res 19:315\u2013354","journal-title":"J Artif Intell Res"},{"key":"9374_CR15","volume-title":"Text mining: predictive methods for analyzing unstructured information","author":"SM Weiss","year":"2004","unstructured":"Weiss SM, Indurkhya N, Zhang T, Damerau F (2004) Text mining: predictive methods for analyzing unstructured information. Springer, Berlin"}],"container-title":["Artificial Intelligence Review"],"original-title":[],"language":"en","link":[{"URL":"http:\/\/link.springer.com\/content\/pdf\/10.1007\/s10462-012-9374-7.pdf","content-type":"application\/pdf","content-version":"vor","intended-application":"text-mining"},{"URL":"http:\/\/link.springer.com\/article\/10.1007\/s10462-012-9374-7\/fulltext.html","content-type":"text\/html","content-version":"vor","intended-application":"text-mining"},{"URL":"http:\/\/link.springer.com\/content\/pdf\/10.1007\/s10462-012-9374-7","content-type":"unspecified","content-version":"vor","intended-application":"similarity-checking"}],"deposited":{"date-parts":[[2019,7,6]],"date-time":"2019-07-06T11:45:47Z","timestamp":1562413547000},"score":1,"resource":{"primary":{"URL":"http:\/\/link.springer.com\/10.1007\/s10462-012-9374-7"}},"subtitle":[],"short-title":[],"issued":{"date-parts":[[2012,12,5]]},"references-count":15,"journal-issue":{"issue":"2","published-print":{"date-parts":[[2015,2]]}},"alternative-id":["9374"],"URL":"https:\/\/doi.org\/10.1007\/s10462-012-9374-7","relation":{},"ISSN":["0269-2821","1573-7462"],"issn-type":[{"type":"print","value":"0269-2821"},{"type":"electronic","value":"1573-7462"}],"subject":[],"published":{"date-parts":[[2012,12,5]]}}}