{"status":"ok","message-type":"work","message-version":"1.0.0","message":{"indexed":{"date-parts":[[2026,4,5]],"date-time":"2026-04-05T20:24:54Z","timestamp":1775420694459,"version":"3.50.1"},"reference-count":52,"publisher":"Springer Science and Business Media LLC","issue":"1","license":[{"start":{"date-parts":[[2018,12,1]],"date-time":"2018-12-01T00:00:00Z","timestamp":1543622400000},"content-version":"tdm","delay-in-days":0,"URL":"https:\/\/creativecommons.org\/licenses\/by\/4.0"}],"funder":[{"DOI":"10.13039\/501100007514","name":"Universit\u00e0 di Pisa","doi-asserted-by":"publisher","award":["PRA 2017"],"award-info":[{"award-number":["PRA 2017"]}],"id":[{"id":"10.13039\/501100007514","id-type":"DOI","asserted-by":"publisher"}]},{"DOI":"10.13039\/501100011033","name":"Agencia Estatal de Investigaci\u00f3n","doi-asserted-by":"publisher","award":["TIN2013-46638-C3-3-P"],"award-info":[{"award-number":["TIN2013-46638-C3-3-P"]}],"id":[{"id":"10.13039\/501100011033","id-type":"DOI","asserted-by":"publisher"}]},{"DOI":"10.13039\/501100008530","name":"European Regional Development Fund","doi-asserted-by":"publisher","award":["TIN2016-77902-C3-1-P"],"award-info":[{"award-number":["TIN2016-77902-C3-1-P"]}],"id":[{"id":"10.13039\/501100008530","id-type":"DOI","asserted-by":"publisher"}]},{"DOI":"10.13039\/501100003176","name":"Ministerio de Educaci\u00f3n, Cultura y Deporte","doi-asserted-by":"publisher","award":["FPU12\/05102"],"award-info":[{"award-number":["FPU12\/05102"]}],"id":[{"id":"10.13039\/501100003176","id-type":"DOI","asserted-by":"publisher"}]}],"content-domain":{"domain":["link.springer.com"],"crossmark-restriction":false},"short-container-title":["J Big Data"],"published-print":{"date-parts":[[2018,12]]},"DOI":"10.1186\/s40537-018-0159-y","type":"journal-article","created":{"date-parts":[[2018,12,12]],"date-time":"2018-12-12T07:01:10Z","timestamp":1544598070000},"update-policy":"https:\/\/doi.org\/10.1007\/springer_crossmark_policy","source":"Crossref","is-referenced-by-count":10,"title":["Building efficient fuzzy regression trees for large scale and high dimensional problems"],"prefix":"10.1186","volume":"5","author":[{"ORCID":"https:\/\/orcid.org\/0000-0001-7996-6104","authenticated-orcid":false,"given":"Javier","family":"C\u00f3zar","sequence":"first","affiliation":[]},{"given":"Francesco","family":"Marcelloni","sequence":"additional","affiliation":[]},{"given":"Jos\u00e9 A.","family":"G\u00e1mez","sequence":"additional","affiliation":[]},{"given":"Luis","family":"de la Ossa","sequence":"additional","affiliation":[]}],"member":"297","published-online":{"date-parts":[[2018,12,12]]},"reference":[{"key":"159_CR1","doi-asserted-by":"publisher","first-page":"285","DOI":"10.4137\/EBO.S40912","volume":"12","author":"N Arana-Daniel","year":"2016","unstructured":"Arana-Daniel N, Gallegos AA, L\u00f3pez-Franco C, Alan\u00eds AY, Morales J, L\u00f3pez-Franco A. Support vector machines trained with evolutionary algorithms employing kernel adatron for large scale classification of protein structures. Evol Bioinform. 2016;12:285\u2013302.","journal-title":"Evol Bioinform"},{"key":"159_CR2","doi-asserted-by":"crossref","unstructured":"Bacardit J, Krasnogor N. The icos psp benchmarks repository; 2008. http:\/\/ico2s.org\/datasets\/psp_benchmark.html . Accessed 3 Dec 2018.","DOI":"10.1145\/1527055.1527056"},{"issue":"1","key":"159_CR3","doi-asserted-by":"publisher","first-page":"73","DOI":"10.1016\/j.ins.2003.09.018","volume":"165","author":"F Berzal","year":"2004","unstructured":"Berzal F, Cubero JC, Mar\u0131n N, S\u00e1nchez D. Building multi-way decision trees with numerical attributes. Inf Sci. 2004;165(1):73\u201390.","journal-title":"Inf Sci"},{"issue":"1","key":"159_CR4","doi-asserted-by":"publisher","first-page":"5","DOI":"10.1023\/A:1010933404324","volume":"45","author":"L Breiman","year":"2001","unstructured":"Breiman L. Random forests. Mach Learn. 2001;45(1):5\u201332.","journal-title":"Mach Learn"},{"key":"159_CR5","volume-title":"Classification and regression trees","author":"L Breiman","year":"1984","unstructured":"Breiman L, Friedman JH, Olshen RA, Stone CJ. Classification and regression trees. Monterey: Wadsworth & Brooks; 1984."},{"issue":"3\u20134","key":"159_CR6","doi-asserted-by":"publisher","first-page":"163","DOI":"10.1016\/S0020-0255(96)00141-7","volume":"96","author":"HD Cheng","year":"1997","unstructured":"Cheng HD, Chen JR. Automatically determine the membership function based on the maximum entropy principle. Inf Sci. 1997;96(3\u20134):163\u201382.","journal-title":"Inf Sci"},{"key":"159_CR7","doi-asserted-by":"publisher","first-page":"57","DOI":"10.1016\/j.asoc.2014.03.003","volume":"21","author":"J C\u00f3zar","year":"2014","unstructured":"C\u00f3zar J, delaOssa L, G\u00e1mez JA. Learning tsk-0 linguistic fuzzy rules by means of local search algorithms. Appl Soft Comput. 2014;21:57\u201371.","journal-title":"Appl Soft Comput"},{"key":"159_CR8","doi-asserted-by":"crossref","unstructured":"C\u00f3zar J, delaOssa L, G\u00e1mez JA. Tsk-0 fuzzy rule-based systems for high-dimensional problems using the apriori principle for rule generation. In: Rough sets and current trends in computing, lecture notes in computer science, vol 8536. New York: Springer International Publishing; 2014. p. 270\u20139.","DOI":"10.1007\/978-3-319-08644-6_28"},{"issue":"1","key":"159_CR9","doi-asserted-by":"publisher","first-page":"107","DOI":"10.1145\/1327452.1327492","volume":"51","author":"J Dean","year":"2008","unstructured":"Dean J, Ghemawat S. Mapreduce: simplified data processing on large clusters. Commun ACM. 2008;51(1):107\u201313.","journal-title":"Commun ACM"},{"key":"159_CR10","volume-title":"Fuzzy sets in decision analysis, operations research and statistics","author":"R Slowi\u0144ski","year":"2012","unstructured":"Slowi\u0144ski R. Fuzzy sets in decision analysis, operations research and statistics, vol 1. US: Springer; 2012."},{"issue":"2","key":"159_CR11","doi-asserted-by":"publisher","first-page":"832","DOI":"10.1109\/TPWRS.2009.2016528","volume":"24","author":"R Diao","year":"2009","unstructured":"Diao R, Sun K, Vittal V, O\u2019Keefe RJ, Richardson MR, Bhatt N, Stradford D, Sarawgi SK. Decision tree-based online voltage security assessment using pmu measurements. IEEE Trans Power Syst. 2009;24(2):832\u20139.","journal-title":"IEEE Trans Power Syst"},{"issue":"1\u20133","key":"159_CR12","doi-asserted-by":"publisher","first-page":"15","DOI":"10.1016\/S0165-0114(83)80099-2","volume":"10","author":"D Dubois","year":"1983","unstructured":"Dubois D, Prade H. Unfair coins and necessity measures: towards a possibilistic interpretation of histograms. Fuzzy Sets and Systems. 1983;10(1\u20133):15\u201320.","journal-title":"Fuzzy Sets and Systems"},{"issue":"5","key":"159_CR13","doi-asserted-by":"publisher","first-page":"572","DOI":"10.1001\/jama.293.5.572","volume":"293","author":"GC Fonarow","year":"2005","unstructured":"Fonarow GC, Adams KF, Abraham WT, Yancy CW, Boscardin WJ, Committee ASA. Risk stratification for in-hospital mortality in acutely decompensated heart failure: classification and regression tree analysis. JAMA. 2005;293(5):572\u201380.","journal-title":"JAMA"},{"issue":"2","key":"159_CR14","doi-asserted-by":"publisher","first-page":"83","DOI":"10.1007\/BF02985802","volume":"27","author":"J Franklin","year":"2005","unstructured":"Franklin J. The elements of statistical learning: data mining, inference and prediction. Math Intell. 2005;27(2):83\u20135.","journal-title":"Math Intell"},{"issue":"4","key":"159_CR15","doi-asserted-by":"publisher","first-page":"734","DOI":"10.1109\/TKDE.2012.35","volume":"25","author":"S Garcia","year":"2013","unstructured":"Garcia S, Luengo J, S\u00e1ez JA, Lopez V, Herrera F. A survey of discretization techniques: taxonomy and empirical analysis in supervised learning. IEEE Trans Knowl Data Eng. 2013;25(4):734\u201350.","journal-title":"IEEE Trans Knowl Data Eng"},{"key":"159_CR16","volume-title":"The decision tree: taking control of your health in the new era of personalized medicine","author":"T Goetz","year":"2010","unstructured":"Goetz T. The decision tree: taking control of your health in the new era of personalized medicine. Emmaus: Rodale; 2010."},{"issue":"9","key":"159_CR17","doi-asserted-by":"publisher","first-page":"816","DOI":"10.1016\/j.spl.2010.01.015","volume":"80","author":"A Gupta","year":"2010","unstructured":"Gupta A, Mehrotra KG, Mohan C. A clustering-based discretization for supervised learning. Stat Probab Lett. 2010;80(9):816\u201324.","journal-title":"Stat Probab Lett"},{"key":"159_CR18","unstructured":"Haskell RE. Regression tree fuzzy systems. In: Proceedings of the ICSC symposium on soft computing, fuzzy logic, artificial neural networks and genetic algorithms, University of Reading, Whiteknights, Reading, England; 1996. p. 26\u20138."},{"key":"159_CR19","series-title":"Springer series in statistics","doi-asserted-by":"publisher","DOI":"10.1007\/978-0-387-21606-5","volume-title":"The elements of statistical learning: data mining, inference, and prediction","author":"T Hastie","year":"2001","unstructured":"Hastie T, Tibshirani R, Friedman J. The elements of statistical learning: data mining, inference, and prediction. Springer series in statistics, vol 10, 1st ed. New York: Springer; 2001.","edition":"1"},{"issue":"1","key":"159_CR20","doi-asserted-by":"publisher","first-page":"176","DOI":"10.1021\/ci000336s","volume":"41","author":"S Izrailev","year":"2001","unstructured":"Izrailev S, Agrafiotis D. A novel method for building regression tree models for qsar based on artificial ant colony systems. J Chem Inf Comput Sci. 2001;41(1):176\u201380.","journal-title":"J Chem Inf Comput Sci"},{"key":"159_CR21","doi-asserted-by":"publisher","first-page":"580","DOI":"10.1109\/TSMC.1985.6313426","volume":"4","author":"JM Keller","year":"1985","unstructured":"Keller JM, Gray MR, Givens JA. A fuzzy k-nearest neighbor algorithm. IEEE Trans Syst Man Cybern. 1985;4:580\u20135.","journal-title":"IEEE Trans Syst Man Cybern"},{"issue":"454","key":"159_CR22","doi-asserted-by":"publisher","first-page":"589","DOI":"10.1198\/016214501753168271","volume":"96","author":"H Kim","year":"2001","unstructured":"Kim H, Loh WY. Classification trees with unbiased multiway splits. J Am Stat Assoc. 2001;96(454):589\u2013604.","journal-title":"J Am Stat Assoc"},{"issue":"1","key":"159_CR23","first-page":"47","volume":"32","author":"S Kotsiantis","year":"2006","unstructured":"Kotsiantis S, Kanellopoulos D. Discretization techniques: a recent survey. GESTS Int Trans Comput Sci Eng. 2006;32(1):47\u201358.","journal-title":"GESTS Int Trans Comput Sci Eng"},{"key":"159_CR24","doi-asserted-by":"publisher","first-page":"267","DOI":"10.3354\/meps321267","volume":"321","author":"J Leathwick","year":"2006","unstructured":"Leathwick J, Elith J, Francis M, Hastie T, Taylor P. Variation in demersal fish species richness in the oceans surrounding new zealand: an analysis using boosted regression trees. Mar Ecol Prog Ser. 2006;321:267\u201381.","journal-title":"Mar Ecol Prog Ser"},{"key":"159_CR25","doi-asserted-by":"publisher","DOI":"10.1017\/CBO9781139924801","volume-title":"Mining of massive datasets","author":"J Leskovec","year":"2014","unstructured":"Leskovec J, Rajaraman A, Ullman JD. Mining of massive datasets. Cambridge: Cambridge University Press; 2014."},{"key":"159_CR26","doi-asserted-by":"publisher","DOI":"10.1017\/CBO9781139924801","volume-title":"Mining of massive datasets","author":"J Leskovec","year":"2014","unstructured":"Leskovec J, Rajaraman A, Ullman JD. Mining of massive datasets. Cambridge: Cambridge university press; 2014."},{"issue":"4","key":"159_CR27","doi-asserted-by":"publisher","first-page":"393","DOI":"10.1023\/A:1016304305535","volume":"6","author":"H Liu","year":"2002","unstructured":"Liu H, Hussain F, Tan CL, Dash M. Discretization: an enabling technique. Data Mining Knowl Discov. 2002;6(4):393\u2013423.","journal-title":"Data Mining Knowl Discov"},{"key":"159_CR28","doi-asserted-by":"crossref","unstructured":"Maciel AI, Costa IG, Lorena AC Measuring the complexity of regression problems. In: 2016 international joint conference on neural networks (IJCNN). New York: IEEE; 2016. p. 1450\u20137.","DOI":"10.1109\/IJCNN.2016.7727369"},{"issue":"3\u20134","key":"159_CR29","doi-asserted-by":"publisher","first-page":"391","DOI":"10.1016\/S0888-613X(98)10017-8","volume":"19","author":"S Medasani","year":"1998","unstructured":"Medasani S, Kim J, Krishnapuram R. An overview of membership function generation techniques for pattern recognition. Int J Approx Reason. 1998;19(3\u20134):391\u2013417.","journal-title":"Int J Approx Reason"},{"key":"159_CR30","unstructured":"Meng X. Mllib: Scalable machine learning on spark. In: Spark Workshop April; 2014."},{"key":"159_CR31","doi-asserted-by":"crossref","unstructured":"Mori H, Kosemura N, Ishiguro K, Kondo T. Short-term load forecasting with fuzzy regression tree in power systems. In: 2001 IEEE international conference on systems, man, and cybernetics, vol\u00a03. New York: IEEE; 2001. p. 1948\u201353.","DOI":"10.1109\/ICSMC.2001.973654"},{"key":"159_CR32","doi-asserted-by":"crossref","unstructured":"Nieradka G, Butkiewicz B. A method for automatic membership function estimation based on fuzzy measures. In: International fuzzy systems association world congress. Berlin: Springer; 2007. p. 451\u201360","DOI":"10.1007\/978-3-540-72950-1_45"},{"issue":"2","key":"159_CR33","doi-asserted-by":"publisher","first-page":"221","DOI":"10.1016\/S0165-0114(03)00089-7","volume":"138","author":"C Olaru","year":"2003","unstructured":"Olaru C, Wehenkel L. A complete fuzzy decision tree technique. Fuzzy Sets Syst. 2003;138(2):221\u201354.","journal-title":"Fuzzy Sets Syst"},{"issue":"1","key":"159_CR34","doi-asserted-by":"publisher","first-page":"21","DOI":"10.1016\/0165-0114(94)90003-5","volume":"64","author":"W Pedrycz","year":"1994","unstructured":"Pedrycz W. Why triangular membership functions? Fuzzy Sets Syst. 1994;64(1):21\u201330.","journal-title":"Fuzzy Sets Syst"},{"issue":"2","key":"159_CR35","doi-asserted-by":"publisher","first-page":"181","DOI":"10.1007\/s10021-005-0054-1","volume":"9","author":"AM Prasad","year":"2006","unstructured":"Prasad AM, Iverson LR, Liaw A. Newer classification and regression tree techniques: bagging and random forests for ecological prediction. Ecosystems. 2006;9(2):181\u201399.","journal-title":"Ecosystems"},{"key":"159_CR36","unstructured":"Quinlan RJ. Learning with continuous classes. In: 5th Australian joint conference on artificial intelligence. Singapore: World Scientific; 1992. p. 343\u20138."},{"key":"159_CR37","doi-asserted-by":"publisher","first-page":"35","DOI":"10.2307\/2531894","volume":"44","author":"MR Segal","year":"1988","unstructured":"Segal MR. Regression trees for censored data. Biometrics. 1988;44:35\u201347.","journal-title":"Biometrics"},{"issue":"1","key":"159_CR38","doi-asserted-by":"publisher","first-page":"174","DOI":"10.1109\/TFUZZ.2016.2646746","volume":"26","author":"A Segatori","year":"2018","unstructured":"Segatori A, Marcelloni F, Pedrycz W. On distributed fuzzy decision trees for big data. IEEE Trans Fuzzy Syst. 2018;26(1):174\u201392.","journal-title":"IEEE Trans Fuzzy Syst"},{"issue":"12","key":"159_CR39","doi-asserted-by":"publisher","first-page":"1297","DOI":"10.1109\/34.817409","volume":"21","author":"A Su\u00e1rez","year":"1999","unstructured":"Su\u00e1rez A, Lutsko JF. Globally optimal fuzzy decision trees for classification and regression. IEEE Trans Pattern Anal Mach Intell. 1999;21(12):1297\u2013311.","journal-title":"IEEE Trans Pattern Anal Mach Intell"},{"key":"159_CR40","unstructured":"Tang K, Li X, Suganthan PN, Yang Z, Weise T. Benchmark functions for the cec2010 special session and competition on large-scale global optimization. Tech. rep. nature inspired computation and applications laboratory; 2009."},{"key":"159_CR41","unstructured":"Wager S Asymptotic theory for random forests. arXiv preprint; 2014. arXiv:14050352 ."},{"key":"159_CR42","unstructured":"Ward JS, Barker A. Undefined by data: a survey of big data definitions. arXiv preprint; 2013. arXiv:13095821 ."},{"key":"159_CR43","unstructured":"Weber R. Fuzzy-id3: a class of methods for automatic knowledge acquisition. In: Proceedings of the 2nd international conference on fuzzy logic and neural networks; 1992."},{"issue":"4","key":"159_CR44","doi-asserted-by":"publisher","first-page":"383","DOI":"10.1016\/S0958-1669(98)80012-8","volume":"9","author":"DR Westhead","year":"1998","unstructured":"Westhead DR, Thornton JM. Protein structure prediction. Curr Opin Biotechnol. 1998;9(4):383\u20139.","journal-title":"Curr Opin Biotechnol"},{"key":"159_CR45","volume-title":"Hadoop: the definitive guide","author":"T White","year":"2012","unstructured":"White T. Hadoop: the definitive guide. Sebastopol: O\u2019Reilly Media, Inc.; 2012."},{"issue":"6","key":"159_CR46","doi-asserted-by":"publisher","first-page":"80","DOI":"10.2307\/3001968","volume":"1","author":"F Wilcoxon","year":"1945","unstructured":"Wilcoxon F. Individual comparisons by ranking methods. Biometrics Bull. 1945;1(6):80\u20133.","journal-title":"Biometrics Bull"},{"issue":"2","key":"159_CR47","doi-asserted-by":"publisher","first-page":"125","DOI":"10.1016\/0165-0114(94)00229-Z","volume":"69","author":"Y Yuan","year":"1995","unstructured":"Yuan Y, Shaw MJ. Induction of fuzzy decision trees. Fuzzy Sets Syst. 1995;69(2):125\u201339.","journal-title":"Fuzzy Sets Syst"},{"key":"159_CR48","unstructured":"Zaharia M. Apache Spark MLlib; 2009. http:\/\/spark.apache.org\/mllib\/ . Accessed 26 Sept 2017."},{"issue":"10\u201310","key":"159_CR49","first-page":"95","volume":"10","author":"M Zaharia","year":"2010","unstructured":"Zaharia M, Chowdhury M, Franklin MJ, Shenker S, Stoica I. Spark: cluster computing with working sets. HotCloud. 2010;10(10\u201310):95.","journal-title":"HotCloud"},{"key":"159_CR50","doi-asserted-by":"publisher","first-page":"715","DOI":"10.1016\/j.ins.2014.03.087","volume":"278","author":"M Zeinalkhani","year":"2014","unstructured":"Zeinalkhani M, Eftekhari M. Fuzzy partitioning of continuous attributes through discretization methods to construct fuzzy decision tree classifiers. Inf Sci. 2014;278:715\u201335.","journal-title":"Inf Sci"},{"issue":"4","key":"159_CR51","doi-asserted-by":"publisher","first-page":"1029","DOI":"10.1073\/pnas.0407152101","volume":"102","author":"Y Zhang","year":"2005","unstructured":"Zhang Y, Skolnick J. The protein structure prediction problem could be solved using the current pdb library. Proc Natl Acad Sci. 2005;102(4):1029\u201334.","journal-title":"Proc Natl Acad Sci"},{"key":"159_CR52","doi-asserted-by":"crossref","unstructured":"Zheng Y, Liu L, Wang L, Xie X. Learning transportation mode from raw gps data for geographic applications on the web. In: Proceedings of the 17th international conference on World Wide Web, New York: ACM; 2008. p. 247\u201356.","DOI":"10.1145\/1367497.1367532"}],"container-title":["Journal of Big Data"],"original-title":[],"language":"en","link":[{"URL":"http:\/\/link.springer.com\/content\/pdf\/10.1186\/s40537-018-0159-y.pdf","content-type":"application\/pdf","content-version":"vor","intended-application":"text-mining"},{"URL":"http:\/\/link.springer.com\/article\/10.1186\/s40537-018-0159-y\/fulltext.html","content-type":"text\/html","content-version":"vor","intended-application":"text-mining"},{"URL":"http:\/\/link.springer.com\/content\/pdf\/10.1186\/s40537-018-0159-y.pdf","content-type":"application\/pdf","content-version":"vor","intended-application":"similarity-checking"}],"deposited":{"date-parts":[[2026,4,4]],"date-time":"2026-04-04T11:47:10Z","timestamp":1775303230000},"score":1,"resource":{"primary":{"URL":"https:\/\/journalofbigdata.springeropen.com\/articles\/10.1186\/s40537-018-0159-y"}},"subtitle":[],"short-title":[],"issued":{"date-parts":[[2018,12]]},"references-count":52,"journal-issue":{"issue":"1","published-print":{"date-parts":[[2018,12]]}},"alternative-id":["159"],"URL":"https:\/\/doi.org\/10.1186\/s40537-018-0159-y","relation":{},"ISSN":["2196-1115"],"issn-type":[{"value":"2196-1115","type":"electronic"}],"subject":[],"published":{"date-parts":[[2018,12]]},"assertion":[{"value":"22 August 2018","order":1,"name":"received","label":"Received","group":{"name":"ArticleHistory","label":"Article History"}},{"value":"29 November 2018","order":2,"name":"accepted","label":"Accepted","group":{"name":"ArticleHistory","label":"Article History"}},{"value":"12 December 2018","order":3,"name":"first_online","label":"First Online","group":{"name":"ArticleHistory","label":"Article History"}}],"article-number":"49"}}