{"status":"ok","message-type":"work","message-version":"1.0.0","message":{"indexed":{"date-parts":[[2026,1,27]],"date-time":"2026-01-27T23:16:40Z","timestamp":1769555800256,"version":"3.49.0"},"reference-count":85,"publisher":"Springer Science and Business Media LLC","issue":"4","license":[{"start":{"date-parts":[[2021,5,13]],"date-time":"2021-05-13T00:00:00Z","timestamp":1620864000000},"content-version":"tdm","delay-in-days":0,"URL":"https:\/\/www.springernature.com\/gp\/researchers\/text-and-data-mining"},{"start":{"date-parts":[[2021,5,13]],"date-time":"2021-05-13T00:00:00Z","timestamp":1620864000000},"content-version":"vor","delay-in-days":0,"URL":"https:\/\/www.springernature.com\/gp\/researchers\/text-and-data-mining"}],"funder":[{"DOI":"10.13039\/501100003593","name":"Conselho Nacional de Desenvolvimento Cient\u00edfico e Tecnol\u00f3gico","doi-asserted-by":"publisher","award":["156956\/2018-7"],"award-info":[{"award-number":["156956\/2018-7"]}],"id":[{"id":"10.13039\/501100003593","id-type":"DOI","asserted-by":"publisher"}]},{"DOI":"10.13039\/501100004612","name":"Funda\u00e7\u00e3o Arauc\u00e1ria","doi-asserted-by":"publisher","id":[{"id":"10.13039\/501100004612","id-type":"DOI","asserted-by":"publisher"}]},{"DOI":"10.13039\/501100002322","name":"Coordena\u00e7\u00e3o de Aperfei\u00e7oamento de Pessoal de N\u00edvel Superior","doi-asserted-by":"publisher","id":[{"id":"10.13039\/501100002322","id-type":"DOI","asserted-by":"publisher"}]},{"DOI":"10.13039\/501100003593","name":"Conselho Nacional de Desenvolvimento Cient\u00edfico e Tecnol\u00f3gico","doi-asserted-by":"publisher","id":[{"id":"10.13039\/501100003593","id-type":"DOI","asserted-by":"publisher"}]}],"content-domain":{"domain":["link.springer.com"],"crossmark-restriction":false},"short-container-title":["Data Min Knowl Disc"],"published-print":{"date-parts":[[2021,7]]},"DOI":"10.1007\/s10618-021-00762-8","type":"journal-article","created":{"date-parts":[[2021,5,13]],"date-time":"2021-05-13T18:03:00Z","timestamp":1620928980000},"page":"1564-1621","update-policy":"https:\/\/doi.org\/10.1007\/springer_crossmark_policy","source":"Crossref","is-referenced-by-count":10,"title":["Handling imbalance in hierarchical classification problems using local classifiers approaches"],"prefix":"10.1007","volume":"35","author":[{"ORCID":"https:\/\/orcid.org\/0000-0003-1272-5378","authenticated-orcid":false,"given":"Rodolfo M.","family":"Pereira","sequence":"first","affiliation":[]},{"given":"Yandre M. G.","family":"Costa","sequence":"additional","affiliation":[]},{"suffix":"Jr.","given":"Carlos N.","family":"Silla","sequence":"additional","affiliation":[]}],"member":"297","published-online":{"date-parts":[[2021,5,13]]},"reference":[{"key":"762_CR1","doi-asserted-by":"crossref","unstructured":"Ariyaratne HB, Zhang D (2012) A novel automatic hierachical approach to music genre classification. In: Proceedings of the IEEE international conference on multimedia and expo workshops, pp 564\u2013569","DOI":"10.1109\/ICMEW.2012.104"},{"key":"762_CR2","doi-asserted-by":"crossref","unstructured":"Bader-El-Den M, Teitei E, Perry T (2018) Biased random forest for dealing with the class imbalance problem. IEEE Trans Neural Netw Learn Syst","DOI":"10.1109\/TNNLS.2018.2878400"},{"key":"762_CR3","doi-asserted-by":"crossref","unstructured":"Bannour H, Hudelot C (2012) Hierarchical image annotation using semantic hierarchies. In: Proceedings of the 21st ACM international conference on Information and knowledge management, pp 2431\u20132434","DOI":"10.1145\/2396761.2398659"},{"issue":"1","key":"762_CR4","doi-asserted-by":"publisher","first-page":"20","DOI":"10.1145\/1007730.1007735","volume":"6","author":"G Batista","year":"2004","unstructured":"Batista G, Prati R, Monard M (2004) A study of the behavior of several methods for balancing machine learning training data. ACM SIGKDD Explor Newsl 6(1):20\u201329","journal-title":"ACM SIGKDD Explor Newsl"},{"issue":"1","key":"762_CR5","doi-asserted-by":"crossref","first-page":"289","DOI":"10.1111\/j.2517-6161.1995.tb02031.x","volume":"57","author":"Y Benjamini","year":"1995","unstructured":"Benjamini Y, Hochberg Y (1995) Controlling the false discovery rate: a practical and powerful approach to multiple testing. J R Stat Soc Ser B (Methodol) 57(1):289\u2013300","journal-title":"J R Stat Soc Ser B (Methodol)"},{"key":"762_CR6","doi-asserted-by":"crossref","unstructured":"Bennett PN, Nguyen N (2009) Refined experts: improving classification in large taxonomies. In: Proceedings of the 32nd international ACM SIGIR conference on Research and development in information retrieval, pp 11\u201318","DOI":"10.1145\/1571941.1571946"},{"key":"762_CR7","first-page":"281","volume":"13","author":"J Bergstra","year":"2012","unstructured":"Bergstra J, Bengio Y (2012) Random search for hyper-parameter optimization. J Mach Learn Res 13:281\u2013305","journal-title":"J Mach Learn Res"},{"key":"762_CR8","doi-asserted-by":"crossref","unstructured":"Bunkhumpornpat C, Sinapiromsaran K, Lursinsap C (2009) Safe-level-smote: safe-level-synthetic minority oversampling technique for handling the class imbalanced problem. In: Pacific-Asia conference on knowledge discovery and data mining, Bangkok, Thailand, pp 475\u2013482","DOI":"10.1007\/978-3-642-01307-2_43"},{"key":"762_CR9","doi-asserted-by":"publisher","first-page":"32","DOI":"10.1016\/j.patrec.2018.01.003","volume":"103","author":"FJ Castellanos","year":"2018","unstructured":"Castellanos FJ, Valero-Mas JJ, Calvo-Zaragoza J, Rico-Juan JR (2018) Oversampling imbalanced data in the string space. Pattern Recogn Lett 103:32\u201338","journal-title":"Pattern Recogn Lett"},{"key":"762_CR10","unstructured":"Cesa-Bianchi N, Valentini G (2009) Hierarchical cost-sensitive algorithms for genome-wide gene function prediction. In: Machine learning in systems biology, pp 14\u201329"},{"issue":"1\u20132","key":"762_CR11","doi-asserted-by":"publisher","first-page":"209","DOI":"10.1007\/s10994-011-5271-6","volume":"88","author":"N Cesa-Bianchi","year":"2012","unstructured":"Cesa-Bianchi N, Re M, Valentini G (2012) Synergy of multi-label hierarchical ensembles, data fusion, and cost-sensitive methods for gene functional inference. Mach Learn 88(1\u20132):209\u2013241","journal-title":"Mach Learn"},{"key":"762_CR12","doi-asserted-by":"crossref","unstructured":"Charte F, Rivera A, del Jesus MJ, Herrera F (2013) A first approach to deal with imbalance in multi-label datasets. In: Proceedings of the international conference on hybrid artificial intelligence systems, pp 150\u2013160","DOI":"10.1007\/978-3-642-40846-5_16"},{"key":"762_CR13","doi-asserted-by":"crossref","unstructured":"Charte F, Rivas AJR, del Jesus M, Herrera F (2014) MLeNN: a first approach to heuristic multilabel undersampling. In: Proceedings of the international conference on intelligent data engineering and automated learning, pp 1\u20139","DOI":"10.1007\/978-3-319-10840-7_1"},{"key":"762_CR14","doi-asserted-by":"crossref","unstructured":"Charte F, Rivera A, del Jesus M, Herrera F (2015a) Addressing imbalance in multilabel classification: measures and random resampling algorithms. J Neurocomputing 163:3\u201316","DOI":"10.1016\/j.neucom.2014.08.091"},{"key":"762_CR15","doi-asserted-by":"crossref","unstructured":"Charte F, Rivera A, del Jesus M, Herrera F (2015b) MLSMOTE: approaching imbalanced multilabel learning through synthetic instance generation. Knowl Based Syst 89:385\u2013397","DOI":"10.1016\/j.knosys.2015.07.019"},{"key":"762_CR16","doi-asserted-by":"crossref","unstructured":"Charuvaka A, Rangwala H (2015) Hiercost: improving large scale hierarchical classification with cost sensitive learning. In: Joint European conference on machine learning and knowledge discovery in databases. Springer, pp 675\u2013690","DOI":"10.1007\/978-3-319-23528-8_42"},{"key":"762_CR17","doi-asserted-by":"publisher","first-page":"321","DOI":"10.1613\/jair.953","volume":"16","author":"N Chawla","year":"2002","unstructured":"Chawla N, Bowyer K, Hall L, Kegelmeyer P (2002) Smote: synthetic minority over-sampling technique. J Artif Intell Res 16:321\u2013357","journal-title":"J Artif Intell Res"},{"key":"762_CR18","doi-asserted-by":"crossref","unstructured":"Chen B, Hu J (2010) Hierarchical multi-label classification incorporating prior information for gene function prediction. In: 2010 10th International conference on intelligent systems design and applications. IEEE, pp 231\u2013236","DOI":"10.1109\/ISDA.2010.5687261"},{"issue":"2","key":"762_CR19","doi-asserted-by":"publisher","first-page":"183","DOI":"10.1002\/tee.21714","volume":"7","author":"B Chen","year":"2012","unstructured":"Chen B, Hu J (2012) Hierarchical multi-label classification based on over-sampling and hierarchy constraint for gene function prediction. IEEJ Trans Electr Electron Eng 7(2):183\u2013189","journal-title":"IEEJ Trans Electr Electron Eng"},{"key":"762_CR20","doi-asserted-by":"crossref","unstructured":"Chen B, Duan L, Hu J (2012) Composite kernel based SVM for hierarchical multi-label gene function classification. In: Proceedings of the international joint conference on neural networks (IJCNN). IEEE, pp 1\u20136","DOI":"10.1109\/IJCNN.2012.6252555"},{"issue":"1","key":"762_CR21","doi-asserted-by":"publisher","first-page":"136","DOI":"10.1007\/s10618-011-0222-1","volume":"24","author":"DA Cieslak","year":"2012","unstructured":"Cieslak DA, Hoens TR, Chawla NV, Kegelmeyer WP (2012) Hellinger distance decision trees are robust and skew-insensitive. Data Min Knowl Disc 24(1):136\u2013158","journal-title":"Data Min Knowl Disc"},{"issue":"11","key":"762_CR22","doi-asserted-by":"publisher","first-page":"1651","DOI":"10.1007\/s10994-018-5739-8","volume":"107","author":"JG Colonna","year":"2018","unstructured":"Colonna JG, Gama J, Nakamura EF (2018) A comparison of hierarchical multi-output recognition approaches for anuran classification. Mach Learn 107(11):1651\u20131671","journal-title":"Mach Learn"},{"key":"762_CR23","unstructured":"Defferrard M, Benzi K, Vandergheynst P, Bresson X (2017) FMA: A dataset for music analysis. In: Proceedings of the international society for music information retrieval conference, Suzhou, China, pp 316\u2013323"},{"issue":"5","key":"762_CR24","doi-asserted-by":"publisher","first-page":"638","DOI":"10.1109\/TKDE.2008.187","volume":"21","author":"C Diamantini","year":"2009","unstructured":"Diamantini C, Potena D (2009) Bayes vector quantizer for class-imbalance problem. IEEE Trans Knowl Data Eng 21(5):638\u2013651","journal-title":"IEEE Trans Knowl Data Eng"},{"issue":"10","key":"762_CR25","doi-asserted-by":"publisher","first-page":"2436","DOI":"10.1016\/j.patcog.2011.03.026","volume":"44","author":"I Dimitrovski","year":"2011","unstructured":"Dimitrovski I, Kocev D, Loskovska S, Dzeroski S (2011) Hierarchical annotation of medical images. Pattern Recogn 44(10):2436\u20132449","journal-title":"Pattern Recogn"},{"key":"762_CR26","doi-asserted-by":"crossref","unstructured":"Dumais S, Chen H (2000) Hierarchical classification of web content. In: Proceedings of the 23rd annual international ACM SIGIR conference on Research and development in information retrieval, pp 256\u2013263","DOI":"10.1145\/345508.345593"},{"issue":"293","key":"762_CR27","doi-asserted-by":"publisher","first-page":"52","DOI":"10.1080\/01621459.1961.10482090","volume":"56","author":"OJ Dunn","year":"1961","unstructured":"Dunn OJ (1961) Multiple comparisons among means. J Am Stat Assoc 56(293):52\u201364","journal-title":"J Am Stat Assoc"},{"key":"762_CR28","unstructured":"Fagni T, Sebastiani F (2007) On the selection of negative examples for hierarchical text categorization. In: Proceedings of the language & technology conference, pp 24\u201328"},{"key":"762_CR29","doi-asserted-by":"publisher","first-page":"97","DOI":"10.1016\/j.knosys.2013.01.018","volume":"42","author":"A Fern\u00e1ndez","year":"2013","unstructured":"Fern\u00e1ndez A, L\u00f3Pez V, Galar M, Del Jesus MJ, Herrera F (2013) Analysing the classification of imbalanced data-sets with multiple classes: binarization techniques and ad-hoc approaches. Knowl Based Syst 42:97\u2013110","journal-title":"Knowl Based Syst"},{"issue":"1","key":"762_CR30","doi-asserted-by":"publisher","first-page":"22","DOI":"10.1016\/j.knosys.2011.05.002","volume":"25","author":"N Garc\u00eda-Pedrajas","year":"2012","unstructured":"Garc\u00eda-Pedrajas N, P\u00e9rez-Rodr\u00edguez J, Garc\u00eda-Pedrajas M, Ortiz-Boyer D, Fyfe C (2012) Class imbalance methods for translation initiation site recognition in DNA sequences. Knowl Based Syst 25(1):22\u201334","journal-title":"Knowl Based Syst"},{"issue":"3","key":"762_CR31","doi-asserted-by":"publisher","first-page":"1","DOI":"10.1145\/2629585","volume":"9","author":"S Gopal","year":"2015","unstructured":"Gopal S, Yang Y (2015) Hierarchical Bayesian inference and recursive regularization for large-scale classification. ACM Trans Knowl Discov Data 9(3):1\u201323","journal-title":"ACM Trans Knowl Discov Data"},{"key":"762_CR32","doi-asserted-by":"crossref","unstructured":"Ha-Thuc V, Renders JM (2011) Large-scale hierarchical text classification without labelled data. In: Proceedings of the fourth ACM international conference on Web search and data mining, pp 685\u2013694","DOI":"10.1145\/1935826.1935919"},{"key":"762_CR33","doi-asserted-by":"publisher","first-page":"220","DOI":"10.1016\/j.eswa.2016.12.035","volume":"73","author":"G Haixiang","year":"2017","unstructured":"Haixiang G, Yijing L, Shang J, Mingyun G, Yuanyue H, Bing G (2017) Learning from class-imbalanced data: review of methods and applications. Expert Syst Appl 73:220\u2013239","journal-title":"Expert Syst Appl"},{"key":"762_CR34","doi-asserted-by":"crossref","unstructured":"Han H, Wang WY, Mao BH (2005) Borderline-smote: a new oversampling method in imbalanced datasets learning. In: International conference on intelligent computing. Hefei, China, pp 878\u2013887","DOI":"10.1007\/11538059_91"},{"issue":"3","key":"762_CR35","doi-asserted-by":"publisher","first-page":"515","DOI":"10.1109\/TIT.1968.1054155","volume":"14","author":"P Hart","year":"1968","unstructured":"Hart P (1968) The condensed nearest neighbor rule (corresp.). IEEE Trans Inf Theory 14(3):515\u2013516","journal-title":"IEEE Trans Inf Theory"},{"issue":"1","key":"762_CR36","first-page":"507","volume":"11","author":"T Hastie","year":"1998","unstructured":"Hastie T, Tibshirani R (1998) Classification by pairwise coupling. Adv Neural Inf Process Syst 11(1):507\u2013513","journal-title":"Adv Neural Inf Process Syst"},{"key":"762_CR37","unstructured":"He H, Bai Y, Garcia EA, Li S (2008) Adasyn: Adaptive synthetic sampling approach for imbalanced learning. In: IEEE international joint conference neural networks, Hong Kong, pp 1322\u20131328"},{"issue":"5","key":"762_CR38","doi-asserted-by":"publisher","first-page":"429","DOI":"10.3233\/IDA-2002-6504","volume":"6","author":"N Japkowicz","year":"2002","unstructured":"Japkowicz N, Stephen S (2002) The class imbalance problem: a systematic study. Intell Data Anal 6(5):429\u2013449","journal-title":"Intell Data Anal"},{"key":"762_CR39","doi-asserted-by":"crossref","unstructured":"Jeni LA, Cohn JF, De\u00a0La\u00a0Torre F (2013) Facing imbalanced data: recommendations for the use of performance metrics. In: Proceedings of the humaine association conference on affective computing and intelligent interaction, pp 245\u2013251","DOI":"10.1109\/ACII.2013.47"},{"issue":"1","key":"762_CR40","doi-asserted-by":"publisher","first-page":"157","DOI":"10.1093\/biostatistics\/kxh026","volume":"6","author":"SH Jung","year":"2005","unstructured":"Jung SH, Bang H, Young S (2005) Sample size calculation for multiple testing in microarray data analysis. Biostatistics 6(1):157\u2013169","journal-title":"Biostatistics"},{"key":"762_CR41","unstructured":"Kiritchenko S, Matwin S, Famili F (2005) Functional annotation of genes using hierarchical text categorization. In: Proceedings of the ACL workshop on linking biological literature, Detroit, USA"},{"issue":"3","key":"762_CR42","doi-asserted-by":"publisher","first-page":"817","DOI":"10.1016\/j.patcog.2012.09.023","volume":"46","author":"D Kocev","year":"2013","unstructured":"Kocev D, Vens C, Struyf J, D\u017eeroski S (2013) Tree ensembles for predicting structured outputs. Pattern Recogn 46(3):817\u2013833","journal-title":"Pattern Recogn"},{"issue":"4","key":"762_CR43","doi-asserted-by":"publisher","first-page":"221","DOI":"10.1007\/s13748-016-0094-0","volume":"5","author":"B Krawczyk","year":"2016","unstructured":"Krawczyk B (2016) Learning from imbalanced data: open challenges and future directions. Prog Artif Intell 5(4):221\u2013232","journal-title":"Prog Artif Intell"},{"key":"762_CR44","unstructured":"Kumar S, Rowley HA, Wang X, Rodrigues JJM (2015) Hierarchical classification in credit card data extraction. US Patent 9,213,907"},{"issue":"2","key":"762_CR45","doi-asserted-by":"publisher","first-page":"79","DOI":"10.2174\/157016461302160514000940","volume":"13","author":"D Li","year":"2016","unstructured":"Li D, Ju Y, Zou Q (2016) Protein folds prediction with hierarchical structured SVM. Curr Proteom 13(2):79\u201385","journal-title":"Curr Proteom"},{"key":"762_CR46","unstructured":"Mani I, Zhang I (2003) knn approach to unbalanced data distributions: a case study involving information extraction. In: Proceedings of workshop on learning from imbalanced datasets, Washington DC, USA, vol 126"},{"key":"762_CR47","doi-asserted-by":"publisher","first-page":"35","DOI":"10.1016\/j.asw.2014.09.002","volume":"23","author":"DS McNamara","year":"2015","unstructured":"McNamara DS, Crossley SA, Roscoe RD, Allen LK, Dai J (2015) A hierarchical classification approach to automated essay scoring. Assess Writ 23:35\u201359","journal-title":"Assess Writ"},{"key":"762_CR48","doi-asserted-by":"publisher","first-page":"36671","DOI":"10.1038\/srep36671","volume":"6","author":"B Mieth","year":"2016","unstructured":"Mieth B, Kloft M, Rodr\u00edguez JA, Sonnenburg S, Vobruba R, Morcillo-Su\u00e1rez C, Farr\u00e9 X, Marigorta UM, Fehr E, Dickhaus T (2016) Combining multiple hypothesis testing with machine learning increases the statistical power of genome-wide association studies. Sci Rep 6:36671","journal-title":"Sci Rep"},{"issue":"3","key":"762_CR49","first-page":"69","volume":"24","author":"MM Mukaka","year":"2012","unstructured":"Mukaka MM (2012) A guide to appropriate use of correlation coefficient in medical research. Malawi Med J 24(3):69\u201371","journal-title":"Malawi Med J"},{"issue":"3","key":"762_CR50","doi-asserted-by":"publisher","first-page":"27","DOI":"10.1145\/2911172.2911182","volume":"2","author":"A Naik","year":"2016","unstructured":"Naik A, Rangwala H (2016) Large-scale hierarchical classification with rare categories and inconsistencies. AI Matters 2(3):27\u201329","journal-title":"AI Matters"},{"key":"762_CR51","doi-asserted-by":"publisher","DOI":"10.1007\/978-3-030-01620-3","volume-title":"Large scale hierarchical classification: state of the art","author":"A Naik","year":"2018","unstructured":"Naik A, Rangwala H (2018) Large scale hierarchical classification: state of the art. Springer, Berlin"},{"issue":"1","key":"762_CR52","doi-asserted-by":"publisher","first-page":"141","DOI":"10.1007\/s10844-018-0509-4","volume":"52","author":"A Naik","year":"2019","unstructured":"Naik A, Rangwala H (2019) Improving large-scale hierarchical classification by rewiring: a data-driven filter based approach. J Intell Inf Syst 52(1):141\u2013164","journal-title":"J Intell Inf Syst"},{"issue":"1","key":"762_CR53","doi-asserted-by":"publisher","first-page":"485","DOI":"10.1186\/s12859-019-3060-6","volume":"20","author":"FK Nakano","year":"2019","unstructured":"Nakano FK, Lietaert M, Vens C (2019) Machine learning for discovering missing or wrong protein function annotations. BMC Bioinform 20(1):485","journal-title":"BMC Bioinform"},{"key":"762_CR54","doi-asserted-by":"crossref","unstructured":"Napiera\u0142a K, Stefanowski J, Wilk S (2010) Learning from imbalanced data in presence of noisy and borderline examples. International conference on rough sets and current trends in computing, Warsaw, Poland, pp 158\u2013167","DOI":"10.1007\/978-3-642-13529-3_18"},{"issue":"1","key":"762_CR55","doi-asserted-by":"publisher","first-page":"449","DOI":"10.1186\/s12859-017-1854-y","volume":"18","author":"M Notaro","year":"2017","unstructured":"Notaro M, Schubach M, Robinson PN, Valentini G (2017) Prediction of human phenotype ontology terms by means of hierarchical ensemble methods. BMC Bioinform 18(1):449","journal-title":"BMC Bioinform"},{"issue":"1","key":"762_CR56","doi-asserted-by":"publisher","first-page":"S6","DOI":"10.1186\/gb-2008-9-s1-s6","volume":"9","author":"G Obozinski","year":"2008","unstructured":"Obozinski G, Lanckriet G, Grant C, Jordan MI, Noble WS (2008) Consistent probabilistic outputs for protein function prediction. Genome Biol 9(1):S6","journal-title":"Genome Biol"},{"issue":"3","key":"762_CR57","first-page":"394","volume":"3","author":"BC Paes","year":"2012","unstructured":"Paes BC, Plastino A, Freitas AA (2012) Improving local per level hierarchical classification. J Inf Data Manag 3(3):394\u2013394","journal-title":"J Inf Data Manag"},{"key":"762_CR58","doi-asserted-by":"crossref","unstructured":"Partalas I, Kosmopoulos A, Baskiotis N, Arti\u00e8res T, Paliouras G, Gaussier \u00c9, Androutsopoulos I, Amini M, Gallinari P (2015) LSHTC: a benchmark for large-scale text classification. CoRR abs\/1503.08581","DOI":"10.1145\/2556195.2556208"},{"key":"762_CR59","unstructured":"Pereira RM, da\u00a0Costa YMG, Silla\u00a0Jr CN (2018) Dealing with imbalanceness in hierarchical multi-label datasets using multi-label resampling techniques. In: IEEE 30th international conference on tools with artificial intelligence (ICTAI), pp 818\u2013824"},{"key":"762_CR60","doi-asserted-by":"publisher","first-page":"95","DOI":"10.1016\/j.neucom.2019.11.076","volume":"383","author":"RM Pereira","year":"2020","unstructured":"Pereira RM, Costa YM, Silla CN Jr (2020) MLTL: a multi-label approach for the Tomek link undersampling algorithm. Neurocomputing 383:95\u2013105","journal-title":"Neurocomputing"},{"key":"762_CR61","first-page":"101","volume":"5","author":"R Rifkin","year":"2004","unstructured":"Rifkin R, Klautau A (2004) In defense of one-vs-all classification. J Mach Learn Res 5:101\u2013141","journal-title":"J Mach Learn Res"},{"key":"762_CR62","doi-asserted-by":"publisher","first-page":"179","DOI":"10.1016\/j.neucom.2018.01.060","volume":"286","author":"A Roy","year":"2018","unstructured":"Roy A, Cruz RMO, Sabourin R, Cavalcanti GDC (2018) A study on combining dynamic selection and data preprocessing for imbalance learning. Neurocomputing 286:179\u2013192","journal-title":"Neurocomputing"},{"issue":"18","key":"762_CR63","doi-asserted-by":"publisher","first-page":"5539","DOI":"10.1093\/nar\/gkh894","volume":"32","author":"A Ruepp","year":"2004","unstructured":"Ruepp A, Zollner A, Maier D, Albermann K, Hani J, Mokrejs M, Tetko I, G\u00fcldener U, Mannhaupt G, M\u00fcnsterk\u00f6tter M et al (2004) The FunCat, a functional annotation scheme for systematic classification of proteins from whole genomes. Nucleic Acids Res 32(18):5539\u20135545","journal-title":"Nucleic Acids Res"},{"issue":"1","key":"762_CR64","doi-asserted-by":"publisher","first-page":"064960","DOI":"10.1155\/2007\/64960","volume":"2007","author":"JG Sarnal Barbedo","year":"2006","unstructured":"Sarnal Barbedo JG, Lopes A (2006) Automatic genre classification of musical signals. EURASIP J Adv Signal Process 2007(1):064960","journal-title":"EURASIP J Adv Signal Process"},{"issue":"1","key":"762_CR65","doi-asserted-by":"publisher","first-page":"1","DOI":"10.1186\/1471-2105-11-2","volume":"11","author":"L Schietgat","year":"2010","unstructured":"Schietgat L, Vens C, Struyf J, Blockeel H, Kocev D, D\u017eeroski S (2010) Predicting gene function using hierarchical multi-label decision tree ensembles. BMC Bioinform 11(1):1\u201314","journal-title":"BMC Bioinform"},{"key":"762_CR66","doi-asserted-by":"crossref","unstructured":"Silla CN Jr, Freitas AA (2009) Novel top-down approaches for hierarchical classification and their application to automatic music genre classification. In: 2009 IEEE international conference on systems, man and cybernetics. IEEE, pp 3499\u20133504","DOI":"10.1109\/ICSMC.2009.5346776"},{"issue":"1\u20132","key":"762_CR67","doi-asserted-by":"publisher","first-page":"31","DOI":"10.1007\/s10618-010-0175-9","volume":"22","author":"CN Silla Jr","year":"2011","unstructured":"Silla CN Jr, Freitas AA (2011) A survey of hierarchical classification across different application domains. Data Min Knowl Disc 22(1\u20132):31\u201372","journal-title":"Data Min Knowl Disc"},{"issue":"1","key":"762_CR68","doi-asserted-by":"publisher","first-page":"21","DOI":"10.26555\/ijain.v4i1.146","volume":"4","author":"OS Sitompul","year":"2018","unstructured":"Sitompul OS, Nababan EB et al (2018) Biased support vector machine and weighted-smote in handling class imbalance problem. Int J Adv Intell Inform 4(1):21\u201327","journal-title":"Int J Adv Intell Inform"},{"key":"762_CR69","doi-asserted-by":"crossref","unstructured":"Sokolova M, Japkowicz N, Szpakowicz S (2006) Beyond accuracy, F-score and ROC: a family of discriminant measures for performance evaluation. In: Proceedings of the Australasian joint conference on artificial intelligence, pp 1015\u20131021","DOI":"10.1007\/11941439_114"},{"key":"762_CR70","doi-asserted-by":"publisher","first-page":"107146","DOI":"10.1016\/j.patcog.2019.107146","volume":"100","author":"R Soleymani","year":"2020","unstructured":"Soleymani R, Granger E, Fumera G (2020) F-measure curves: a tool to visualize classifier performance under imbalance. Pattern Recogn 100:107146","journal-title":"Pattern Recogn"},{"key":"762_CR71","doi-asserted-by":"crossref","unstructured":"Song Y, Roth D (2014) On dataless hierarchical text classification. In: Twenty-eighth AAAI conference on artificial intelligence","DOI":"10.1609\/aaai.v28i1.8938"},{"key":"762_CR72","doi-asserted-by":"crossref","unstructured":"Stefanowski J, Wilk S (2008) Selective pre-processing of imbalanced data for improving classification performance. In: International conference on data warehousing and knowledge discovery, Italy, Turin, pp 283\u2013292","DOI":"10.1007\/978-3-540-85836-2_27"},{"key":"762_CR73","doi-asserted-by":"publisher","first-page":"216","DOI":"10.1016\/j.ins.2018.09.001","volume":"471","author":"RA Stein","year":"2019","unstructured":"Stein RA, Jaques PA, Valiati JF (2019) An analysis of hierarchical text classification using word embeddings. Inf Sci 471:216\u2013232","journal-title":"Inf Sci"},{"issue":"12","key":"762_CR74","doi-asserted-by":"publisher","first-page":"3358","DOI":"10.1016\/j.patcog.2007.04.009","volume":"40","author":"Y Sun","year":"2007","unstructured":"Sun Y, Kamel MS, Wong AK, Wang Y (2007) Cost-sensitive boosting for classification of imbalanced data. Pattern Recogn 40(12):3358\u20133378","journal-title":"Pattern Recogn"},{"key":"762_CR75","first-page":"3","volume":"1","author":"B Szalkai","year":"2018","unstructured":"Szalkai B, Grolmusz V, Hancock J (2018) Seclaf: a webserver and deep neural network design tool for hierarchical biological sequence classification. Bioinformatics 1:3","journal-title":"Bioinformatics"},{"key":"762_CR76","doi-asserted-by":"publisher","first-page":"12360","DOI":"10.1109\/ACCESS.2019.2892120","volume":"7","author":"H Tang","year":"2019","unstructured":"Tang H, Wang Y, Tang S, Chu D, Li C (2019) A randomized clustering forest approach for efficient prediction of protein functions. IEEE Access 7:12360\u201312372","journal-title":"IEEE Access"},{"issue":"6","key":"762_CR77","first-page":"448","volume":"6","author":"I Tomek","year":"1976","unstructured":"Tomek I (1976) An experiment with the edited nearest-neighbor rule. IEEE Trans Syst Man Cybern 6(6):448\u2013452","journal-title":"IEEE Trans Syst Man Cybern"},{"key":"762_CR78","doi-asserted-by":"crossref","unstructured":"Tsoumakas G, Vlahavas I (2007) Random k-labelsets: an ensemble method for multilabel classification. In: European conference on machine learning. Springer, pp 406\u2013417","DOI":"10.1007\/978-3-540-74958-5_38"},{"issue":"2","key":"762_CR79","doi-asserted-by":"publisher","first-page":"185","DOI":"10.1007\/s10994-008-5077-3","volume":"73","author":"C Vens","year":"2008","unstructured":"Vens C, Struyf J, Schietgat L, D\u017eeroski S, Blockeel H (2008) Decision trees for hierarchical multi-label classification. Mach Learn 73(2):185","journal-title":"Mach Learn"},{"issue":"4","key":"762_CR80","doi-asserted-by":"publisher","first-page":"1119","DOI":"10.1109\/TSMCB.2012.2187280","volume":"42","author":"S Wang","year":"2012","unstructured":"Wang S, Yao X (2012) Multiclass imbalance problems: analysis and potential solutions. IEEE Trans Syst Man Cybern Part B (Cybern) 42(4):1119\u20131130","journal-title":"IEEE Trans Syst Man Cybern Part B (Cybern)"},{"key":"762_CR81","first-page":"5533","volume":"33","author":"C Xu","year":"2019","unstructured":"Xu C, Geng X (2019) Hierarchical classification based on label distribution learning. Proc AAAI Conf Artif Intell 33:5533\u20135540","journal-title":"Proc AAAI Conf Artif Intell"},{"issue":"3","key":"762_CR82","doi-asserted-by":"publisher","first-page":"5718","DOI":"10.1016\/j.eswa.2008.06.108","volume":"36","author":"SJ Yen","year":"2009","unstructured":"Yen SJ, Lee YS (2009) Cluster-based under-sampling approaches for imbalanced data distributions. Expert Syst Appl 36(3):5718\u20135727","journal-title":"Expert Syst Appl"},{"key":"762_CR83","doi-asserted-by":"publisher","first-page":"192","DOI":"10.1016\/j.asoc.2018.04.049","volume":"69","author":"L Yu","year":"2018","unstructured":"Yu L, Zhou R, Tang L, Chen R (2018) A DBN-based resampling SVM ensemble learning paradigm for credit classification with imbalanced data. Appl Soft Comput 69:192\u2013202","journal-title":"Appl Soft Comput"},{"issue":"3","key":"762_CR84","doi-asserted-by":"publisher","first-page":"321","DOI":"10.1007\/s10115-007-0079-1","volume":"15","author":"H Zhao","year":"2008","unstructured":"Zhao H (2008) Instance weighting versus threshold adjusting for cost-sensitive classification. Knowl Inf Syst 15(3):321\u2013334","journal-title":"Knowl Inf Syst"},{"issue":"3","key":"762_CR85","doi-asserted-by":"publisher","first-page":"232","DOI":"10.1111\/j.1467-8640.2010.00358.x","volume":"26","author":"ZH Zhou","year":"2010","unstructured":"Zhou ZH, Liu XY (2010) On multi-class cost-sensitive learning. Comput Intell 26(3):232\u2013257","journal-title":"Comput Intell"}],"container-title":["Data Mining and Knowledge Discovery"],"original-title":[],"language":"en","link":[{"URL":"https:\/\/link.springer.com\/content\/pdf\/10.1007\/s10618-021-00762-8.pdf","content-type":"application\/pdf","content-version":"vor","intended-application":"text-mining"},{"URL":"https:\/\/link.springer.com\/article\/10.1007\/s10618-021-00762-8\/fulltext.html","content-type":"text\/html","content-version":"vor","intended-application":"text-mining"},{"URL":"https:\/\/link.springer.com\/content\/pdf\/10.1007\/s10618-021-00762-8.pdf","content-type":"application\/pdf","content-version":"vor","intended-application":"similarity-checking"}],"deposited":{"date-parts":[[2024,8,30]],"date-time":"2024-08-30T20:58:48Z","timestamp":1725051528000},"score":1,"resource":{"primary":{"URL":"https:\/\/link.springer.com\/10.1007\/s10618-021-00762-8"}},"subtitle":[],"short-title":[],"issued":{"date-parts":[[2021,5,13]]},"references-count":85,"journal-issue":{"issue":"4","published-print":{"date-parts":[[2021,7]]}},"alternative-id":["762"],"URL":"https:\/\/doi.org\/10.1007\/s10618-021-00762-8","relation":{},"ISSN":["1384-5810","1573-756X"],"issn-type":[{"value":"1384-5810","type":"print"},{"value":"1573-756X","type":"electronic"}],"subject":[],"published":{"date-parts":[[2021,5,13]]},"assertion":[{"value":"30 August 2019","order":1,"name":"received","label":"Received","group":{"name":"ArticleHistory","label":"Article History"}},{"value":"4 May 2021","order":2,"name":"accepted","label":"Accepted","group":{"name":"ArticleHistory","label":"Article History"}},{"value":"13 May 2021","order":3,"name":"first_online","label":"First Online","group":{"name":"ArticleHistory","label":"Article History"}}]}}