{"status":"ok","message-type":"work","message-version":"1.0.0","message":{"indexed":{"date-parts":[[2025,2,21]],"date-time":"2025-02-21T07:24:45Z","timestamp":1740122685383,"version":"3.37.3"},"reference-count":33,"publisher":"Springer Science and Business Media LLC","issue":"1","license":[{"start":{"date-parts":[[2024,11,29]],"date-time":"2024-11-29T00:00:00Z","timestamp":1732838400000},"content-version":"tdm","delay-in-days":0,"URL":"https:\/\/www.springernature.com\/gp\/researchers\/text-and-data-mining"},{"start":{"date-parts":[[2024,11,29]],"date-time":"2024-11-29T00:00:00Z","timestamp":1732838400000},"content-version":"vor","delay-in-days":0,"URL":"https:\/\/www.springernature.com\/gp\/researchers\/text-and-data-mining"}],"funder":[{"DOI":"10.13039\/501100001809","name":"National Natural Science Foundation of China","doi-asserted-by":"publisher","award":["62136002","61876027"],"award-info":[{"award-number":["62136002","61876027"]}],"id":[{"id":"10.13039\/501100001809","id-type":"DOI","asserted-by":"publisher"}]}],"content-domain":{"domain":["link.springer.com"],"crossmark-restriction":false},"short-container-title":["Appl Intell"],"published-print":{"date-parts":[[2025,1]]},"DOI":"10.1007\/s10489-024-05961-6","type":"journal-article","created":{"date-parts":[[2024,11,29]],"date-time":"2024-11-29T00:52:54Z","timestamp":1732841574000},"update-policy":"https:\/\/doi.org\/10.1007\/springer_crossmark_policy","source":"Crossref","is-referenced-by-count":0,"title":["Ensemble microbial classification based on space partitioning and data augmentation"],"prefix":"10.1007","volume":"55","author":[{"given":"Liu-Ying","family":"Wen","sequence":"first","affiliation":[]},{"given":"Zhu","family":"Chen","sequence":"additional","affiliation":[]},{"given":"Fan","family":"Min","sequence":"additional","affiliation":[]}],"member":"297","published-online":{"date-parts":[[2024,11,29]]},"reference":[{"key":"5961_CR1","doi-asserted-by":"publisher","first-page":"1","DOI":"10.1007\/978-3-642-22993-0_1","volume":"2011","author":"A Andoni","year":"2011","unstructured":"Andoni A (2011) Nearest neighbor search in high-dimensional spaces. Math Found Comput 2011:1\u20131. https:\/\/doi.org\/10.1007\/978-3-642-22993-0_1","journal-title":"Math Found Comput"},{"key":"5961_CR2","doi-asserted-by":"publisher","first-page":"101644","DOI":"10.1016\/j.jocs.2022.101644","volume":"61","author":"B Anthony","year":"2021","unstructured":"Anthony B, Nabil A, Bastien C (2021) Toward informed partitioning for load balancing: A proof-of-concept. J Comput Sci 61:101644. https:\/\/doi.org\/10.1016\/j.jocs.2022.101644","journal-title":"J Comput Sci"},{"key":"5961_CR3","doi-asserted-by":"publisher","first-page":"821861","DOI":"10.3389\/fbinf.2022.821861","volume":"2","author":"G Armstrong","year":"2022","unstructured":"Armstrong G, Rahman G, Martino C, McDonald D, Gonzalez A, Mishne G, Knight R (2022) Applications and comparison of dimensionality reduction methods for microbiome data. Front Bioinform 2:821861. https:\/\/doi.org\/10.3389\/fbinf.2022.821861","journal-title":"Front Bioinform"},{"issue":"2","key":"5961_CR4","doi-asserted-by":"publisher","first-page":"405","DOI":"10.1109\/TKDE.2012.232","volume":"26","author":"S Barua","year":"2014","unstructured":"Barua S, Islam MM, Yao X, Murase K (2014) Mwmote-majority weighted minority oversampling technique for imbalanced data set learning. IEEE Trans Knowl Data Eng 26(2):405\u201342. https:\/\/doi.org\/10.1109\/TKDE.2012.232","journal-title":"IEEE Trans Knowl Data Eng"},{"key":"5961_CR5","unstructured":"Bernhardsson E, et\u00a0al. (2018) Annoy (approximate nearest neighbors oh yeah). https:\/\/github.com\/spotify\/annoy"},{"key":"5961_CR6","doi-asserted-by":"publisher","first-page":"321","DOI":"10.1613\/jair.953","volume":"16","author":"NV Chawla","year":"2002","unstructured":"Chawla NV, Bowyer KW, Hall LO, Kegelmeyer WP (2002) Smote: synthetic minority over-sampling technique. J Artif Intell Res 16:321\u201335. https:\/\/doi.org\/10.1613\/jair.953","journal-title":"J Artif Intell Res"},{"issue":"10","key":"5961_CR7","doi-asserted-by":"publisher","first-page":"1624","DOI":"10.1109\/TNN.2010.2066988","volume":"21","author":"S Chen","year":"2010","unstructured":"Chen S, He H, Garcia EA (2010) Ramoboost: Ranked minority oversampling in boosting. IEEE Trans Neural Netw 21(10):1624\u20131642. https:\/\/doi.org\/10.1109\/TNN.2010.2066988","journal-title":"IEEE Trans Neural Netw"},{"key":"5961_CR8","doi-asserted-by":"publisher","first-page":"109","DOI":"10.1016\/j.inffus.2023.02.013","volume":"95","author":"ZL Chen","year":"2023","unstructured":"Chen ZL, Fu LL, Yao J, Guo WZ, Plant C, Wang SP (2023) Learnable graph convolutional network and feature fusion for multi-view learning. Inform Fusion 95:109\u201311. https:\/\/doi.org\/10.1016\/j.inffus.2023.02.013","journal-title":"Inform Fusion"},{"issue":"1","key":"5961_CR9","doi-asserted-by":"publisher","first-page":"185","DOI":"10.1109\/TSMCA.2009.2029559","volume":"40","author":"S Chris","year":"2010","unstructured":"Chris S, Taghi MK, Jason VH, Amri N (2010) Rusboost: A hybrid approach to alleviating class imbalance. IEEE Trans Syst Man Cybern Syst Hum 40(1):185\u2013197. https:\/\/doi.org\/10.1109\/TSMCA.2009.2029559","journal-title":"IEEE Trans Syst Man Cybern Syst Hum"},{"issue":"1","key":"5961_CR10","doi-asserted-by":"publisher","first-page":"1","DOI":"10.1186\/s40168-022-01439-0","volume":"10","author":"T Dang","year":"2022","unstructured":"Dang T, Kumaishi K, Usui E, Kobori S, Sato T, Toda Y, Yamasaki Y, Tsujimoto H, Ichihashi Y, Iwata H (2022) Stochastic variational variable selection for high-dimensional microbiome data. Microbiome 10(1):1\u201318. https:\/\/doi.org\/10.1186\/s40168-022-01439-0","journal-title":"Microbiome"},{"issue":"8","key":"5961_CR11","doi-asserted-by":"publisher","first-page":"2147","DOI":"10.1007\/s00203-020-01931-x","volume":"202","author":"E Dekaboruah","year":"2020","unstructured":"Dekaboruah E, Suryavanshi MV, Chettri D, Verma AK (2020) Human microbiome: an academic update on human body site specific surveillance and its possible role. Arch Microbiol 202(8):2147\u20132167. https:\/\/doi.org\/10.1007\/s00203-020-01931-x","journal-title":"Arch Microbiol"},{"issue":"8","key":"5961_CR12","doi-asserted-by":"publisher","first-page":"e023777","DOI":"10.1371\/journal.pone.0237779","volume":"15","author":"M Dong","year":"2020","unstructured":"Dong M, Li Lh, Chen M, Kusalik A, Xu W (2020) Predictive analysis methods for human microbiome data with application to parkinson\u2019s disease. PLoS ONE 15(8):e023777. https:\/\/doi.org\/10.1371\/journal.pone.0237779","journal-title":"PLoS ONE"},{"issue":"5","key":"5961_CR13","doi-asserted-by":"publisher","first-page":"1189","DOI":"10.1214\/aos\/1013203451","volume":"29","author":"JH Friedman","year":"2001","unstructured":"Friedman JH (2001) Greedy function approximation: a gradient boosting machine. Ann Stat 29(5):1189\u2013123. https:\/\/doi.org\/10.1214\/aos\/1013203451","journal-title":"Ann Stat"},{"key":"5961_CR14","doi-asserted-by":"publisher","first-page":"1","DOI":"10.1016\/j.ins.2018.06.056","volume":"465","author":"D Georgios","year":"2018","unstructured":"Georgios D, Fernando B, Felix L (2018) Improving imbalanced learning through a heuristic oversampling method based on k-means and smote. Inf Sci 465:1\u20132. https:\/\/doi.org\/10.1016\/j.ins.2018.06.056","journal-title":"Inf Sci"},{"key":"5961_CR15","doi-asserted-by":"publisher","unstructured":"Han H, Wang WY, Mao BH (2005) Borderline-smote: A new over-sampling method in imbalanced data sets learning. In: Advances in Knowledge Discovery and Data Mining, pp 878\u201388https:\/\/doi.org\/10.1007\/11538059_91","DOI":"10.1007\/11538059_91"},{"issue":"18","key":"5961_CR16","doi-asserted-by":"publisher","first-page":"6097","DOI":"10.1007\/s00500-018-3261-3","volume":"23","author":"GL He","year":"2019","unstructured":"He GL, Zhao W, Xia XW, Peng R, Wu XY (2019) An ensemble of shapelet-based classifiers on inter-class and intra-class imbalanced multivariate time series at the early stage. Soft Comput 23(18):6097\u2013611. https:\/\/doi.org\/10.1007\/s00500-018-3261-3","journal-title":"Soft Comput"},{"key":"5961_CR17","doi-asserted-by":"publisher","unstructured":"He HB, Bai Y, Edwardo\u00a0A G, Li ST (2008) Adasyn: Adaptive synthetic sampling approach for imbalanced learning. In: 2008 IEEE International Joint Conference on Neural Networks (IEEE World Congress on Computational Intelligence). pp 1322\u2013132. https:\/\/doi.org\/10.1109\/IJCNN.2008.4633969","DOI":"10.1109\/IJCNN.2008.4633969"},{"issue":"11","key":"5961_CR18","doi-asserted-by":"publisher","first-page":"1270","DOI":"10.1038\/s41592-021-01302-4","volume":"18","author":"JM Johnson","year":"2021","unstructured":"Johnson JM, Khoshgoftaar TM (2021) The class imbalance problem. Nat Methods 18(11):1270\u2013127. https:\/\/doi.org\/10.1038\/s41592-021-01302-4","journal-title":"Nat Methods"},{"key":"5961_CR19","doi-asserted-by":"publisher","unstructured":"Khushi M, Shaukat K, Talha Alam M, Hameed IA, Uddin S, Luo SH, Yang XY, Reyes MC (2021) A comparative performance analysis of data resampling methods on imbalance medical data. IEEE Access 9:109960\u2013109975. https:\/\/doi.org\/10.1109\/ACCESS.2021.3102399","DOI":"10.1109\/ACCESS.2021.3102399"},{"issue":"1","key":"5961_CR20","doi-asserted-by":"publisher","first-page":"180","DOI":"10.13344\/j.microbiol.china.200346","volume":"48","author":"Q Li","year":"2021","unstructured":"Li Q, Yang Y, Wu ZD, Ding T (2021) Review of gut microbiome analysis prediction models and algorithms. Microbiol China 48(1):180\u2013196. https:\/\/doi.org\/10.13344\/j.microbiol.china.200346","journal-title":"Microbiol China"},{"key":"5961_CR21","doi-asserted-by":"publisher","first-page":"17","DOI":"10.1016\/j.ins.2017.05.008","volume":"409\u2013410","author":"WC Lin","year":"2017","unstructured":"Lin WC, Tsai CF, Hu YH, Jhang JS (2017) Clustering-based undersampling in class-imbalanced data. Inf Sci 409\u2013410:17\u201326. https:\/\/doi.org\/10.1016\/j.ins.2017.05.008","journal-title":"Inf Sci"},{"issue":"2","key":"5961_CR22","doi-asserted-by":"publisher","first-page":"539","DOI":"10.1109\/TSMCB.2008.2007853","volume":"39","author":"XY Liu","year":"2009","unstructured":"Liu XY, Wu JX, Zhou ZH (2009) Exploratory undersampling for class-imbalance learning. IEEE Trans Syst Man Cybern B Cybern 39(2):539\u201355. https:\/\/doi.org\/10.1109\/TSMCB.2008.2007853","journal-title":"IEEE Trans Syst Man Cybern B Cybern"},{"key":"5961_CR23","doi-asserted-by":"publisher","unstructured":"Liu ZN, Cao W, Gao ZF, Bian J, Chen HC, Chang Y, Liu TY (2020) Self-paced ensemble for highly imbalanced massive data classification. In: 2020 IEEE 36th International Conference on Data Engineering (ICDE). pp 841\u2013852. https:\/\/doi.org\/10.1109\/ICDE48307.2020.00078","DOI":"10.1109\/ICDE48307.2020.00078"},{"key":"5961_CR24","doi-asserted-by":"publisher","unstructured":"M NM (2002) Clustering large data sets. In: Soft computing approach to pattern recognition and image processing. pp 41\u20136. https:\/\/doi.org\/10.1142\/9789812776235_0003","DOI":"10.1142\/9789812776235_0003"},{"key":"5961_CR25","doi-asserted-by":"publisher","unstructured":"Mohammed R, Rawashdeh J, Abdullah M (2020) Machine learning with oversampling and undersampling techniques: Overview study and experimental results. In: 2020 11th International Conference on Information and Communication Systems (ICICS). pp 243\u20132. https:\/\/doi.org\/10.1109\/ICICS49469.2020.239556","DOI":"10.1109\/ICICS49469.2020.239556"},{"key":"5961_CR26","doi-asserted-by":"publisher","first-page":"106631","DOI":"10.1016\/j.knosys.2020.106631","volume":"212","author":"V Pattaramon","year":"2021","unstructured":"Pattaramon V, Eyad E, Andrei P (2021) On the class overlap problem in imbalanced data classification. Knowl-Based Syst 212:106631. https:\/\/doi.org\/10.1016\/j.knosys.2020.106631","journal-title":"Knowl-Based Syst"},{"issue":"1","key":"5961_CR27","doi-asserted-by":"publisher","first-page":"1","DOI":"10.1186\/s40537-019-0197-0","volume":"6","author":"C Shorten","year":"2019","unstructured":"Shorten C, Khoshgoftaar TM (2019) A survey on image data augmentation for deep learning. J Big Data 6(1):1\u20134. https:\/\/doi.org\/10.1186\/s40537-019-0197-0","journal-title":"J Big Data"},{"issue":"6","key":"5961_CR28","doi-asserted-by":"publisher","first-page":"12411","DOI":"10.3233\/JIFS-210555","volume":"40","author":"HY Wang","year":"2021","unstructured":"Wang HY, Wang JS, Zhu LF (2021) A new validity function of fcm clustering algorithm based on intra-class compactness and inter-class separation. J Intell Fuzz Syst 40(6):12411\u201312432. https:\/\/doi.org\/10.3233\/JIFS-210555","journal-title":"J Intell Fuzz Syst"},{"issue":"4","key":"5961_CR29","doi-asserted-by":"publisher","first-page":"588","DOI":"10.1109\/JAS.2017.7510583","volume":"4","author":"KF Wang","year":"2017","unstructured":"Wang KF, Gou C, Duan YJ, Lin YL, Zheng XH, Wang FY (2017) Generative adversarial networks: introduction and outlook. IEEE\/CAA J Automatica Sinica 4(4):588\u201359. https:\/\/doi.org\/10.1109\/JAS.2017.7510583","journal-title":"IEEE\/CAA J Automatica Sinica"},{"key":"5961_CR30","doi-asserted-by":"publisher","DOI":"10.1007\/s13042-023-02047-6","author":"LY Wen","year":"2023","unstructured":"Wen LY, Chen Z, Xie XN, Min F (2023) Microbial data augmentation combining feature extraction and transformer network. Int J Mach Learn Cybern. https:\/\/doi.org\/10.1007\/s13042-023-02047-6","journal-title":"Int J Mach Learn Cybern"},{"key":"5961_CR31","doi-asserted-by":"publisher","unstructured":"Wen LY, Wang X, Min F (2023) Cost-sensitive microbial data augmentation through matrix factorization. Appl Intell 12684\u2013127. https:\/\/doi.org\/10.1007\/s10489-022-04187-8","DOI":"10.1007\/s10489-022-04187-8"},{"key":"5961_CR32","doi-asserted-by":"publisher","unstructured":"Wen LY, Zhang XM, Li QF, Min F (2023) Kga: integrating kpca and gan for microbial data augmentation. Int J Mach Learn Cybern 1427\u2013144. https:\/\/doi.org\/10.1007\/s13042-022-01707-3","DOI":"10.1007\/s13042-022-01707-3"},{"key":"5961_CR33","doi-asserted-by":"publisher","unstructured":"Yang FL, Zou Q (2020) mAML: an automated machine learning pipeline with a microbiome repository for human disease classification. Database 2020. https:\/\/doi.org\/10.1093\/database\/baaa050","DOI":"10.1093\/database\/baaa050"}],"container-title":["Applied Intelligence"],"original-title":[],"language":"en","link":[{"URL":"https:\/\/link.springer.com\/content\/pdf\/10.1007\/s10489-024-05961-6.pdf","content-type":"application\/pdf","content-version":"vor","intended-application":"text-mining"},{"URL":"https:\/\/link.springer.com\/article\/10.1007\/s10489-024-05961-6\/fulltext.html","content-type":"text\/html","content-version":"vor","intended-application":"text-mining"},{"URL":"https:\/\/link.springer.com\/content\/pdf\/10.1007\/s10489-024-05961-6.pdf","content-type":"application\/pdf","content-version":"vor","intended-application":"similarity-checking"}],"deposited":{"date-parts":[[2025,1,2]],"date-time":"2025-01-02T15:13:18Z","timestamp":1735830798000},"score":1,"resource":{"primary":{"URL":"https:\/\/link.springer.com\/10.1007\/s10489-024-05961-6"}},"subtitle":[],"short-title":[],"issued":{"date-parts":[[2024,11,29]]},"references-count":33,"journal-issue":{"issue":"1","published-print":{"date-parts":[[2025,1]]}},"alternative-id":["5961"],"URL":"https:\/\/doi.org\/10.1007\/s10489-024-05961-6","relation":{},"ISSN":["0924-669X","1573-7497"],"issn-type":[{"type":"print","value":"0924-669X"},{"type":"electronic","value":"1573-7497"}],"subject":[],"published":{"date-parts":[[2024,11,29]]},"assertion":[{"value":"5 October 2024","order":1,"name":"accepted","label":"Accepted","group":{"name":"ArticleHistory","label":"Article History"}},{"value":"29 November 2024","order":2,"name":"first_online","label":"First Online","group":{"name":"ArticleHistory","label":"Article History"}},{"order":1,"name":"Ethics","group":{"name":"EthicsHeading","label":"Declarations"}},{"value":"The authors declare that they have no financial and personal relationships with other people or organizations that can inappropriately influence our work. There is no professional or other personal interest of any nature or kind in any product, service and\/or company that could be construed as influencing the position presented in, or the review of, the manuscript entitled.","order":2,"name":"Ethics","group":{"name":"EthicsHeading","label":"Competing Interests"}},{"value":"This paper does not contain any studies with animals performed by any of the authors. Informed consent was obtained from all individual participants included in the study.","order":3,"name":"Ethics","group":{"name":"EthicsHeading","label":"Ethical and Informed Consent"}}],"article-number":"47"}}