{"status":"ok","message-type":"work","message-version":"1.0.0","message":{"indexed":{"date-parts":[[2025,3,25]],"date-time":"2025-03-25T14:49:35Z","timestamp":1742914175812,"version":"3.40.3"},"publisher-location":"Singapore","reference-count":48,"publisher":"Springer Nature Singapore","isbn-type":[{"type":"print","value":"9789819722402"},{"type":"electronic","value":"9789819722389"}],"license":[{"start":{"date-parts":[[2024,1,1]],"date-time":"2024-01-01T00:00:00Z","timestamp":1704067200000},"content-version":"tdm","delay-in-days":0,"URL":"https:\/\/www.springernature.com\/gp\/researchers\/text-and-data-mining"},{"start":{"date-parts":[[2024,1,1]],"date-time":"2024-01-01T00:00:00Z","timestamp":1704067200000},"content-version":"vor","delay-in-days":0,"URL":"https:\/\/www.springernature.com\/gp\/researchers\/text-and-data-mining"}],"content-domain":{"domain":["link.springer.com"],"crossmark-restriction":false},"short-container-title":[],"published-print":{"date-parts":[[2024]]},"DOI":"10.1007\/978-981-97-2238-9_21","type":"book-chapter","created":{"date-parts":[[2024,4,30]],"date-time":"2024-04-30T12:01:48Z","timestamp":1714478508000},"page":"271-283","update-policy":"https:\/\/doi.org\/10.1007\/springer_crossmark_policy","source":"Crossref","is-referenced-by-count":1,"title":["A Data-Driven Approach for\u00a0Building a\u00a0Cardiovascular Disease Risk Prediction System"],"prefix":"10.1007","author":[{"ORCID":"https:\/\/orcid.org\/0000-0003-3062-5282","authenticated-orcid":false,"given":"Hongkuan","family":"Wang","sequence":"first","affiliation":[],"role":[{"role":"author","vocabulary":"crossref"}]},{"ORCID":"https:\/\/orcid.org\/0000-0002-9814-6029","authenticated-orcid":false,"given":"Raymond K.","family":"Wong","sequence":"additional","affiliation":[],"role":[{"role":"author","vocabulary":"crossref"}]},{"ORCID":"https:\/\/orcid.org\/0000-0001-7229-7614","authenticated-orcid":false,"given":"Kwok Leung","family":"Ong","sequence":"additional","affiliation":[],"role":[{"role":"author","vocabulary":"crossref"}]}],"member":"297","published-online":{"date-parts":[[2024,5,1]]},"reference":[{"issue":"1","key":"21_CR1","doi-asserted-by":"publisher","first-page":"15","DOI":"10.1186\/s13040-022-00300-2","volume":"15","author":"A Romero","year":"2022","unstructured":"Romero, A., et al.: Benchmarking automl frameworks for disease prediction using medical claims. BioData Mining 15(1), 15 (2022)","journal-title":"BioData Mining"},{"key":"21_CR2","doi-asserted-by":"publisher","DOI":"10.3389\/fcvm.2022.840262","volume":"9","author":"S Amal","year":"2022","unstructured":"Amal, S., Safarnejad, L., Omiye, J.A., Ghanzouri, I., Cabot, J.H., Ross, E.G.: Use of multi-modal data and machine learning to improve cardiovascular disease care. Front. Cardiovascular Med. 9, 840262 (2022)","journal-title":"Front. Cardiovascular Med."},{"key":"21_CR3","doi-asserted-by":"publisher","first-page":"13527","DOI":"10.1109\/ACCESS.2020.2966296","volume":"8","author":"P Barbara","year":"2020","unstructured":"Barbara, P.: Learning from high-dimensional biomedical datasets: The issue of class imbalance. IEEE Access 8, 13527\u201313540 (2020). https:\/\/doi.org\/10.1109\/ACCESS.2020.2966296","journal-title":"IEEE Access"},{"issue":"2","key":"21_CR4","doi-asserted-by":"publisher","first-page":"405","DOI":"10.1109\/TKDE.2012.232","volume":"26","author":"S Barua","year":"2012","unstructured":"Barua, S., Islam, M.M., Yao, X., Murase, K.: Mwmote-majority weighted minority oversampling technique for imbalanced data set learning. IEEE Trans. Knowl. Data Eng. 26(2), 405\u2013425 (2012)","journal-title":"IEEE Trans. Knowl. Data Eng."},{"issue":"251\u2013260","key":"21_CR5","first-page":"48","volume":"87","author":"GE Batista","year":"2002","unstructured":"Batista, G.E., Monard, M.C., et al.: A study of k-nearest neighbour as an imputation method. His 87(251\u2013260), 48 (2002)","journal-title":"His"},{"issue":"1","key":"21_CR6","doi-asserted-by":"publisher","first-page":"118","DOI":"10.1186\/1471-2288-14-118","volume":"14","author":"ML Bell","year":"2014","unstructured":"Bell, M.L., Fiero, M., Horton, N.J., Hsu, C.H.: Handling missing data in rcts; a review of the top medical journals. BMC Med. Res. Methodol. 14(1), 118 (2014)","journal-title":"BMC Med. Res. Methodol."},{"key":"21_CR7","doi-asserted-by":"crossref","unstructured":"Boser, B.E., Guyon, I.M., Vapnik, V.N.: A training algorithm for optimal margin classifiers. In: Proceedings of the Fifth Annual Workshop on Computational Learning Theory, pp. 144\u2013152 (1992)","DOI":"10.1145\/130385.130401"},{"issue":"2","key":"21_CR8","doi-asserted-by":"publisher","first-page":"1","DOI":"10.1145\/2907070","volume":"49","author":"P Branco","year":"2016","unstructured":"Branco, P., Torgo, L., Ribeiro, R.P.: A survey of predictive modeling on imbalanced domains. ACM Comput. Surv. (CSUR) 49(2), 1\u201350 (2016)","journal-title":"ACM Comput. Surv. (CSUR)"},{"key":"21_CR9","doi-asserted-by":"publisher","unstructured":"Branco, P., Torgo, L., Ribeiro, R.P.: A survey of predictive modeling on imbalanced domains. ACM Comput. Surv. 49(2) (2016).https:\/\/doi.org\/10.1145\/2907070","DOI":"10.1145\/2907070"},{"key":"21_CR10","doi-asserted-by":"crossref","unstructured":"Brazdil, P., Carrier, C.G., Soares, C., Vilalta, R.: Metalearning: Applications to data mining. Springer Science & Business Media (2008)","DOI":"10.1007\/978-3-540-73263-1"},{"key":"21_CR11","unstructured":"Burda, Y., Grosse, R., Salakhutdinov, R.: Importance weighted autoencoders. arXiv preprint arXiv:1509.00519 (2015)"},{"issue":"3","key":"21_CR12","doi-asserted-by":"publisher","first-page":"1","DOI":"10.18637\/jss.v045.i03","volume":"45","author":"S van Buuren","year":"2011","unstructured":"van Buuren, S., Groothuis-Oudshoorn, K.: mice: Multivariate imputation by chained equations in r. J. Stat. Softw. 45(3), 1\u201367 (2011)","journal-title":"J. Stat. Softw."},{"key":"21_CR13","unstructured":"CDC: National health and nutrition examination survey (2022). http:\/\/www.cdc.gov\/nchs\/nhanes\/about_nhanes.html"},{"issue":"6","key":"21_CR14","doi-asserted-by":"publisher","first-page":"2083","DOI":"10.1007\/s10994-022-06282-w","volume":"112","author":"V Cerqueira","year":"2023","unstructured":"Cerqueira, V., Torgo, L., Branco, P., Bellinger, C.: Automated imbalanced classification via layered learning. Mach. Learn. 112(6), 2083\u20132104 (2023)","journal-title":"Mach. Learn."},{"key":"21_CR15","doi-asserted-by":"publisher","first-page":"321","DOI":"10.1613\/jair.953","volume":"16","author":"NV Chawla","year":"2002","unstructured":"Chawla, N.V., Bowyer, K.W., Hall, L.O., Kegelmeyer, W.P.: Smote: synthetic minority over-sampling technique. J. Artifi. Intell. Res. 16, 321\u2013357 (2002)","journal-title":"J. Artifi. Intell. Res."},{"key":"21_CR16","doi-asserted-by":"crossref","unstructured":"Chen, T., Guestrin, C.: Xgboost: a scalable tree boosting system. In: Proceedings of the 22nd ACM SIGKDD International Conference on Knowledge Discovery and Data Mining, pp. 785\u2013794 (2016)","DOI":"10.1145\/2939672.2939785"},{"issue":"2","key":"21_CR17","doi-asserted-by":"publisher","first-page":"215","DOI":"10.1111\/j.2517-6161.1958.tb00292.x","volume":"20","author":"DR Cox","year":"1958","unstructured":"Cox, D.R.: The regression analysis of binary sequences. J. R. Stat. Soc. Ser. B Stat Methodol. 20(2), 215\u2013232 (1958)","journal-title":"J. R. Stat. Soc. Ser. B Stat Methodol."},{"key":"21_CR18","unstructured":"Drori, I., et al.: Alphad3m: machine learning pipeline synthesis. arXiv preprint arXiv:2111.02508 (2021)"},{"key":"21_CR19","unstructured":"Feurer, M., Klein, A., Eggensperger, K., Springenberg, J., Blum, M., Hutter, F.: Efficient and robust automated machine learning. In: Advances in Neural Information Processing Systems 28, pp. 2962\u20132970 (2015)"},{"key":"21_CR20","doi-asserted-by":"publisher","first-page":"1","DOI":"10.1186\/1472-6947-12-8","volume":"12","author":"RL Figueroa","year":"2012","unstructured":"Figueroa, R.L., Zeng-Treitler, Q., Kandula, S., Ngo, L.H.: Predicting sample size required for classification performance. BMC Med. Inform. Decis. Mak. 12, 1\u201310 (2012)","journal-title":"BMC Med. Inform. Decis. Mak."},{"issue":"1","key":"21_CR21","doi-asserted-by":"publisher","first-page":"119","DOI":"10.1006\/jcss.1997.1504","volume":"55","author":"Y Freund","year":"1997","unstructured":"Freund, Y., Schapire, R.E.: A decision-theoretic generalization of on-line learning and an application to boosting. J. Comput. Syst. Sci. 55(1), 119\u2013139 (1997)","journal-title":"J. Comput. Syst. Sci."},{"key":"21_CR22","doi-asserted-by":"crossref","unstructured":"Fuse, H., Oishi, K., Maikusa, N., Fukami, T., Initiative, J.A.D.N.: Detection of alzheimer\u2019s disease with shape analysis of mri images, pp. 1031\u20131034 (2018)","DOI":"10.1109\/SCIS-ISIS.2018.00171"},{"issue":"8","key":"21_CR23","doi-asserted-by":"publisher","first-page":"1","DOI":"10.1109\/LSENS.2020.3006756","volume":"4","author":"B Ganguly","year":"2020","unstructured":"Ganguly, B., Ghosal, A., Das, A., Das, D., Chatterjee, D., Rakshit, D.: Automated detection and classification of arrhythmia from ecg signals using feature-induced long short-term memory network. IEEE Sensors Lett. 4(8), 1\u20134 (2020)","journal-title":"IEEE Sensors Lett."},{"key":"21_CR24","doi-asserted-by":"crossref","unstructured":"Hutter, F., Kotthoff, L., Vanschoren, J.: Automated machine learning: methods, systems, challenges. Springer Nature (2019)","DOI":"10.1007\/978-3-030-05318-5"},{"key":"21_CR25","doi-asserted-by":"crossref","unstructured":"Jinjri, W.M., Keikhosrokiani, P., Abdullah, N.L.: Machine learning algorithms for the classification of cardiovascular disease- a comparative study. In: 2021 International Conference on Information Technology (ICIT), pp. 132\u2013138 (2021)","DOI":"10.1109\/ICIT52682.2021.9491677"},{"key":"21_CR26","doi-asserted-by":"publisher","first-page":"237","DOI":"10.1613\/jair.301","volume":"4","author":"LP Kaelbling","year":"1996","unstructured":"Kaelbling, L.P., Littman, M.L., Moore, A.W.: Reinforcement learning: a survey. J. Artifi. Intell. Res. 4, 237\u2013285 (1996)","journal-title":"J. Artifi. Intell. Res."},{"key":"21_CR27","first-page":"23806","volume":"34","author":"T Kyono","year":"2021","unstructured":"Kyono, T., Zhang, Y., Bellot, A., van der Schaar, M.: Miracle: causally-aware imputation via learning missing data mechanisms. Adv. Neural. Inf. Process. Syst. 34, 23806\u201323817 (2021)","journal-title":"Adv. Neural. Inf. Process. Syst."},{"key":"21_CR28","doi-asserted-by":"publisher","first-page":"7869","DOI":"10.1109\/ACCESS.2020.3047942","volume":"9","author":"TM Le","year":"2021","unstructured":"Le, T.M., Vo, T.M., Pham, T.N., Dao, S.V.T.: A novel wrapper-based feature selection for early diabetes prediction enhanced with a metaheuristic. IEEE Access 9, 7869\u20137884 (2021)","journal-title":"IEEE Access"},{"key":"21_CR29","unstructured":"LeDell, E., Poirier, S.: H2o automl: Scalable automatic machine learning. In: Proceedings of the AutoML Workshop at ICML, vol.\u00a02020. ICML (2020)"},{"issue":"9","key":"21_CR30","doi-asserted-by":"publisher","first-page":"9776","DOI":"10.3390\/ijerph110909776","volume":"11","author":"PH Lee","year":"2014","unstructured":"Lee, P.H.: Resampling methods improve the predictive power of modeling in class-imbalanced datasets. Int. J. Environ. Res. Public Health 11(9), 9776\u20139789 (2014)","journal-title":"Int. J. Environ. Res. Public Health"},{"key":"21_CR31","unstructured":"Mattei, P.A., Frellsen, J.: Miwae: deep generative modelling and imputation of incomplete data sets. In: International Conference on Machine Learning, pp. 4413\u20134423. PMLR (2019)"},{"key":"21_CR32","doi-asserted-by":"publisher","first-page":"92","DOI":"10.1007\/s10618-012-0295-5","volume":"28","author":"G Menardi","year":"2014","unstructured":"Menardi, G., Torelli, N.: Training and assessing classification rules with imbalanced data. Data Min. Knowl. Disc. 28, 92\u2013122 (2014)","journal-title":"Data Min. Knowl. Disc."},{"key":"21_CR33","doi-asserted-by":"publisher","DOI":"10.1016\/j.eswa.2021.115011","volume":"178","author":"N Moniz","year":"2021","unstructured":"Moniz, N., Cerqueira, V.: Automated imbalanced classification via meta-learning. Expert Syst. Appl. 178, 115011 (2021)","journal-title":"Expert Syst. Appl."},{"key":"21_CR34","doi-asserted-by":"crossref","unstructured":"Mustafa, A., Rahimi Azghadi, M.: Automated machine learning for healthcare and clinical notes analysis. Computers 10(2), 24 (2021). https:\/\/www.mdpi.com\/2073-431X\/10\/2\/24","DOI":"10.3390\/computers10020024"},{"key":"21_CR35","doi-asserted-by":"crossref","unstructured":"Nguyen, H.M., Cooper, E.W., Kamei, K.: A comparative study on sampling techniques for handling class imbalance in streaming data. In: The 6th International Conference on Soft Computing and Intelligent Systems, and The 13th International Symposium on Advanced Intelligence Systems, pp. 1762\u20131767. IEEE (2012)","DOI":"10.1109\/SCIS-ISIS.2012.6505291"},{"key":"21_CR36","series-title":"Lecture Notes in Computer Science","doi-asserted-by":"publisher","first-page":"123","DOI":"10.1007\/978-3-319-31204-0_9","volume-title":"Applications of Evolutionary Computation","author":"RS Olson","year":"2016","unstructured":"Olson, R.S., Urbanowicz, R.J., Andrews, P.C., Lavender, N.A., Kidd, L.C., Moore, J.H.: Automating biomedical data science through tree-based pipeline optimization. In: Squillero, G., Burelli, P. (eds.) EvoApplications 2016. LNCS, vol. 9597, pp. 123\u2013137. Springer, Cham (2016). https:\/\/doi.org\/10.1007\/978-3-319-31204-0_9"},{"key":"21_CR37","doi-asserted-by":"publisher","unstructured":"Pes, B.: Handling class imbalance in high-dimensional biomedical datasets, pp. 150\u2013155 (2019). https:\/\/doi.org\/10.1109\/WETICE.2019.00040","DOI":"10.1109\/WETICE.2019.00040"},{"key":"21_CR38","doi-asserted-by":"crossref","unstructured":"Rumelhart, D.E., Hinton, G.E., Williams, R.J., et\u00a0al.: Learning internal representations by error propagation (1985)","DOI":"10.21236\/ADA164453"},{"key":"21_CR39","doi-asserted-by":"publisher","unstructured":"Shastry, K.A., Sanjay, H.A.: Machine Learning for Bioinformatics, pp. 25\u201339. Springer Singapore, Singapore (2020). https:\/\/doi.org\/10.1007\/978-981-15-2445-5_3","DOI":"10.1007\/978-981-15-2445-5_3"},{"key":"21_CR40","series-title":"Lecture Notes in Computer Science (Lecture Notes in Artificial Intelligence)","doi-asserted-by":"publisher","first-page":"369","DOI":"10.1007\/3-540-45164-1_38","volume-title":"Machine Learning: ECML 2000","author":"P Stone","year":"2000","unstructured":"Stone, P., Veloso, M.: Layered learning. In: L\u00f3pez de M\u00e1ntaras, R., Plaza, E. (eds.) ECML 2000. LNCS (LNAI), vol. 1810, pp. 369\u2013381. Springer, Heidelberg (2000). https:\/\/doi.org\/10.1007\/3-540-45164-1_38"},{"issue":"10","key":"21_CR41","doi-asserted-by":"publisher","first-page":"890","DOI":"10.1109\/32.962560","volume":"27","author":"K Strike","year":"2001","unstructured":"Strike, K., El Emam, K., Madhavji, N.: Software cost estimation with incomplete data. IEEE Trans. Software Eng. 27(10), 890\u2013908 (2001)","journal-title":"IEEE Trans. Software Eng."},{"key":"21_CR42","doi-asserted-by":"crossref","unstructured":"Thornton, C., Hutter, F., Hoos, H.H., Leyton-Brown, K.: Auto-weka: combined selection and hyperparameter optimization of classification algorithms. In: Proceedings of the 19th ACM SIGKDD International Conference on Knowledge Discovery and Data Mining, pp. 847\u2013855 (2013)","DOI":"10.1145\/2487575.2487629"},{"key":"21_CR43","doi-asserted-by":"publisher","DOI":"10.1016\/j.artmed.2020.101822","volume":"104","author":"J Waring","year":"2020","unstructured":"Waring, J., Lindvall, C., Umeton, R.: Automated machine learning: review of the state-of-the-art and opportunities for healthcare. Artif. Intell. Med. 104, 101822 (2020). https:\/\/doi.org\/10.1016\/j.artmed.2020.101822","journal-title":"Artif. Intell. Med."},{"key":"21_CR44","unstructured":"WHO: (2021). https:\/\/www.who.int\/news-room\/fact-sheets\/detail\/cardiovascular-diseases-(cvds)"},{"key":"21_CR45","unstructured":"Yoon, J., Jordon, J., van\u00a0der Schaar, M.: GAIN: missing data imputation using generative adversarial nets. In: Dy, J., Krause, A. (eds.) Proceedings of the 35th International Conference on Machine Learning. Proceedings of Machine Learning Research, vol.\u00a080, pp. 5689\u20135698. PMLR (10\u201315 Jul 2018). https:\/\/proceedings.mlr.press\/v80\/yoon18a.html"},{"key":"21_CR46","doi-asserted-by":"publisher","unstructured":"Yuan, L.: Evaluating the state of the art in missing data imputation for clinical data. Briefings Bioinform. 23(1), bbab489 (2022). https:\/\/doi.org\/10.1093\/bib\/bbab489","DOI":"10.1093\/bib\/bbab489"},{"key":"21_CR47","doi-asserted-by":"crossref","unstructured":"Zha, D., Lai, K.H., Tan, Q., Ding, S., Zou, N., Hu, X.B.: Towards automated imbalanced learning with deep hierarchical reinforcement learning. In: Proceedings of the 31st ACM International Conference on Information & Knowledge Management, pp. 2476\u20132485 (2022)","DOI":"10.1145\/3511808.3557474"},{"key":"21_CR48","doi-asserted-by":"publisher","first-page":"409","DOI":"10.1613\/jair.1.11854","volume":"70","author":"MA Z\u00f6ller","year":"2021","unstructured":"Z\u00f6ller, M.A., Huber, M.F.: Benchmark and survey of automated machine learning frameworks. J. Artifi. Intell. Res. 70, 409\u2013472 (2021)","journal-title":"J. Artifi. Intell. Res."}],"container-title":["Lecture Notes in Computer Science","Advances in Knowledge Discovery and Data Mining"],"original-title":[],"language":"en","link":[{"URL":"https:\/\/link.springer.com\/content\/pdf\/10.1007\/978-981-97-2238-9_21","content-type":"unspecified","content-version":"vor","intended-application":"similarity-checking"}],"deposited":{"date-parts":[[2024,4,30]],"date-time":"2024-04-30T12:09:16Z","timestamp":1714478956000},"score":1,"resource":{"primary":{"URL":"https:\/\/link.springer.com\/10.1007\/978-981-97-2238-9_21"}},"subtitle":[],"short-title":[],"issued":{"date-parts":[[2024]]},"ISBN":["9789819722402","9789819722389"],"references-count":48,"URL":"https:\/\/doi.org\/10.1007\/978-981-97-2238-9_21","relation":{},"ISSN":["0302-9743","1611-3349"],"issn-type":[{"type":"print","value":"0302-9743"},{"type":"electronic","value":"1611-3349"}],"subject":[],"published":{"date-parts":[[2024]]},"assertion":[{"value":"1 May 2024","order":1,"name":"first_online","label":"First Online","group":{"name":"ChapterHistory","label":"Chapter History"}},{"value":"PAKDD","order":1,"name":"conference_acronym","label":"Conference Acronym","group":{"name":"ConferenceInfo","label":"Conference Information"}},{"value":"Pacific-Asia Conference on Knowledge Discovery and Data Mining","order":2,"name":"conference_name","label":"Conference Name","group":{"name":"ConferenceInfo","label":"Conference Information"}},{"value":"Taipei","order":3,"name":"conference_city","label":"Conference City","group":{"name":"ConferenceInfo","label":"Conference Information"}},{"value":"Taiwan","order":4,"name":"conference_country","label":"Conference Country","group":{"name":"ConferenceInfo","label":"Conference Information"}},{"value":"2024","order":5,"name":"conference_year","label":"Conference Year","group":{"name":"ConferenceInfo","label":"Conference Information"}},{"value":"7 May 2024","order":7,"name":"conference_start_date","label":"Conference Start Date","group":{"name":"ConferenceInfo","label":"Conference Information"}},{"value":"10 May 2024","order":8,"name":"conference_end_date","label":"Conference End Date","group":{"name":"ConferenceInfo","label":"Conference Information"}},{"value":"28","order":9,"name":"conference_number","label":"Conference Number","group":{"name":"ConferenceInfo","label":"Conference Information"}},{"value":"pakdd2024","order":10,"name":"conference_id","label":"Conference ID","group":{"name":"ConferenceInfo","label":"Conference Information"}},{"value":"https:\/\/pakdd2024.org\/","order":11,"name":"conference_url","label":"Conference URL","group":{"name":"ConferenceInfo","label":"Conference Information"}}]}}