{"status":"ok","message-type":"work","message-version":"1.0.0","message":{"indexed":{"date-parts":[[2025,3,28]],"date-time":"2025-03-28T05:08:35Z","timestamp":1743138515089,"version":"3.40.3"},"publisher-location":"Singapore","reference-count":10,"publisher":"Springer Nature Singapore","isbn-type":[{"type":"print","value":"9789819615308"},{"type":"electronic","value":"9789819615315"}],"license":[{"start":{"date-parts":[[2025,1,1]],"date-time":"2025-01-01T00:00:00Z","timestamp":1735689600000},"content-version":"tdm","delay-in-days":0,"URL":"https:\/\/www.springernature.com\/gp\/researchers\/text-and-data-mining"},{"start":{"date-parts":[[2025,1,1]],"date-time":"2025-01-01T00:00:00Z","timestamp":1735689600000},"content-version":"vor","delay-in-days":0,"URL":"https:\/\/www.springernature.com\/gp\/researchers\/text-and-data-mining"}],"content-domain":{"domain":["link.springer.com"],"crossmark-restriction":false},"short-container-title":[],"published-print":{"date-parts":[[2025]]},"DOI":"10.1007\/978-981-96-1531-5_46","type":"book-chapter","created":{"date-parts":[[2025,2,7]],"date-time":"2025-02-07T14:17:09Z","timestamp":1738937829000},"page":"475-485","update-policy":"https:\/\/doi.org\/10.1007\/springer_crossmark_policy","source":"Crossref","is-referenced-by-count":0,"title":["Impact of Imbalanced Data on Apache Spark"],"prefix":"10.1007","author":[{"ORCID":"https:\/\/orcid.org\/0009-0005-8552-769X","authenticated-orcid":false,"given":"Thet Hsu","family":"Aung","sequence":"first","affiliation":[]},{"ORCID":"https:\/\/orcid.org\/0009-0006-6792-6539","authenticated-orcid":false,"given":"Aye Myat Myat","family":"Paing","sequence":"additional","affiliation":[]}],"member":"297","published-online":{"date-parts":[[2025,2,8]]},"reference":[{"key":"46_CR1","doi-asserted-by":"publisher","DOI":"10.1007\/s13755-018-0051-3","volume-title":"The effects of varying class distribution on learner behavior for medicare fraud detection with imbalanced Big Data","author":"R Bauder","year":"2018","unstructured":"Bauder, R., Khoshgoftaar, T.: The effects of varying class distribution on learner behavior for medicare fraud detection with imbalanced Big Data. Florida Alantic University, Boca Raton, USA, College of Engineering and Computer Science (2018)"},{"key":"46_CR2","unstructured":"Isaac, T., Sara del, R., Victoria, L., Jaume, B., Jose, M., Franciso, H.: An extremely imbalanced Big Data bioinformatics problem. Knowledge-based System (2015)"},{"key":"46_CR3","unstructured":"Sankardas, R., Jordan, D., Yuping, L., Herndon, N., Doina, C., Xinming, O.: Experimental study with real-world data for android app security analysis using machine learning. In: Proceedings of the 31st Annual Computer Security Applications Conference (2015)"},{"key":"46_CR4","doi-asserted-by":"crossref","unstructured":"Aaron Richter, N., Taghi Khoshgoftaar, M.: Melanoma Risk Prediction with Structured Electronic Health Records. ACM-BCB (2019)","DOI":"10.1145\/3233547.3233561"},{"key":"46_CR5","unstructured":"Victoria, L., Alberto, F., Salvador, G., Vasile, P., Francisco, H.: An insight into classification with imbalanced data: Empirical results and current trends on using data intrinsic characteristics. Journal of Information Sciences (2013)"},{"key":"46_CR6","unstructured":"Prati, C., Gustavo, E., Maria, M.: learning with Class Skews and Small Disjuncts. Advanced in Artificial Intelligence (2017)"},{"key":"46_CR7","unstructured":"https:\/\/spark.apache.org\/docs\/latest\/index.html"},{"issue":"1","key":"46_CR8","doi-asserted-by":"publisher","first-page":"1","DOI":"10.1186\/s40537-019-0274-4","volume":"6","author":"T Hasanin","year":"2019","unstructured":"Hasanin, T., Khoshgoftaar, T.M., Leevy, J.L., Bauder, R.A.: Severely imbalanced Big Data challenges: investigating data sampling approaches. J. Big Data 6(1), 1\u201325 (2019). https:\/\/doi.org\/10.1186\/s40537-019-0274-4","journal-title":"J. Big Data"},{"key":"46_CR9","doi-asserted-by":"crossref","unstructured":"Garcia, F., Romulo, A., Giancarlo, L., Eduardo, N.: A performance analysis of classifiers on imbalanced data. In: Proceedings of the 24th International Conference on Enterprise Information Systems (2022)","DOI":"10.5220\/0011089100003179"},{"key":"46_CR10","unstructured":"Tanawan, W., Khamron, S., Nipotepat, M.: Comparative Evaluation of Imbalanced Data Management Techniques for Solving Classification Problems on Imbalanced Datasets. Statics, Optimization, and Information Computing (2024)"}],"container-title":["Lecture Notes in Electrical Engineering","Genetic and Evolutionary Computing"],"original-title":[],"language":"en","link":[{"URL":"https:\/\/link.springer.com\/content\/pdf\/10.1007\/978-981-96-1531-5_46","content-type":"unspecified","content-version":"vor","intended-application":"similarity-checking"}],"deposited":{"date-parts":[[2025,2,7]],"date-time":"2025-02-07T14:17:18Z","timestamp":1738937838000},"score":1,"resource":{"primary":{"URL":"https:\/\/link.springer.com\/10.1007\/978-981-96-1531-5_46"}},"subtitle":[],"short-title":[],"issued":{"date-parts":[[2025]]},"ISBN":["9789819615308","9789819615315"],"references-count":10,"URL":"https:\/\/doi.org\/10.1007\/978-981-96-1531-5_46","relation":{},"ISSN":["1876-1100","1876-1119"],"issn-type":[{"type":"print","value":"1876-1100"},{"type":"electronic","value":"1876-1119"}],"subject":[],"published":{"date-parts":[[2025]]},"assertion":[{"value":"8 February 2025","order":1,"name":"first_online","label":"First Online","group":{"name":"ChapterHistory","label":"Chapter History"}},{"value":"ICGEC","order":1,"name":"conference_acronym","label":"Conference Acronym","group":{"name":"ConferenceInfo","label":"Conference Information"}},{"value":"International Conference on Genetic and Evolutionary Computing","order":2,"name":"conference_name","label":"Conference Name","group":{"name":"ConferenceInfo","label":"Conference Information"}},{"value":"Miyazaki","order":3,"name":"conference_city","label":"Conference City","group":{"name":"ConferenceInfo","label":"Conference Information"}},{"value":"Japan","order":4,"name":"conference_country","label":"Conference Country","group":{"name":"ConferenceInfo","label":"Conference Information"}},{"value":"2024","order":5,"name":"conference_year","label":"Conference Year","group":{"name":"ConferenceInfo","label":"Conference Information"}},{"value":"27 August 2024","order":7,"name":"conference_start_date","label":"Conference Start Date","group":{"name":"ConferenceInfo","label":"Conference Information"}},{"value":"28 August 2024","order":8,"name":"conference_end_date","label":"Conference End Date","group":{"name":"ConferenceInfo","label":"Conference Information"}},{"value":"16","order":9,"name":"conference_number","label":"Conference Number","group":{"name":"ConferenceInfo","label":"Conference Information"}},{"value":"icgec2024","order":10,"name":"conference_id","label":"Conference ID","group":{"name":"ConferenceInfo","label":"Conference Information"}},{"value":"https:\/\/icgec24.github.io\/","order":11,"name":"conference_url","label":"Conference URL","group":{"name":"ConferenceInfo","label":"Conference Information"}}]}}