{"status":"ok","message-type":"work","message-version":"1.0.0","message":{"indexed":{"date-parts":[[2026,2,4]],"date-time":"2026-02-04T14:21:27Z","timestamp":1770214887572,"version":"3.49.0"},"publisher-location":"Singapore","reference-count":13,"publisher":"Springer Nature Singapore","isbn-type":[{"value":"9789819557219","type":"print"},{"value":"9789819557226","type":"electronic"}],"license":[{"start":{"date-parts":[[2026,1,1]],"date-time":"2026-01-01T00:00:00Z","timestamp":1767225600000},"content-version":"tdm","delay-in-days":0,"URL":"https:\/\/www.springernature.com\/gp\/researchers\/text-and-data-mining"},{"start":{"date-parts":[[2026,1,1]],"date-time":"2026-01-01T00:00:00Z","timestamp":1767225600000},"content-version":"vor","delay-in-days":0,"URL":"https:\/\/www.springernature.com\/gp\/researchers\/text-and-data-mining"}],"content-domain":{"domain":["link.springer.com"],"crossmark-restriction":false},"short-container-title":[],"published-print":{"date-parts":[[2026]]},"DOI":"10.1007\/978-981-95-5722-6_14","type":"book-chapter","created":{"date-parts":[[2026,2,1]],"date-time":"2026-02-01T08:14:16Z","timestamp":1769933656000},"page":"175-183","update-policy":"https:\/\/doi.org\/10.1007\/springer_crossmark_policy","source":"Crossref","is-referenced-by-count":0,"title":["Resolving Memory Challenges in\u00a0Cluster Computing Systems Via Stratified Asymptotic Sampling for\u00a0Big Data Classification"],"prefix":"10.1007","author":[{"given":"Chenghao","family":"Wei","sequence":"first","affiliation":[]},{"given":"Quan","family":"Li","sequence":"additional","affiliation":[]},{"given":"Chen","family":"Li","sequence":"additional","affiliation":[]},{"given":"PuKai","family":"Wang","sequence":"additional","affiliation":[]}],"member":"297","published-online":{"date-parts":[[2026,2,2]]},"reference":[{"key":"14_CR1","doi-asserted-by":"publisher","first-page":"101959","DOI":"10.1016\/j.jocs.2023.101959","volume":"67","author":"DO Cardoso","year":"2023","unstructured":"Cardoso, D.O., Galeno, T.D.: Online evaluation of the Kolmogorov-Smirnov test on arbitrarily large samples. J. Comput. Sci. 67, 101959 (2023)","journal-title":"J. Comput. Sci."},{"key":"14_CR2","unstructured":"Hagen, A., et al.: Accelerated computation of a high dimensional Kolmogorov-Smirnov distance. arXiv preprint arXiv:2106.13706 (2021)"},{"key":"14_CR3","unstructured":"Hagen, A., Strube, J., Haide, I., Kahn, J., Jackson, S., Hainje, C.: A proposed high dimensional Kolmogorov-Smirnov distance. In: Proceedings of the Machine Learning and the Physical Sciences: Workshop at the 34th Conference on Neural Information Processing Systems (NeurIPS), Vancouver, BC, Canada, pp. 6\u201312 (2020)"},{"key":"14_CR4","doi-asserted-by":"crossref","unstructured":"Liang, B., Wu, D.: Memory priority scheduling algorithm for cloud data center based on machine learning dynamic clustering algorithm. IEEE Trans. Industr. Inform. (2025)","DOI":"10.1109\/TII.2025.3528574"},{"key":"14_CR5","doi-asserted-by":"publisher","first-page":"752","DOI":"10.1016\/j.future.2024.06.025","volume":"160","author":"S Lim","year":"2024","unstructured":"Lim, S., Park, D.: Improving Hadoop MapReduce performance on heterogeneous single board computer clusters. Futur. Gener. Comput. Syst. 160, 752\u2013766 (2024)","journal-title":"Futur. Gener. Comput. Syst."},{"key":"14_CR6","doi-asserted-by":"crossref","unstructured":"Liu, D., Li, Z., Zhang, Z.: Echo: adaptive correction for subgraph-wise sampling with lightweight hyperparameter search. In: Asia-Pacific Web (APWeb) and Web-Age Information Management (WAIM) Joint International Conference on Web and Big Data, pp. 179\u2013194. Springer (2024)","DOI":"10.1007\/978-981-97-7244-5_12"},{"issue":"2","key":"14_CR7","doi-asserted-by":"publisher","first-page":"85","DOI":"10.26599\/BDMA.2019.9020015","volume":"3","author":"MS Mahmud","year":"2020","unstructured":"Mahmud, M.S., Huang, J.Z., Salloum, S., Emara, T.Z., Sadatdiynov, K.: A survey of data partitioning and sampling methods to support big data analysis. Big Data Min. Anal. 3(2), 85\u2013101 (2020)","journal-title":"Big Data Min. Anal."},{"key":"14_CR8","doi-asserted-by":"publisher","first-page":"111321","DOI":"10.1016\/j.patcog.2024.111321","volume":"161","author":"MS Mahmud","year":"2025","unstructured":"Mahmud, M.S., Zheng, H., Garcia-Gil, D., Garc\u00eda, S., Huang, J.Z.: RSPCA: random sample partition and clustering approximation for ensemble learning of big data. Pattern Recogn. 161, 111321 (2025)","journal-title":"Pattern Recogn."},{"issue":"9","key":"14_CR9","first-page":"35","volume":"4","author":"C Perera","year":"2024","unstructured":"Perera, C., et al.: Optimizing performance in parallel and distributed computing systems for large-scale applications. J. Adv. Comput. Syst. 4(9), 35\u201344 (2024)","journal-title":"J. Adv. Comput. Syst."},{"key":"14_CR10","doi-asserted-by":"publisher","first-page":"111638","DOI":"10.1016\/j.asoc.2024.111638","volume":"159","author":"L Qin","year":"2024","unstructured":"Qin, L., Wang, X., Yin, L., Jiang, Z.: A distributed evolutionary based instance selection algorithm for big data using apache spark. Appl. Soft Comput. 159, 111638 (2024)","journal-title":"Appl. Soft Comput."},{"issue":"143","key":"14_CR11","first-page":"1","volume":"12","author":"H Soudabeh","year":"2023","unstructured":"Soudabeh, H., Neda, M., Tobias, O., Fredrik, A., Mahdi, S., Kamal, B.: MapReduce scheduling algorithms in Hadoop: a systematic study. J. Cloud Comput. 12(143), 1\u201330 (2023)","journal-title":"J. Cloud Comput."},{"issue":"2","key":"14_CR12","doi-asserted-by":"publisher","first-page":"1","DOI":"10.1007\/s10723-023-09653-2","volume":"21","author":"MT Wu","year":"2023","unstructured":"Wu, M.T., Zhou, H., Lin, J.C.W., Srivastava, G., Baza, M.: Mining skyline patterns from big data environments based on a spark framework. J. Grid Comput. 21(2), 1\u201319 (2023)","journal-title":"J. Grid Comput."},{"issue":"5","key":"14_CR13","doi-asserted-by":"publisher","first-page":"3719","DOI":"10.1007\/s10586-022-03597-0","volume":"25","author":"L Yun","year":"2022","unstructured":"Yun, L., Xiao, Z., Binbin, L., Xiaonan, Z.: The research and analysis of efficiency of hardware usage base on HDFs. Clust. Comput. 25(5), 3719\u20133732 (2022)","journal-title":"Clust. Comput."}],"container-title":["Lecture Notes in Computer Science","Web and Big Data"],"original-title":[],"language":"en","link":[{"URL":"https:\/\/link.springer.com\/content\/pdf\/10.1007\/978-981-95-5722-6_14","content-type":"unspecified","content-version":"vor","intended-application":"similarity-checking"}],"deposited":{"date-parts":[[2026,2,1]],"date-time":"2026-02-01T08:14:18Z","timestamp":1769933658000},"score":1,"resource":{"primary":{"URL":"https:\/\/link.springer.com\/10.1007\/978-981-95-5722-6_14"}},"subtitle":[],"short-title":[],"issued":{"date-parts":[[2026]]},"ISBN":["9789819557219","9789819557226"],"references-count":13,"URL":"https:\/\/doi.org\/10.1007\/978-981-95-5722-6_14","relation":{},"ISSN":["0302-9743","1611-3349"],"issn-type":[{"value":"0302-9743","type":"print"},{"value":"1611-3349","type":"electronic"}],"subject":[],"published":{"date-parts":[[2026]]},"assertion":[{"value":"2 February 2026","order":1,"name":"first_online","label":"First Online","group":{"name":"ChapterHistory","label":"Chapter History"}},{"value":"APWeb-WAIM","order":1,"name":"conference_acronym","label":"Conference Acronym","group":{"name":"ConferenceInfo","label":"Conference Information"}},{"value":"Asia-Pacific Web (APWeb) and Web-Age Information Management (WAIM) Joint International Conference on Web and Big Data","order":2,"name":"conference_name","label":"Conference Name","group":{"name":"ConferenceInfo","label":"Conference Information"}},{"value":"Shenyang","order":3,"name":"conference_city","label":"Conference City","group":{"name":"ConferenceInfo","label":"Conference Information"}},{"value":"China","order":4,"name":"conference_country","label":"Conference Country","group":{"name":"ConferenceInfo","label":"Conference Information"}},{"value":"2025","order":5,"name":"conference_year","label":"Conference Year","group":{"name":"ConferenceInfo","label":"Conference Information"}},{"value":"28 August 2025","order":7,"name":"conference_start_date","label":"Conference Start Date","group":{"name":"ConferenceInfo","label":"Conference Information"}},{"value":"30 August 2025","order":8,"name":"conference_end_date","label":"Conference End Date","group":{"name":"ConferenceInfo","label":"Conference Information"}},{"value":"9","order":9,"name":"conference_number","label":"Conference Number","group":{"name":"ConferenceInfo","label":"Conference Information"}},{"value":"apwebwaim2025","order":10,"name":"conference_id","label":"Conference ID","group":{"name":"ConferenceInfo","label":"Conference Information"}},{"value":"https:\/\/apweb2025.sau.edu.cn\/","order":11,"name":"conference_url","label":"Conference URL","group":{"name":"ConferenceInfo","label":"Conference Information"}}]}}