{"status":"ok","message-type":"work","message-version":"1.0.0","message":{"indexed":{"date-parts":[[2026,2,2]],"date-time":"2026-02-02T20:36:03Z","timestamp":1770064563171,"version":"3.49.0"},"reference-count":71,"publisher":"Springer Science and Business Media LLC","issue":"3","license":[{"start":{"date-parts":[[2022,8,23]],"date-time":"2022-08-23T00:00:00Z","timestamp":1661212800000},"content-version":"tdm","delay-in-days":0,"URL":"https:\/\/www.springernature.com\/gp\/researchers\/text-and-data-mining"},{"start":{"date-parts":[[2022,8,23]],"date-time":"2022-08-23T00:00:00Z","timestamp":1661212800000},"content-version":"vor","delay-in-days":0,"URL":"https:\/\/www.springernature.com\/gp\/researchers\/text-and-data-mining"}],"content-domain":{"domain":["link.springer.com"],"crossmark-restriction":false},"short-container-title":["Wireless Pers Commun"],"published-print":{"date-parts":[[2022,10]]},"DOI":"10.1007\/s11277-021-09362-7","type":"journal-article","created":{"date-parts":[[2022,8,23]],"date-time":"2022-08-23T09:03:05Z","timestamp":1661245385000},"page":"2403-2423","update-policy":"https:\/\/doi.org\/10.1007\/springer_crossmark_policy","source":"Crossref","is-referenced-by-count":14,"title":["Performance Evaluation of Data-driven Intelligent Algorithms for Big data Ecosystem"],"prefix":"10.1007","volume":"126","author":[{"given":"Muhammad","family":"Junaid","sequence":"first","affiliation":[]},{"given":"Sajid","family":"Ali","sequence":"additional","affiliation":[]},{"given":"Isma Farah","family":"Siddiqui","sequence":"additional","affiliation":[]},{"given":"Choonsung","family":"Nam","sequence":"additional","affiliation":[]},{"ORCID":"https:\/\/orcid.org\/0000-0002-5035-2640","authenticated-orcid":false,"given":"Nawab Muhammad Faseeh","family":"Qureshi","sequence":"additional","affiliation":[]},{"given":"Jaehyoun","family":"Kim","sequence":"additional","affiliation":[]},{"given":"Dong Ryeol","family":"Shin","sequence":"additional","affiliation":[]}],"member":"297","published-online":{"date-parts":[[2022,8,23]]},"reference":[{"key":"9362_CR1","doi-asserted-by":"crossref","unstructured":"D\u2019silva, G.M., Khan, A., & Bari, S., et\u00a0al. Real-time processing of iot events with historic data using apache kafka and apache spark with dashing framework, in 2017 2nd IEEE International Conference on Recent Trends in Electronics, Information & Communication Technology (RTEICT) (IEEE, 2017), pp. 1804\u20131809","DOI":"10.1109\/RTEICT.2017.8256910"},{"key":"9362_CR2","doi-asserted-by":"crossref","unstructured":"Maheshwar, R.C., & Haritha, D. Survey on high performance analytics of bigdata with apache spark, in 2016 International Conference on Advanced Communication Control and Computing Technologies (ICACCCT) (IEEE, 2016), pp. 721\u2013725","DOI":"10.1109\/ICACCCT.2016.7831734"},{"key":"9362_CR3","unstructured":"Al-Barznji, K., & Atanassov, A. (2018). Big Data Sentiment Analysis Using Machine Learning Algorithms, in Proceedings of 26th International Symposium\u201d Control of Energy, Industrial and Ecological Systems, Bankia, Bulgaria (2018)"},{"issue":"2","key":"9362_CR4","doi-asserted-by":"publisher","first-page":"49","DOI":"10.1016\/j.bdr.2015.01.005","volume":"2","author":"HV Jagadish","year":"2015","unstructured":"Jagadish, H. V. (2015). Big data and science: Myths and reality. Big Data Research, 2(2), 49.","journal-title":"Big Data Research"},{"key":"9362_CR5","doi-asserted-by":"crossref","unstructured":"Kejela, G., Esteves, R.M., & Rong, C. Predictive analytics of sensor data using distributed machine learning techniques, in 2014 IEEE 6th international conference on cloud computing technology and science (IEEE, 2014), pp. 626\u2013631","DOI":"10.1109\/CloudCom.2014.44"},{"key":"9362_CR6","doi-asserted-by":"publisher","first-page":"350","DOI":"10.1016\/j.neucom.2017.01.026","volume":"237","author":"L Zhou","year":"2017","unstructured":"Zhou, L., Pan, S., Wang, J., & Vasilakos, A. V. (2017). Machine learning on big data: Opportunities and challenges. Neurocomputing, 237, 350.","journal-title":"Neurocomputing"},{"key":"9362_CR7","unstructured":"\u201d. Seagate . https:\/\/www.seagate.com\/nl\/nl\/our-story\/"},{"key":"9362_CR8","doi-asserted-by":"crossref","unstructured":"Assefi, M., Behravesh, E., Liu, G., & Tafti, A.P. Big data machine learning using apache spark MLlib, in 2017 IEEE International Conference on Big Data (Big Data) (IEEE, 2017), pp. 3492\u20133498","DOI":"10.1109\/BigData.2017.8258338"},{"key":"9362_CR9","doi-asserted-by":"publisher","unstructured":"Aziz, K., Zaidouni, D., & Bellafkih, M. Real-time data analysis using Spark and Hadoop, in 2018 4th International Conference on Optimization and Applications (ICOA) (2018), pp. 1\u20136. https:\/\/doi.org\/10.1109\/ICOA.2018.8370593","DOI":"10.1109\/ICOA.2018.8370593"},{"key":"9362_CR10","unstructured":"Shoro, A. G & Soomro, T. R. (2015). \u201cBig data analysis: Apache spark perspective\u201d, Global Journal of Computer Science and Technology, 15(1)."},{"key":"9362_CR11","doi-asserted-by":"publisher","unstructured":"Armbrust, M., Das, T., Torres, J., Yavuz, B., Zhu, S., Xin, R., Ghodsi, A., Stoica, I., Zaharia, M. (2018). Structured Streaming: A Declarative API for Real-Time Applications in Apache Spark, in Proceedings of the 2018 International Conference on Management of Data (2018), SIGMOD \u201918, p. 601\u2013613. https:\/\/doi.org\/10.1145\/3183713.3190664","DOI":"10.1145\/3183713.3190664"},{"key":"9362_CR12","doi-asserted-by":"publisher","first-page":"7776","DOI":"10.1109\/ACCESS.2017.2696365","volume":"5","author":"A L\u2019heureux","year":"2017","unstructured":"L\u2019heureux, A., Grolinger, K., Elyamany, H. F., & Capretz, M. A. (2017). Machine learning with big data: Challenges and approaches. IEEE Access, 5, 7776.","journal-title":"IEEE Access"},{"key":"9362_CR13","doi-asserted-by":"publisher","first-page":"121","DOI":"10.1016\/j.procs.2015.07.286","volume":"53","author":"JL Reyes-Ortiz","year":"2015","unstructured":"Reyes-Ortiz, J. L., Oneto, L., & Anguita, D. (2015). Big data analytics in the cloud: Spark on hadoop vs mpi\/openmp on beowulf. Procedia Computer Science, 53, 121.","journal-title":"Procedia Computer Science"},{"issue":"6","key":"9362_CR14","first-page":"195","volume":"4","author":"P Dahiya","year":"2017","unstructured":"Dahiya, P., Chaitra, B., & Kumari, U. (2017). Survey on big data using Apache Hadoop and Spark. International Journal of Computer Engineering In Research Trends, 4(6), 195.","journal-title":"International Journal of Computer Engineering In Research Trends"},{"key":"9362_CR15","unstructured":"Bhat, H. S., Madushani, R., & Rawat, S. (2016). Scalable SDE filtering and inference with Apache Spark, in Workshop on Big Data, Streams and Heterogeneous Source Mining: Algorithms (pp. 18\u201334). Systems: Programming Models and Applications (PMLR."},{"key":"9362_CR16","doi-asserted-by":"crossref","unstructured":"Archenaa, J., & Anita, E.M. Interactive big data management in healthcare using spark, in Proceedings of the 3rd International Symposium on Big Data and Cloud Computing Challenges (ISBCC\u201316\u2019) (Springer, 2016), pp. 265\u2013272","DOI":"10.1007\/978-3-319-30348-2_21"},{"key":"9362_CR17","first-page":"1","volume":"40","author":"J Ryan","year":"2016","unstructured":"Ryan, J. (2016). Rapidminer for text analytic fundamentals. Text Mining and Visualization: Case Studies Using Open-Source Tools, 40, 1.","journal-title":"Text Mining and Visualization: Case Studies Using Open-Source Tools"},{"key":"9362_CR18","doi-asserted-by":"crossref","unstructured":"Ding, D., Wu, D., & Yu, F. An overview on cloud computing platform spark for Human Genome mining, in 2016 IEEE International Conference on Mechatronics and Automation (IEEE, 2016), pp. 2605\u20132610","DOI":"10.1109\/ICMA.2016.7558977"},{"key":"9362_CR19","doi-asserted-by":"crossref","unstructured":"Qureshi, N. M. F., Siddiqui, I. F., Abbas, A. et al. (2021). Stream-based authentication strategy using iot sensor data in multi-homing sub-aqueous big data network. Wireless Personal Communications, 116, 1217\u20131229.","DOI":"10.1007\/s11277-020-07215-3"},{"key":"9362_CR20","doi-asserted-by":"crossref","unstructured":"Park, W., Siddiqui, I. F., Chakraborty, C., Qureshi, N. M. F., & Shin, D. R. (2022). Scarcity-aware spam detection technique for big data ecosystem. Pattern Recognition Letters, 157, 67\u201375.","DOI":"10.1016\/j.patrec.2022.03.021"},{"key":"9362_CR21","unstructured":"Jungermann, F. Information extraction with rapidminer, in Proceedings of the GSCL Symposium\u2019Sprachtechnologie und eHumanities (Citeseer, 2009), pp. 50\u201361"},{"key":"9362_CR22","doi-asserted-by":"publisher","unstructured":"G.M. D\u2019silva, A.\u00a0Khan, Gaurav, S.\u00a0Bari, Real-time processing of IoT events with historic data using Apache Kafka and Apache Spark with dashing framework, in 2017 2nd IEEE International Conference on Recent Trends in Electronics, Information Communication Technology (RTEICT) (2017), pp. 1804\u20131809. https:\/\/doi.org\/10.1109\/RTEICT.2017.8256910","DOI":"10.1109\/RTEICT.2017.8256910"},{"key":"9362_CR23","doi-asserted-by":"publisher","unstructured":"Maheshwar, R.C., & Haritha, D. (2016). Survey on high performance analytics of bigdata with apache spark, in 2016 International Conference on Advanced Communication Control and Computing Technologies (ICACCCT) , pp. 721\u2013725. https:\/\/doi.org\/10.1109\/ICACCCT.2016.7831734","DOI":"10.1109\/ICACCCT.2016.7831734"},{"key":"9362_CR24","unstructured":"Tang, S., He, B., Yu, C., Li, Y., & Li, K. (2018). A survey on spark ecosystem for big data processing, arXiv preprint arXiv:1811.08834"},{"issue":"3","key":"9362_CR25","first-page":"93","volume":"4","author":"VS Jonnalagadda","year":"2016","unstructured":"Jonnalagadda, V. S., Srikanth, P., Thumati, K., & Nallamala, S. H. (2016). A review study of apache spark in big data processing. International Journal of Computer Science Trends and Technology (IJCST), 4(3), 93.","journal-title":"International Journal of Computer Science Trends and Technology (IJCST)"},{"issue":"11","key":"9362_CR26","doi-asserted-by":"publisher","first-page":"56","DOI":"10.1145\/2934664","volume":"59","author":"M Zaharia","year":"2016","unstructured":"Zaharia, M., Xin, R. S., Wendell, P., Das, T., Armbrust, M., Dave, A., et al. (2016). Apache spark: A unified engine for big data processing. Communications of the ACM, 59(11), 56.","journal-title":"Communications of the ACM"},{"key":"9362_CR27","doi-asserted-by":"crossref","unstructured":"Athmaja, S., Hanumanthappa, M., & Kavitha, V. A survey of machine learning algorithms for big data analytics, in 2017 International Conference on Innovations in Information, Embedded and Communication Systems (ICIIECS) (IEEE, 2017), pp. 1\u20134","DOI":"10.1109\/ICIIECS.2017.8276028"},{"key":"9362_CR28","doi-asserted-by":"crossref","unstructured":"Venkataraman, S., Panda, A., Ousterhout, K., Armbrust, M., Ghodsi, A., Franklin, M.J., Recht, B., & Stoica, I. (2017). Drizzle: Fast and adaptable stream processing at scale, in Proceedings of the 26th Symposium on Operating Systems Principles , pp. 374\u2013389","DOI":"10.1145\/3132747.3132750"},{"key":"9362_CR29","doi-asserted-by":"publisher","first-page":"183","DOI":"10.1016\/j.procs.2018.10.166","volume":"141","author":"S Al-Saqqa","year":"2018","unstructured":"Al-Saqqa, S., Al-Naymat, G., & Awajan, A. (2018). A large-scale sentiment data classification for online reviews under apache spark. Procedia Computer Science, 141, 183.","journal-title":"Procedia Computer Science"},{"key":"9362_CR30","doi-asserted-by":"publisher","first-page":"70","DOI":"10.1016\/j.cosrev.2015.05.002","volume":"17","author":"CK Emani","year":"2015","unstructured":"Emani, C. K., Cullot, N., & Nicolle, C. (2015). Understandable big data: A survey. Computer Science Review, 17, 70.","journal-title":"Computer Science Review"},{"issue":"1","key":"9362_CR31","doi-asserted-by":"publisher","first-page":"7","DOI":"10.24017\/science.2019.1.2","volume":"4","author":"HK Omar","year":"2019","unstructured":"Omar, H. K., & Jumaa, A. K. (2019). Big Data Analysis Using Apache Spark MLlib and Hadoop HDFS with scala and java. Kurdistan Journal of Applied Research, 4(1), 7.","journal-title":"Kurdistan Journal of Applied Research"},{"key":"9362_CR32","doi-asserted-by":"crossref","unstructured":"Hafez, M.M., Shehab, M.E., El\u00a0Fakharany, & E., et\u00a0al. Effective selection of machine learning algorithms for big data analytics using apache spark, in International Conference on Advanced Intelligent Systems and Informatics (Springer, 2016), pp. 692\u2013704","DOI":"10.1007\/978-3-319-48308-5_66"},{"key":"9362_CR33","doi-asserted-by":"crossref","unstructured":"Qureshi, N.M.F., Bashir, A.K., Siddiqui, I.F., Abbas, A., Choi, K., & Shin, D.R. A knowledge-based path optimization technique for cognitive nodes in smart grid, in 2018 IEEE global communications conference (GLOBECOM) (IEEE, 2018), pp. 1\u20136","DOI":"10.1109\/GLOCOM.2018.8648016"},{"issue":"1","key":"9362_CR34","doi-asserted-by":"publisher","first-page":"179","DOI":"10.1007\/s11277-019-06264-7","volume":"106","author":"IF Siddiqui","year":"2019","unstructured":"Siddiqui, I. F., Qureshi, N. M. F., Chowdhry, B. S., & Uqaili, M. A. (2019). Edge-node-aware adaptive data processing framework for smart grid. Wireless Personal Communications, 106(1), 179.","journal-title":"Wireless Personal Communications"},{"key":"9362_CR35","doi-asserted-by":"crossref","unstructured":"Qureshi, N.M.F., Siddiqui, I.F., Abbas, A., Bashir, A.K., Choi, K., Kim, J., & Shin, D.R. Dynamic container-based resource management framework of spark ecosystem, in 2019 21st international conference on advanced communication technology (ICACT) (IEEE, 2019), pp. 522\u2013526","DOI":"10.23919\/ICACT.2019.8701970"},{"key":"9362_CR36","unstructured":"pyspark.mllib package \u2013 PySpark 2.0.0 documentation. https:\/\/spark.apache.org\/docs\/2.0.0\/api\/python\/pyspark.mllib.html"},{"issue":"3","key":"9362_CR37","doi-asserted-by":"publisher","first-page":"1495","DOI":"10.1007\/s11277-020-07312-3","volume":"113","author":"IF Siddiqui","year":"2020","unstructured":"Siddiqui, I. F., Qureshi, N. M. F., Chowdhry, B. S., & Uqaili, M. A. (2020). Pseudo-cache-based IoT small files management framework in HDFS cluster. Wireless Personal Communications, 113(3), 1495.","journal-title":"Wireless Personal Communications"},{"issue":"1","key":"9362_CR38","first-page":"1235","volume":"17","author":"X Meng","year":"2016","unstructured":"Meng, X., Bradley, J., Yavuz, B., Sparks, E., Venkataraman, S., Liu, D., Freeman, J., Tsai, D., Amde, M., Owen, S., et al. (2016). Mllib: Machine learning in apache spark. The Journal of Machine Learning Research, 17(1), 1235.","journal-title":"The Journal of Machine Learning Research"},{"key":"9362_CR39","doi-asserted-by":"crossref","unstructured":"Park, W. H., Shin, D. R. & Qureshi, N. M. F. (2021). Effective emotion recognition technique in NLP task over nonlinear big data cluster. Wireless Communications and Mobile Computing, 2021, 5840759.","DOI":"10.1155\/2021\/5840759"},{"key":"9362_CR40","doi-asserted-by":"crossref","unstructured":"Lee, M.S., Kim, E., Nam, C.S., & Shin, D.R. Design of educational big data application using spark, in 2017 19th International Conference on Advanced Communication Technology (ICACT) (IEEE, 2017), pp. 355\u2013357","DOI":"10.23919\/ICACT.2017.7890112"},{"issue":"9","key":"9362_CR41","doi-asserted-by":"publisher","first-page":"e0162721","DOI":"10.1371\/journal.pone.0162721","volume":"11","author":"Z Ye","year":"2016","unstructured":"Ye, Z., Tafti, A. P., He, K. Y., Wang, K., & He, M. M. (2016). Sparktext: Biomedical text mining on big data framework. PloS One, 11(9), e0162721.","journal-title":"PloS One"},{"key":"9362_CR42","doi-asserted-by":"crossref","unstructured":"Tafti, A.P., Behravesh, E., Assefi, M., LaRose, E., Badger, J., & Mayer, J. A.\u00a0Doan, D.\u00a0Page, P.\u00a0Peissig, bigNN: An open-source big data toolkit focused on biomedical sentence classification, in 2017 IEEE International Conference on Big Data (Big Data) (IEEE, 2017), pp. 3888\u20133896","DOI":"10.1109\/BigData.2017.8258394"},{"key":"9362_CR43","unstructured":"RapidMiner Best Data Science and Machine Learning Platform. https:\/\/rapidminer.com\/"},{"key":"9362_CR44","doi-asserted-by":"crossref","unstructured":"Qureshi, N. M. F., Shin, D. R., Siddiqui, I. F. & Chowdhry, B. S. (2017). Storage-tag-aware scheduler for hadoop cluster. IEEE Access, 5,, 13742\u201313755.","DOI":"10.1109\/ACCESS.2017.2725318"},{"key":"9362_CR45","doi-asserted-by":"crossref","unstructured":"Siddiqui, I. F., Qureshi, N. M. F., Shaikh, M. A., Chowdhry, B. S., Abbas, A., Bashir, A. K. & Lee, S. U. J. (2019). Stuck-at fault analytics of IoT devices using knowledge-based data processing strategy in smart grid. Wireless Personal Communications, 106(4), 1969\u20131983.","DOI":"10.1007\/s11277-018-5739-9"},{"key":"9362_CR46","unstructured":"Prekopcsak, Z., Makrai, G., Henk, T., & Gaspar-Papanek, C. Radoop: Analyzing big data with rapidminer and hadoop, in Proceedings of the 2nd RapidMiner community meeting and conference (RCOMM 2011) (Citeseer, 2011), pp. 1\u201312"},{"key":"9362_CR47","doi-asserted-by":"crossref","unstructured":"Wagan, S. A., Junaid, M., Qureshi, N. M. F., Shin, D. R. & Choi, K. (2020). Comparative survey on big data security applications, A blink on interactive security mechanism in apache ozone. In 2020 Global Conference on Wireless and Optical Technologies (GCWOT) (pp. 1\u20136). IEEE.","DOI":"10.1109\/GCWOT49901.2020.9391610"},{"issue":"3","key":"9362_CR48","first-page":"547","volume":"14","author":"JM Jo","year":"2019","unstructured":"Jo, J. M. (2019). Effectiveness of normalization pre-processing of big data to the machine learning performance. The Journal of the Korea institute of electronic communication sciences, 14(3), 547.","journal-title":"The Journal of the Korea institute of electronic communication sciences"},{"key":"9362_CR49","unstructured":"\u201d. scikit-learn: machine learning in python \u2013 scikit-learn 0.24.2 documentation. https:\/\/scikit-learn.org"},{"key":"9362_CR50","doi-asserted-by":"crossref","unstructured":"Qureshi, N. M. F., Farah, I., Siddiqui, B. S. C. & Shin, D. R. (2022). Intelligent MapReduce technique for energy harvesting through IoT devices. Energy Harvesting in Wireless Sensor Networks and Internet of Things, p.259.","DOI":"10.1049\/PBCE124E_ch11"},{"key":"9362_CR51","unstructured":"Chary, D. (2020). Review on Advanced Machine Learning Model: Scikit-Learn"},{"key":"9362_CR52","doi-asserted-by":"crossref","unstructured":"Qureshi, N. M. F., Siddiqui, I. F., Unar, M. A., Uqaili, M. A., Nam, C. S., Shin, D. R., Kim, J., Bashir, A. K. & Abbas, A. (2019). An aggregate mapreduce data block placement strategy for wireless IoT edge nodes in smart grid. Wireless personal communications, 106(4), 2225\u20132236.","DOI":"10.1007\/s11277-018-5936-6"},{"key":"9362_CR53","doi-asserted-by":"crossref","unstructured":"Park, W., Qureshi, N. M. F. & Shin, D. R. (2022). Pseudo NLP joint spam classification technique for big data cluster. Computers, Materials and Continua, 71(1), 517\u2013535.","DOI":"10.32604\/cmc.2022.021421"},{"issue":"2","key":"9362_CR54","doi-asserted-by":"publisher","first-page":"205979912110104","DOI":"10.1177\/20597991211010416","volume":"14","author":"E Fournier-Tombs","year":"2021","unstructured":"Fournier-Tombs, E., & MacKenzie, M. K. (2021). Big data and democratic speech: Predicting deliberative quality using machine learning techniques. Methodological Innovations, 14(2), 20597991211010416.","journal-title":"Methodological Innovations"},{"key":"9362_CR55","doi-asserted-by":"crossref","unstructured":"Erg\u00fcn, B., & \u015eahin, C. Laser point cloud segmentation in MATLAB, in MATLAB (IntechOpen, 2021)","DOI":"10.5772\/intechopen.95249"},{"key":"9362_CR56","volume-title":"Matlab","author":"S Matlab","year":"2012","unstructured":"Junaid, M., Wagan, S. A., Qureshi, N. M. F., Nam, C. S. and Shin, D. R. (2020). Big data predictive analytics for apache spark using machine learning. In 2020 Global Conference on Wireless and Optical Technologies (GCWOT) (pp. 1\u20137). IEEE."},{"key":"9362_CR57","unstructured":"Ozgur, C. (2021). MatLab vs. Python vs. R | Journal of Data Science | School of Statistics, Renmin University of China . https:\/\/jds-online.org\/journal\/JDS\/article\/402\/info"},{"key":"9362_CR58","doi-asserted-by":"crossref","unstructured":"Kamangar, Z. U., Siddiqui, I. F., Arain, Q. A., Kamangar, U. A. & Qureshi, N. M. F. (2021). Personality characteristic-based enhanced software testing levels for crowd outsourcing environment. KSII Transactions on Internet and Information Systems (TIIS), 15(8), 2974\u20132992.","DOI":"10.3837\/tiis.2021.08.015"},{"issue":"7","key":"9362_CR59","first-page":"190","volume":"4","author":"RRV Mohit","year":"2015","unstructured":"Mohit, R. R. V., Katoch, S., Vanjare, A., & Omkar, S. (2015). Classification of complex UCI datasets using machine learning algorithms using hadoop. International Journal of Computer Science and Software Engineering (IJCSSE), 4(7), 190.","journal-title":"International Journal of Computer Science and Software Engineering (IJCSSE)"},{"key":"9362_CR60","doi-asserted-by":"publisher","unstructured":"Peng, H., Liang, D., & Choi, C. (2013).Evaluating parallel logistic regression models, in 2013 IEEE International Conference on Big Data , pp. 119\u2013126. https:\/\/doi.org\/10.1109\/BigData.2013.6691743","DOI":"10.1109\/BigData.2013.6691743"},{"key":"9362_CR61","unstructured":"Duan, R., Ning, Y., Shi, J., Carroll, R.J., Cai, T., & Chen, Y. (2021). On the global identifiability of logistic regression models with misclassified outcomes, arXiv preprint arXiv:2103.12846"},{"key":"9362_CR62","doi-asserted-by":"crossref","unstructured":"Abarda, A., Bentaleb, Y., El\u00a0Moudden, M., Dakkon, M., Azhari, M., Zerouaoui, J., Ettaki, B. (2018). Solving the problem of latent class selection, in Proceedings of the International Conference on Learning and Optimization Algorithms: Theory and Applications (2018), pp. 1\u20136","DOI":"10.1145\/3230905.3230943"},{"issue":"01","key":"9362_CR63","doi-asserted-by":"publisher","first-page":"20","DOI":"10.38094\/jastt20165","volume":"2","author":"B Charbuty","year":"2021","unstructured":"Charbuty, B., & Abdulazeez, A. (2021). Classification based on decision tree algorithm for machine learning. Journal of Applied Science and Technology Trends, 2(01), 20.","journal-title":"Journal of Applied Science and Technology Trends"},{"key":"9362_CR64","doi-asserted-by":"crossref","unstructured":"Sajja, V.R., Lakshmi, P.J., Naik, D.B., Kalluri, H.K. Student Performance Monitoring System Using Decision Tree Classifier, in Machine Intelligence and Soft Computing (Springer, 2021), pp. 393\u2013407","DOI":"10.1007\/978-981-15-9516-5_33"},{"key":"9362_CR65","doi-asserted-by":"publisher","first-page":"1096","DOI":"10.1016\/j.procs.2020.03.062","volume":"170","author":"M Azhari","year":"2020","unstructured":"Azhari, M., Abarda, A., Alaoui, A., Ettaki, B., & Zerouaoui, J. (2020). Detection of pulsar candidates using bagging method. Procedia Computer Science, 170, 1096.","journal-title":"Procedia Computer Science"},{"key":"9362_CR66","doi-asserted-by":"crossref","unstructured":"Azhari, M., Alaoui, A., Abarda, A., Ettaki, B., & Zerouaoui, J. A comparison of random forest methods for solving the problem of pulsar search, in The Proceedings of the Third International Conference on Smart City Applications (Springer, 2019), pp. 796\u2013807","DOI":"10.1007\/978-3-030-37629-1_57"},{"key":"9362_CR67","doi-asserted-by":"publisher","first-page":"43","DOI":"10.1016\/j.jclinepi.2020.12.018","volume":"133","author":"TE Cowling","year":"2021","unstructured":"Cowling, T. E., Cromwell, D. A., Bellot, A., Sharples, L. D., & van der Meulen, J. (2021). Logistic regression and machine learning predicted patient mortality from large sets of diagnosis codes comparably. Journal of Clinical Epidemiology, 133, 43.","journal-title":"Journal of Clinical Epidemiology"},{"issue":"4","key":"9362_CR68","doi-asserted-by":"publisher","first-page":"367","DOI":"10.1016\/S0167-9473(01)00065-2","volume":"38","author":"JH Friedman","year":"2002","unstructured":"Friedman, J. H. (2002). Stochastic gradient boosting. Computational statistics & Data Analysis, 38(4), 367.","journal-title":"Computational statistics & Data Analysis"},{"key":"9362_CR69","unstructured":"UCI machine learning repository: Bank marketing data set. https:\/\/archive.ics.uci.edu\/ml\/datasets\/bank+marketing"},{"key":"9362_CR70","doi-asserted-by":"publisher","first-page":"114463","DOI":"10.1016\/j.eswa.2020.114463","volume":"169","author":"VA Fajardo","year":"2021","unstructured":"Fajardo, V. A., Findlay, D., Jaiswal, C., Yin, X., Houmanfar, R., Xie, H., Liang, J., She, X., & Emerson, D. (2021). On oversampling imbalanced data with deep conditional generative models. Expert Systems with Applications, 169, 114463.","journal-title":"Expert Systems with Applications"},{"issue":"2","key":"9362_CR71","doi-asserted-by":"publisher","first-page":"194","DOI":"10.3390\/sym13020194","volume":"13","author":"Z Jiang","year":"2021","unstructured":"Jiang, Z., Pan, T., Zhang, C., & Yang, J. (2021). A new oversampling method based on the classification contribution degree. Symmetry, 13(2), 194.","journal-title":"Symmetry"}],"updated-by":[{"DOI":"10.1007\/s11277-022-10112-6","type":"correction","label":"Correction","source":"publisher","updated":{"date-parts":[[2022,11,3]],"date-time":"2022-11-03T00:00:00Z","timestamp":1667433600000}}],"container-title":["Wireless Personal Communications"],"original-title":[],"language":"en","link":[{"URL":"https:\/\/link.springer.com\/content\/pdf\/10.1007\/s11277-021-09362-7.pdf","content-type":"application\/pdf","content-version":"vor","intended-application":"text-mining"},{"URL":"https:\/\/link.springer.com\/article\/10.1007\/s11277-021-09362-7\/fulltext.html","content-type":"text\/html","content-version":"vor","intended-application":"text-mining"},{"URL":"https:\/\/link.springer.com\/content\/pdf\/10.1007\/s11277-021-09362-7.pdf","content-type":"application\/pdf","content-version":"vor","intended-application":"similarity-checking"}],"deposited":{"date-parts":[[2025,4,9]],"date-time":"2025-04-09T13:19:48Z","timestamp":1744204788000},"score":1,"resource":{"primary":{"URL":"https:\/\/link.springer.com\/10.1007\/s11277-021-09362-7"}},"subtitle":[],"short-title":[],"issued":{"date-parts":[[2022,8,23]]},"references-count":71,"journal-issue":{"issue":"3","published-print":{"date-parts":[[2022,10]]}},"alternative-id":["9362"],"URL":"https:\/\/doi.org\/10.1007\/s11277-021-09362-7","relation":{"correction":[{"id-type":"doi","id":"10.1007\/s11277-022-10112-6","asserted-by":"object"}]},"ISSN":["0929-6212","1572-834X"],"issn-type":[{"value":"0929-6212","type":"print"},{"value":"1572-834X","type":"electronic"}],"subject":[],"published":{"date-parts":[[2022,8,23]]},"assertion":[{"value":"4 November 2021","order":1,"name":"accepted","label":"Accepted","group":{"name":"ArticleHistory","label":"Article History"}},{"value":"23 August 2022","order":2,"name":"first_online","label":"First Online","group":{"name":"ArticleHistory","label":"Article History"}},{"value":"3 November 2022","order":3,"name":"change_date","label":"Change Date","group":{"name":"ArticleHistory","label":"Article History"}},{"value":"Correction","order":4,"name":"change_type","label":"Change Type","group":{"name":"ArticleHistory","label":"Article History"}},{"value":"A Correction to this paper has been published:","order":5,"name":"change_details","label":"Change Details","group":{"name":"ArticleHistory","label":"Article History"}},{"value":"https:\/\/doi.org\/10.1007\/s11277-022-10112-6","URL":"https:\/\/doi.org\/10.1007\/s11277-022-10112-6","order":6,"name":"change_details","label":"Change Details","group":{"name":"ArticleHistory","label":"Article History"}}]}}