{"status":"ok","message-type":"work","message-version":"1.0.0","message":{"indexed":{"date-parts":[[2026,4,28]],"date-time":"2026-04-28T13:31:28Z","timestamp":1777383088703,"version":"3.51.4"},"publisher-location":"Cham","reference-count":34,"publisher":"Springer Nature Switzerland","isbn-type":[{"value":"9783031884825","type":"print"},{"value":"9783031884832","type":"electronic"}],"license":[{"start":{"date-parts":[[2025,1,1]],"date-time":"2025-01-01T00:00:00Z","timestamp":1735689600000},"content-version":"tdm","delay-in-days":0,"URL":"https:\/\/www.springernature.com\/gp\/researchers\/text-and-data-mining"},{"start":{"date-parts":[[2025,1,1]],"date-time":"2025-01-01T00:00:00Z","timestamp":1735689600000},"content-version":"vor","delay-in-days":0,"URL":"https:\/\/www.springernature.com\/gp\/researchers\/text-and-data-mining"}],"content-domain":{"domain":["link.springer.com"],"crossmark-restriction":false},"short-container-title":[],"published-print":{"date-parts":[[2025]]},"DOI":"10.1007\/978-3-031-88483-2_11","type":"book-chapter","created":{"date-parts":[[2025,4,25]],"date-time":"2025-04-25T02:37:11Z","timestamp":1745548631000},"page":"206-219","update-policy":"https:\/\/doi.org\/10.1007\/springer_crossmark_policy","source":"Crossref","is-referenced-by-count":6,"title":["A Systematic Approach to\u00a0Data Normalization and\u00a0Standardization in\u00a0Machine Learning Problems"],"prefix":"10.1007","author":[{"ORCID":"https:\/\/orcid.org\/0000-0001-8359-2045","authenticated-orcid":false,"given":"Irina","family":"Kalinina","sequence":"first","affiliation":[]},{"ORCID":"https:\/\/orcid.org\/0000-0002-3517-580X","authenticated-orcid":false,"given":"Aleksandr","family":"Gozhyj","sequence":"additional","affiliation":[]},{"ORCID":"https:\/\/orcid.org\/0000-0002-7421-3565","authenticated-orcid":false,"given":"Peter","family":"Bidyuk","sequence":"additional","affiliation":[]},{"ORCID":"https:\/\/orcid.org\/0000-0002-5341-0973","authenticated-orcid":false,"given":"Victor","family":"Gozhyi","sequence":"additional","affiliation":[]},{"ORCID":"https:\/\/orcid.org\/0000-0001-8049-4730","authenticated-orcid":false,"given":"Maksym","family":"Korobchynskyi","sequence":"additional","affiliation":[]},{"ORCID":"https:\/\/orcid.org\/0000-0002-7396-6442","authenticated-orcid":false,"given":"Vasiliy","family":"Nadraga","sequence":"additional","affiliation":[]}],"member":"297","published-online":{"date-parts":[[2025,4,26]]},"reference":[{"key":"11_CR1","unstructured":"The box-cox and yeo-johnson transformations for continuous variables (2021). https:\/\/statisticaloddsandends.wordpress.com\/2021\/02\/19\/the-box-cox-and-yeo-johnson-transformations-for-continuous-variables\/"},{"issue":"5","key":"11_CR2","doi-asserted-by":"publisher","first-page":"563","DOI":"10.1016\/S0167-8655(00)00112-4","volume":"22","author":"S Aksoy","year":"2001","unstructured":"Aksoy, S., Haralick, R.: Feature normalization and likelihood-based similarity measures for image retrieval. Pattern Recogn. Lett. 22(5), 563\u2013582 (2001). https:\/\/doi.org\/10.1016\/S0167-8655(00)00112-4","journal-title":"Pattern Recogn. Lett."},{"issue":"268","key":"11_CR3","doi-asserted-by":"publisher","first-page":"765","DOI":"10.2307\/2281537","volume":"49","author":"T Anderson","year":"1954","unstructured":"Anderson, T., Darling, D.: A test of goodness-of-fit. J. American Stat. 49(268), 765\u2013769 (1954). https:\/\/doi.org\/10.2307\/2281537","journal-title":"J. American Stat."},{"key":"11_CR4","doi-asserted-by":"crossref","unstructured":"Babichev, S., Lytvynenko, V., Skvor, J., Fiser, J.: Model of the objective clustering inductive technology of gene expression profiles based on sota and dbscan clustering algorithms. Adv. Intell. Syst. Comput. 689 (2018)","DOI":"10.1007\/978-3-319-70581-1_2"},{"key":"11_CR5","doi-asserted-by":"crossref","unstructured":"Babichev, S., Osypenko, V., Lytvynenko, V., Voronenko, M., Korobchynskyi, M.: Comparison analysis of biclustering algorithms with the use of artificial data and gene expression profiles. In: IEEE 38th International Conference on Electronics and Nanotechnology. ELNANO 2018 \u2013 Proceedings 689 (2018)","DOI":"10.1109\/ELNANO.2018.8477439"},{"key":"11_CR6","doi-asserted-by":"publisher","first-page":"390","DOI":"10.1016\/j.neucom.2016.08.081","volume":"218","author":"M Bicego","year":"2016","unstructured":"Bicego, M., Baldo, S.: Properties of the box-cox transformation for pattern classification. Neurocomputing 218, 390\u2013400 (2016). https:\/\/doi.org\/10.1016\/j.neucom.2016.08.081","journal-title":"Neurocomputing"},{"key":"11_CR7","unstructured":"Bidyuk, P., Kalinina, I., Zhebko, O., Gozhyj, A., Hannichenko, T.: Classification system based on ensemble methods for solving machine learning tasks. CEUR\u2013WS 3426 (2023)"},{"key":"11_CR8","unstructured":"Bruce, P., Bruce, A., Gedeck, P.: Practical Statistics for Data Scientists: 50+ Essential Concepts Using R and Python, p.\u00a0368. O\u2019Reilly Media (2020)"},{"key":"11_CR9","doi-asserted-by":"publisher","first-page":"996","DOI":"10.1198\/106186004X12632","volume":"13","author":"G Brys","year":"2004","unstructured":"Brys, G., Hubert, M., Struyf, A.: A robust measure of skewness. J. Comput. Graph. Stat. 13, 996\u20131017 (2004). https:\/\/doi.org\/10.1198\/106186004X12632","journal-title":"J. Comput. Graph. Stat."},{"issue":"3","key":"11_CR10","doi-asserted-by":"publisher","first-page":"249","DOI":"10.1016\/S0167-9473(99)00057-2","volume":"33","author":"K Carling","year":"2000","unstructured":"Carling, K.: Resistant outlier rules and the non-gaussian case. Comput. Stat. Data Anal. 33(3), 249\u2013258 (2000). https:\/\/doi.org\/10.1016\/S0167-9473(99)00057-2","journal-title":"Comput. Stat. Data Anal."},{"key":"11_CR11","unstructured":"Cortez, P., Cerdeira, A., Almeida, F., Matos, T., Reis, J.: Wine quality datasets (2009). http:\/\/www3.dsi.uminho.pt\/pcortez\/wine\/"},{"key":"11_CR12","first-page":"398","volume-title":"The Theory of Stochastic Process","author":"D Cox","year":"1965","unstructured":"Cox, D., Miller, H.: The Theory of Stochastic Process, p. 398. Chapman and Hall, London (1965)"},{"key":"11_CR13","doi-asserted-by":"crossref","unstructured":"Flach, P.: Machine Learning: The Art and Science of Algorithms That Make Sense of Data, p.\u00a0416. Cambridge University Press (2012)","DOI":"10.1017\/CBO9780511973000"},{"issue":"12","key":"11_CR14","doi-asserted-by":"publisher","first-page":"5186","DOI":"10.1016\/j.csda.2007.11.008","volume":"52","author":"M Hubert","year":"2008","unstructured":"Hubert, M., Vandervieren, E.: An adjusted boxplot for skewed distributions. Comput. Stat. Data Anal. 52(12), 5186\u20135201 (2008). https:\/\/doi.org\/10.1016\/j.csda.2007.11.008","journal-title":"Comput. Stat. Data Anal."},{"key":"11_CR15","doi-asserted-by":"publisher","unstructured":"Ioffe, S., Szegedy, C.: Batch normalization: accelerating deep network training by reducing internal covariate shift. In: 32nd International Conference on Machine Learning, Lille, France vol. 37, pp. 448\u2013456 (2015). https:\/\/doi.org\/10.1016\/j.procs.2020.09.259","DOI":"10.1016\/j.procs.2020.09.259"},{"key":"11_CR16","unstructured":"Kabacoff, R.: R in action. Data analysis and graphics with R and Tidyverse, p.\u00a0656. Manning Publications Co (2022)"},{"key":"11_CR17","unstructured":"Kalinina, I., Bidyuk, P., Gozhyj, A., Malchenko, P.: Combining forecasts based on time series models in machine learning tasks. CEUR\u2013WS 3426 (2023)"},{"key":"11_CR18","doi-asserted-by":"publisher","first-page":"105","DOI":"10.1007\/978-3-031-16203-9_7","volume":"149","author":"I Kalinina","year":"2023","unstructured":"Kalinina, I., Gozhyj, A.: Methodology for solving forecasting problems based on machine learning methods. Lecture Notes on Data Engineering and Communications Technologies (Switzeland) 149, 105\u2013125 (2023)","journal-title":"Lecture Notes on Data Engineering and Communications Technologies (Switzeland)"},{"key":"11_CR19","doi-asserted-by":"publisher","first-page":"21","DOI":"10.2307\/2347808","volume":"39","author":"A Kimber","year":"1990","unstructured":"Kimber, A.: Exploratory data analysis for possibly censored data from skewed distributions. Appl. Stat. 39, 21\u201330 (1990). https:\/\/doi.org\/10.2307\/2347808","journal-title":"Appl. Stat."},{"key":"11_CR20","unstructured":"Lantz, B.: Machine Learning with R. Learn how to use R to apply powerful machine learning methods and gain an insight into real-world applications, p.\u00a0396. Packt Publishing (2013)"},{"key":"11_CR21","unstructured":"Malato, G.: An introduction to the shapiro-wilk test for normality (2023). https:\/\/builtin.com\/data-science\/shapiro-wilk-test"},{"key":"11_CR22","unstructured":"Manish: Different normalization methods (2022). https:\/\/medium.com\/@mkc940\/different-normalization-methods-a1be71fe9f1#:~:text=Linear%20normalization%2C%20or%20%E2%80%9CMax%2DMin%E2%80%9D&text=In%20laymen\u2019s%20terms%2C%20it%20consists,set%2C%20and%20establish%20a%20base"},{"key":"11_CR23","doi-asserted-by":"publisher","first-page":"27","DOI":"10.5194\/isprs-archives-XLII-4-W4-27-2017","volume":"42","author":"A Naeini","year":"2017","unstructured":"Naeini, A., Babadi, M., Homayouni, S.: Assessment of normalization techniques on the accuracy of hyperspectral data clustering. Int. Arch. Photogramm. Remote. Sens. Spat. Inf. Sci. 42, 27\u201330 (2017). https:\/\/doi.org\/10.5194\/isprs-archives-XLII-4-W4-27-2017","journal-title":"Int. Arch. Photogramm. Remote. Sens. Spat. Inf. Sci."},{"key":"11_CR24","first-page":"257","volume":"6","author":"S Nayak","year":"2014","unstructured":"Nayak, S., Misra, B., Behera, H.: Impact of data normalization on stock index forecasting. Int. J. Comput. Inform. Syst. Indust. Manage. Appl. 6, 257\u2013269 (2014)","journal-title":"Int. J. Comput. Inform. Syst. Indust. Manage. Appl."},{"issue":"1","key":"11_CR25","first-page":"21","volume":"2","author":"N Razali","year":"2011","unstructured":"Razali, N., Yap, B.: Power comparisons of shapiro-wilk, kolmogorov-smirnov, lilliefors and anderson-darling tests. J. Stat. Model. Anal. 2(1), 21\u201333 (2011)","journal-title":"J. Stat. Model. Anal."},{"key":"11_CR26","unstructured":"Shitikov, V.K., Mastitsky, S.E.: Classification, regression and other data mining algorithms using r (2017). https:\/\/github.com\/ranalytics\/data-mining"},{"key":"11_CR27","doi-asserted-by":"publisher","DOI":"10.1016\/j.asoc.2019.105524","volume":"97","author":"A Singh","year":"2020","unstructured":"Singh, A.: Investigating the impact of data normalization on classification performance. Appl. Soft Comput. 97, 105524 (2020). https:\/\/doi.org\/10.1016\/j.asoc.2019.105524","journal-title":"Appl. Soft Comput."},{"key":"11_CR28","doi-asserted-by":"publisher","unstructured":"Starovoitov, V., Golub, Y.: Data normalization in machine learning. Informatics 18(3), 83\u201396 (2021). https:\/\/doi.org\/10.37661\/1816-0301-2021-18-3-83-96","DOI":"10.37661\/1816-0301-2021-18-3-83-96"},{"key":"11_CR29","doi-asserted-by":"publisher","unstructured":"Stephens, M.: Tests based on edf statistics. Goodness-of-Fit Techniques, pp. 97\u2013194 (2017). https:\/\/doi.org\/10.1201\/9780203753064-4","DOI":"10.1201\/9780203753064-4"},{"issue":"2684","key":"11_CR30","doi-asserted-by":"publisher","first-page":"677","DOI":"10.1126\/SCIENCE.103.2684.677","volume":"103","author":"S Stevens","year":"1946","unstructured":"Stevens, S.: On the theory of scales of measurement. Science. New Series 103(2684), 677\u2013680 (1946). https:\/\/doi.org\/10.1126\/SCIENCE.103.2684.677","journal-title":"Science. New Series"},{"issue":"1","key":"11_CR31","doi-asserted-by":"publisher","first-page":"65","DOI":"10.1080\/00031305.1993.10475938","volume":"47","author":"P Velleman","year":"1993","unstructured":"Velleman, P., Wilkinson, L.: Nominal, ordinal, interval, and ratio typologies are misleading. Am. Stat. 47(1), 65\u201372 (1993). https:\/\/doi.org\/10.1080\/00031305.1993.10475938","journal-title":"Am. Stat."},{"key":"11_CR32","doi-asserted-by":"publisher","first-page":"2222","DOI":"10.1016\/j.procs.2020.09.259","volume":"176","author":"J Wieckowski","year":"2020","unstructured":"Wieckowski, J., Salabun, W.: How the normalization of the decision matrix influences the results in the vikor method? Proc. Comput. Sci. 176, 2222\u20132231 (2020). https:\/\/doi.org\/10.1016\/j.procs.2020.09.259","journal-title":"Proc. Comput. Sci."},{"issue":"3","key":"11_CR33","doi-asserted-by":"publisher","first-page":"338","DOI":"10.1016\/S0019-9958(65)90241-X","volume":"8","author":"L Zadeh","year":"1965","unstructured":"Zadeh, L.: Fuzzy sets. Inf. Control 8(3), 338\u2013353 (1965)","journal-title":"Inf. Control"},{"key":"11_CR34","doi-asserted-by":"publisher","first-page":"349","DOI":"10.1007\/978-3-642-10677-4-39","volume":"5863","author":"Q Zhang","year":"2009","unstructured":"Zhang, Q., Sun, S.: Weighted data normalization based on eigenvalues for artificial neural network classification. Proc. Int. Conf. Neural Inform. Process. 5863, 349\u2013356 (2009). https:\/\/doi.org\/10.1007\/978-3-642-10677-4-39","journal-title":"Proc. Int. Conf. Neural Inform. Process."}],"container-title":["Lecture Notes on Data Engineering and Communications Technologies","Lecture Notes in Data Engineering, Computational Intelligence, and Decision-Making, Volume 2"],"original-title":[],"language":"en","link":[{"URL":"https:\/\/link.springer.com\/content\/pdf\/10.1007\/978-3-031-88483-2_11","content-type":"unspecified","content-version":"vor","intended-application":"similarity-checking"}],"deposited":{"date-parts":[[2025,4,25]],"date-time":"2025-04-25T02:37:17Z","timestamp":1745548637000},"score":1,"resource":{"primary":{"URL":"https:\/\/link.springer.com\/10.1007\/978-3-031-88483-2_11"}},"subtitle":[],"short-title":[],"issued":{"date-parts":[[2025]]},"ISBN":["9783031884825","9783031884832"],"references-count":34,"URL":"https:\/\/doi.org\/10.1007\/978-3-031-88483-2_11","relation":{},"ISSN":["2367-4512","2367-4520"],"issn-type":[{"value":"2367-4512","type":"print"},{"value":"2367-4520","type":"electronic"}],"subject":[],"published":{"date-parts":[[2025]]},"assertion":[{"value":"26 April 2025","order":1,"name":"first_online","label":"First Online","group":{"name":"ChapterHistory","label":"Chapter History"}},{"value":"ISDMCI","order":1,"name":"conference_acronym","label":"Conference Acronym","group":{"name":"ConferenceInfo","label":"Conference Information"}},{"value":"International Scientific Conference \u201cIntellectual Systems of Decision Making and Problem of Computational Intelligence\u201d","order":2,"name":"conference_name","label":"Conference Name","group":{"name":"ConferenceInfo","label":"Conference Information"}},{"value":"\u00dast\u00ed nad Labem","order":3,"name":"conference_city","label":"Conference City","group":{"name":"ConferenceInfo","label":"Conference Information"}},{"value":"Czech Republic","order":4,"name":"conference_country","label":"Conference Country","group":{"name":"ConferenceInfo","label":"Conference Information"}},{"value":"2024","order":5,"name":"conference_year","label":"Conference Year","group":{"name":"ConferenceInfo","label":"Conference Information"}},{"value":"19 June 2024","order":7,"name":"conference_start_date","label":"Conference Start Date","group":{"name":"ConferenceInfo","label":"Conference Information"}},{"value":"23 June 2024","order":8,"name":"conference_end_date","label":"Conference End Date","group":{"name":"ConferenceInfo","label":"Conference Information"}},{"value":"isdmci2024","order":10,"name":"conference_id","label":"Conference ID","group":{"name":"ConferenceInfo","label":"Conference Information"}},{"value":"http:\/\/www.isdmci.ks.ua\/","order":11,"name":"conference_url","label":"Conference URL","group":{"name":"ConferenceInfo","label":"Conference Information"}}]}}