{"status":"ok","message-type":"work","message-version":"1.0.0","message":{"indexed":{"date-parts":[[2026,6,24]],"date-time":"2026-06-24T17:17:48Z","timestamp":1782321468966,"version":"3.54.5"},"reference-count":49,"publisher":"Springer Science and Business Media LLC","issue":"1","license":[{"start":{"date-parts":[[2025,4,11]],"date-time":"2025-04-11T00:00:00Z","timestamp":1744329600000},"content-version":"tdm","delay-in-days":0,"URL":"https:\/\/creativecommons.org\/licenses\/by-nc-nd\/4.0"},{"start":{"date-parts":[[2025,4,11]],"date-time":"2025-04-11T00:00:00Z","timestamp":1744329600000},"content-version":"vor","delay-in-days":0,"URL":"https:\/\/creativecommons.org\/licenses\/by-nc-nd\/4.0"}],"content-domain":{"domain":["link.springer.com"],"crossmark-restriction":false},"short-container-title":["J Big Data"],"DOI":"10.1186\/s40537-025-01137-2","type":"journal-article","created":{"date-parts":[[2025,4,11]],"date-time":"2025-04-11T15:15:41Z","timestamp":1744384541000},"update-policy":"https:\/\/doi.org\/10.1007\/springer_crossmark_policy","source":"Crossref","is-referenced-by-count":20,"title":["Effective k-nearest neighbor models\u00a0for data classification enhancement"],"prefix":"10.1186","volume":"12","author":[{"given":"Ali A.","family":"Amer","sequence":"first","affiliation":[],"role":[{"vocabulary":"crossref","role":"author"}]},{"given":"Sri Devi","family":"Ravana","sequence":"additional","affiliation":[],"role":[{"vocabulary":"crossref","role":"author"}]},{"given":"Riyaz Ahamed Ariyaluran","family":"Habeeb","sequence":"additional","affiliation":[],"role":[{"vocabulary":"crossref","role":"author"}]}],"member":"297","published-online":{"date-parts":[[2025,4,11]]},"reference":[{"issue":"1","key":"1137_CR1","doi-asserted-by":"publisher","first-page":"113","DOI":"10.1186\/s40537-024-00973-y","volume":"11","author":"RK Halder","year":"2024","unstructured":"Halder RK, Uddin MN, Uddin MA, Aryal S, Khraisat A. Enhancing K-nearest neighbor algorithm: a comprehensive review and performance analysis of modifications. J Big Data. 2024;11(1):113.","journal-title":"J Big Data"},{"issue":"1","key":"1137_CR2","doi-asserted-by":"publisher","first-page":"1","DOI":"10.4018\/IJSWIS.346377","volume":"20","author":"AA Amer","year":"2024","unstructured":"Amer AA, Al-Razgan M, Abdalla HI, Al-Asaly M, Alfakih T, Al-Hammadi M. Neighboring-aware hierarchical clustering: a new algorithm and extensive evaluation. Int J Semant Web Inf Syst (IJSWIS). 2024;20(1):1\u201324.","journal-title":"Int J Semant Web Inf Syst (IJSWIS)"},{"key":"1137_CR3","doi-asserted-by":"publisher","DOI":"10.7717\/peerj-cs.641","volume":"7","author":"HI Abdalla","year":"2021","unstructured":"Abdalla HI, Amer AA. Boolean logic algebra driven similarity measure for text based applications. PeerJ Comput Sci. 2021;7: e641.","journal-title":"PeerJ Comput Sci"},{"key":"1137_CR4","doi-asserted-by":"publisher","DOI":"10.1016\/j.eswa.2022.117159","volume":"201","author":"Y Ma","year":"2022","unstructured":"Ma Y, Huang R, Yan M, Li G, Wang T. Attention-based local mean k-nearest centroid neighbor classifier. Expert Syst Appl. 2022;201: 117159.","journal-title":"Expert Syst Appl"},{"key":"1137_CR5","doi-asserted-by":"crossref","unstructured":"Liu D, Jiang C, Cao Y. Probabilistic Local Mean K-Nearest Neighbors Classification. In 2024 IEEE 3rd International Conference on Electrical Engineering, Big Data and Algorithms (EEBDA) (pp. 1118\u20131123). IEEE.\u200f\u200f\u200f 2024.","DOI":"10.1109\/EEBDA60612.2024.10485665"},{"issue":"3","key":"1137_CR6","doi-asserted-by":"publisher","first-page":"657","DOI":"10.1007\/s41066-021-00288-w","volume":"7","author":"M Mailagaha Kumbure","year":"2022","unstructured":"Mailagaha Kumbure M, Luukka P. A generalized fuzzy k-nearest neighbor regression model based on Minkowski distance. Granular Comput. 2022;7(3):657\u201371.","journal-title":"Granular Comput"},{"issue":"1","key":"1137_CR7","first-page":"8","volume":"1","author":"J Mei","year":"2024","unstructured":"Mei J, Chen J. Application of KNN algorithm in diabetes prediction. Front Interdiscip Appl Sci. 2024;1(1):8\u201315.","journal-title":"Front Interdiscip Appl Sci"},{"issue":"1","key":"1137_CR8","doi-asserted-by":"publisher","first-page":"77","DOI":"10.1186\/s40537-022-00587-2","volume":"9","author":"A Zeidan","year":"2022","unstructured":"Zeidan A, Vo HT. Efficient spatial data partitioning for distributed k NN joins. J Big Data. 2022;9(1):77.","journal-title":"J Big Data"},{"issue":"1","key":"1137_CR9","doi-asserted-by":"publisher","first-page":"43","DOI":"10.1186\/s40537-022-00598-z","volume":"9","author":"F Rezaei","year":"2022","unstructured":"Rezaei F, Abbasitabar M, Mirzaei S, Kamari Direh Z, Ahmadi S, Azizi Z, Danialy D. Improve data classification performance in diagnosing diabetes using the Binary Exchange Market Algorithm. J Big Data. 2022;9(1):43.","journal-title":"J Big Data"},{"issue":"1","key":"1137_CR10","doi-asserted-by":"publisher","first-page":"6256","DOI":"10.1038\/s41598-022-10358-x","volume":"12","author":"S Uddin","year":"2022","unstructured":"Uddin S, Haque I, Lu H, Moni MA, Gide E. Comparative performance analysis of K-nearest neighbour (KNN) algorithm and its different variants for disease prediction. Sci Rep. 2022;12(1):6256.","journal-title":"Sci Rep"},{"key":"1137_CR11","doi-asserted-by":"publisher","DOI":"10.1016\/j.knosys.2021.107604","volume":"235","author":"Y Wang","year":"2022","unstructured":"Wang Y, Pan Z, Dong J. A new two-layer nearest neighbor selection method for kNN classifier. Knowl-Based Syst. 2022;235: 107604.","journal-title":"Knowl-Based Syst"},{"key":"1137_CR12","doi-asserted-by":"crossref","unstructured":"Khandelwal M, Rout RK, Umer S, Sahoo KS, Jhanjhi NZ, Shorfuzzaman M, Masud M. A pattern classification model for vowel data using fuzzy nearest neighbor. Intell Autom Soft Comput. 2023;35(3).","DOI":"10.32604\/iasc.2023.029785"},{"key":"1137_CR13","doi-asserted-by":"publisher","DOI":"10.1016\/j.patcog.2023.109641","volume":"142","author":"A Ali","year":"2023","unstructured":"Ali A, Hamraz M, Gul N, Khan DM, Aldahmani S, Khan Z. A k nearest neighbour ensemble via extended neighbourhood rule and feature subsets. Pattern Recogn. 2023;142: 109641.","journal-title":"Pattern Recogn"},{"key":"1137_CR14","doi-asserted-by":"crossref","unstructured":"Abdalla HI, Amer AA. Towards highly-efficient k-nearest neighbor algorithm for big data classification. In 2022 5th International Conference on Networking, Information Systems and Security: Envisage Intelligent Systems in 5g\/\/6G-based Interconnected Digital Worlds (NISS) (pp. 1\u20135). IEEE.\u200f 2022.","DOI":"10.1109\/NISS55057.2022.10085013"},{"issue":"3","key":"1137_CR15","doi-asserted-by":"publisher","first-page":"497","DOI":"10.3390\/pr10030497","volume":"10","author":"J Wang","year":"2022","unstructured":"Wang J, Zhou Z, Li Z, Du S. A novel fault detection scheme based on mutual k-nearest neighbor method: application on the industrial processes with outliers. Processes. 2022;10(3):497.","journal-title":"Processes"},{"issue":"2","key":"1137_CR16","doi-asserted-by":"publisher","first-page":"106","DOI":"10.3390\/bdcc7020106","volume":"7","author":"LV Nguyen","year":"2023","unstructured":"Nguyen LV, Vo QT, Nguyen TH. Adaptive KNN-based extended collaborative filtering recommendation services. Big Data Cogn Comput. 2023;7(2):106.","journal-title":"Big Data Cogn Comput"},{"key":"1137_CR17","doi-asserted-by":"publisher","DOI":"10.1016\/j.knosys.2022.108295","volume":"242","author":"J Ren","year":"2022","unstructured":"Ren J, Wang Y, Mao M, Cheung YM. Equalization ensemble for large scale highly imbalanced data classification. Knowl-Based Syst. 2022;242: 108295.","journal-title":"Knowl-Based Syst"},{"key":"1137_CR18","doi-asserted-by":"publisher","DOI":"10.1016\/j.patcog.2021.108126","volume":"120","author":"K Kim","year":"2021","unstructured":"Kim K. Normalized class coherence change-based kNN for classification of imbalanced data. Pattern Recogn. 2021;120: 108126.","journal-title":"Pattern Recogn"},{"key":"1137_CR19","doi-asserted-by":"publisher","DOI":"10.7717\/peerj-cs.194","volume":"5","author":"H Gweon","year":"2019","unstructured":"Gweon H, Schonlau M, Steiner SH. The k conditional nearest neighbor algorithm for classification and class probability estimation. PeerJ Comput Sci. 2019;5: e194.","journal-title":"PeerJ Comput Sci"},{"key":"1137_CR20","doi-asserted-by":"crossref","unstructured":"Saxena V, Bhardwaj S, Saxena AK. Enhancement of K nearest neighbour approach to solve the issue of pattern classification. In AIP Conference Proceedings (Vol. 2427, No. 1). AIP Publishing.\u200f 2023.","DOI":"10.1063\/5.0125071"},{"key":"1137_CR21","doi-asserted-by":"publisher","first-page":"4457","DOI":"10.1007\/s00521-020-05256-0","volume":"33","author":"BW Yuan","year":"2021","unstructured":"Yuan BW, Luo XG, Zhang ZL, Yu Y, Huo HW, Johannes T, Zou XD. A novel density-based adaptive k nearest neighbor method for dealing with overlapping problem in imbalanced datasets. Neural Comput Appl. 2021;33:4457\u201381.","journal-title":"Neural Comput Appl"},{"issue":"2","key":"1137_CR22","doi-asserted-by":"publisher","first-page":"1697","DOI":"10.1002\/int.22692","volume":"37","author":"H Zhang","year":"2022","unstructured":"Zhang H, Dong Y, Xu D. Accelerating exact nearest neighbor search in high dimensional Euclidean space via block vectors. Int J Intell Syst. 2022;37(2):1697\u2013722.","journal-title":"Int J Intell Syst"},{"key":"1137_CR23","doi-asserted-by":"publisher","first-page":"112","DOI":"10.1016\/j.patrec.2023.08.020","volume":"174","author":"J Yang","year":"2023","unstructured":"Yang J, Tan X, Rahardja S. Outlier detection: how to select k for k-nearest-neighbors-based outlier detectors. Pattern Recogn Lett. 2023;174:112\u20137.","journal-title":"Pattern Recogn Lett"},{"key":"1137_CR24","unstructured":"Shah AA, Ravana SD, Hamid S, Ismail MA. Web credibility assessment: affecting factors and assessment techniques.\u200f Information Research. 2015;20(1), paper 655. Retrieved from https:\/\/informationr.net\/ir\/20-1\/paper663.html."},{"issue":"2","key":"1137_CR25","doi-asserted-by":"publisher","first-page":"301","DOI":"10.1016\/j.joi.2012.12.001","volume":"7","author":"SI Moghadasi","year":"2013","unstructured":"Moghadasi SI, Ravana SD, Raman SN. Low-cost evaluation techniques for information retrieval systems: a review. J Informet. 2013;7(2):301\u201312.","journal-title":"J Informet"},{"key":"1137_CR26","unstructured":"Voulgaris Z, Magoulas GD. Extensions of the k nearest neighbour methods for classification problems. In Proceedings of the 26th IASTED International Conference on Artificial Intelligence and Applications, AIA (Vol. 8, pp. 23\u201328).\u200f 2008."},{"issue":"2","key":"1137_CR27","first-page":"370","volume":"18","author":"NABZ Adli","year":"2024","unstructured":"Adli NABZ, Ahmad M, Ghani NA, Ravana SD, Norman AA. An ensemble classification of mental health in Malaysia related to the Covid-19 pandemic using social media sentiment analysis. KSII Trans Internet Inf Syst (TIIS). 2024;18(2):370\u201396.","journal-title":"KSII Trans Internet Inf Syst (TIIS)"},{"key":"1137_CR28","doi-asserted-by":"publisher","first-page":"227","DOI":"10.1007\/s11063-018-9813-9","volume":"49","author":"M Pourseyyedi","year":"2019","unstructured":"Pourseyyedi M, Forghani Y. Weighted version of extended nearest neighbors. Neural Process Lett. 2019;49:227\u201337.","journal-title":"Neural Process Lett"},{"issue":"9","key":"1137_CR29","doi-asserted-by":"publisher","first-page":"234","DOI":"10.3390\/info9090234","volume":"9","author":"S Mehta","year":"2018","unstructured":"Mehta S, Shen X, Gou J, Niu D. A new nearest centroid neighbor classifier based on k local means using harmonic mean distance. Information. 2018;9(9):234.","journal-title":"Information"},{"key":"1137_CR30","first-page":"126","volume-title":"International Conference on Communications and Networking in China","author":"Y Zhao","year":"2020","unstructured":"Zhao Y, Liu X. A classifier combining local distance mean and centroid for imbalanced datasets. In: International Conference on Communications and Networking in China. Cham: Springer International Publishing; 2020. p. 126\u201339."},{"issue":"14","key":"1137_CR31","first-page":"37","volume":"10","author":"H Parvin","year":"2010","unstructured":"Parvin H, Alizadeh H, Minati B. A modification on k-nearest neighbor classifier. Global J Comp Sci Technol. 2010;10(14):37\u201341.","journal-title":"Global J Comp Sci Technol"},{"key":"1137_CR32","doi-asserted-by":"publisher","first-page":"012047","DOI":"10.1088\/1742-6596\/978\/1\/012047","volume":"978","author":"KU Syaliman","year":"2018","unstructured":"Syaliman KU, Nababan EB, Sitompul OS. Improving the accuracy of k-nearest neighbor using local mean based and distance weight. J Phys Conf Ser. 2018;978:012047.","journal-title":"J Phys Conf Ser"},{"key":"1137_CR33","doi-asserted-by":"publisher","first-page":"313","DOI":"10.1016\/j.ins.2023.02.004","volume":"629","author":"AX Wang","year":"2023","unstructured":"Wang AX, Chukova SS, Nguyen BP. Ensemble k-nearest neighbors based on centroid displacement. Inf Sci. 2023;629:313\u201323.","journal-title":"Inf Sci"},{"issue":"5","key":"1137_CR34","doi-asserted-by":"publisher","first-page":"1601","DOI":"10.1007\/s10618-022-00838-z","volume":"36","author":"F Zhou","year":"2022","unstructured":"Zhou F, Gao S, Ni L, Pavlovski M, Dong Q, Obradovic Z, Qian W. Dynamic self-paced sampling ensemble for highly imbalanced and class-overlapped data classification. Data Min Knowl Disc. 2022;36(5):1601\u201322.","journal-title":"Data Min Knowl Disc"},{"key":"1137_CR35","doi-asserted-by":"publisher","first-page":"38","DOI":"10.1016\/j.knosys.2019.01.016","volume":"167","author":"J Gou","year":"2019","unstructured":"Gou J, Qiu W, Yi Z, Shen X, Zhan Y, Ou W. Locality constrained representation-based K-nearest neighbor classification. Knowl-Based Syst. 2019;167:38\u201352.","journal-title":"Knowl-Based Syst"},{"key":"1137_CR36","doi-asserted-by":"publisher","first-page":"104","DOI":"10.1016\/j.neunet.2020.01.020","volume":"125","author":"J Gou","year":"2020","unstructured":"Gou J, Wang L, Yi Z, Yuan Y, Ou W, Mao Q. Weighted discriminative collaborative competitive representation for robust image classification. Neural Netw. 2020;125:104\u201320.","journal-title":"Neural Netw"},{"issue":"10","key":"1137_CR37","doi-asserted-by":"publisher","first-page":"1151","DOI":"10.1016\/j.patrec.2005.12.016","volume":"27","author":"Y Mitani","year":"2006","unstructured":"Mitani Y, Hamamoto Y. A local mean-based nonparametric classifier. Pattern Recogn Lett. 2006;27(10):1151\u20139.","journal-title":"Pattern Recogn Lett"},{"key":"1137_CR38","doi-asserted-by":"publisher","first-page":"1058","DOI":"10.1093\/comjnl\/bxr131","volume":"55","author":"J Gou","year":"2012","unstructured":"Gou J, Yi Z, Du L, Xiong T. A local mean-based k-nearest centroid neighbor classifier. Comput J. 2012;55:1058\u201371.","journal-title":"Comput J"},{"issue":"3","key":"1137_CR39","doi-asserted-by":"publisher","first-page":"52","DOI":"10.1109\/MCI.2015.2437512","volume":"10","author":"B Tang","year":"2015","unstructured":"Tang B, He H. ENN: extended nearest neighbor method for pattern recognition [research frontier]. IEEE Comput Intell Mag. 2015;10(3):52\u201360.","journal-title":"IEEE Comput Intell Mag"},{"key":"1137_CR40","doi-asserted-by":"crossref","unstructured":"Abdalla HI, Altaf A, Hamzah AA. A threefold-ensemble k-nearest neighbor algorithm. Int J Comput Appl. 2025;1\u201314.\u200f","DOI":"10.1080\/1206212X.2024.2446896"},{"issue":"8","key":"1137_CR41","doi-asserted-by":"publisher","first-page":"6292","DOI":"10.1016\/j.jksuci.2022.01.018","volume":"34","author":"S Suyanto","year":"2022","unstructured":"Suyanto S, Yunanto PE, Wahyuningrum T, Khomsah S. A multi-voter multi-commission nearest neighbor classifier. J King Saud Univ-Comput Inf Sci. 2022;34(8):6292\u2013302.","journal-title":"J King Saud Univ-Comput Inf Sci"},{"key":"1137_CR42","doi-asserted-by":"publisher","DOI":"10.1016\/j.eswa.2022.116529","volume":"194","author":"J Gou","year":"2022","unstructured":"Gou J, Sun L, Du L, Ma H, Xiong T, Ou W, Zhan Y. A representation coefficient-based k-nearest centroid neighbor classifier. Expert Syst Appl. 2022;194: 116529.","journal-title":"Expert Syst Appl"},{"key":"1137_CR43","doi-asserted-by":"publisher","first-page":"307","DOI":"10.1007\/s00500-008-0323-y","volume":"13","author":"J Alcal\u00e1-Fdez","year":"2009","unstructured":"Alcal\u00e1-Fdez J, Sanchez L, Garcia S, del Jesus MJ, Ventura S, Garrell JM, et al. KEEL: a software tool to assess evolutionary algorithms for data mining problems. Soft Comput. 2009;13:307\u201318.","journal-title":"Soft Comput"},{"key":"1137_CR44","first-page":"2825","volume":"12","author":"F Pedregosa","year":"2011","unstructured":"Pedregosa F, Varoquaux G, Gramfort A, Michel V, Thirion B, Grisel O, et al. Scikit-learn: machine learning in Python. J Mach Learn Res. 2011;12:2825\u201330.","journal-title":"J Mach Learn Res"},{"issue":"7","key":"1137_CR45","first-page":"6651","volume":"35","author":"NA Azhar","year":"2022","unstructured":"Azhar NA, Pozi MSM, Din AM, Jatowt A. An investigation of smote based methods for imbalanced datasets with data complexity analysis. IEEE Trans Knowl Data Eng. 2022;35(7):6651\u201372.","journal-title":"IEEE Trans Knowl Data Eng"},{"issue":"3","key":"1137_CR46","doi-asserted-by":"publisher","first-page":"1","DOI":"10.1145\/3319532","volume":"10","author":"J Gou","year":"2019","unstructured":"Gou J, Qiu W, Yi Z, Xu Y, Mao Q, Zhan Y. A local mean representation-based K-nearest neighbor classifier. ACM Trans Intell Syst Technol (TIST). 2019;10(3):1\u201325.","journal-title":"ACM Trans Intell Syst Technol (TIST)"},{"key":"1137_CR47","doi-asserted-by":"publisher","first-page":"397","DOI":"10.1016\/j.ins.2020.10.013","volume":"553","author":"B Chen","year":"2021","unstructured":"Chen B, Xia S, Chen Z, Wang B, Wang G. RSMOTE: A self-adaptive robust SMOTE for imbalanced problems with label noise. Inf Sci. 2021;553:397\u2013428.","journal-title":"Inf Sci"},{"key":"1137_CR48","doi-asserted-by":"crossref","unstructured":"Liu W, Chawla S. Class confidence weighted k NN algorithms for imbalanced data sets. In Advances in Knowledge Discovery and Data Mining: 15th Pacific-Asia Conference, PAKDD 2011, Shenzhen, China, May 24\u201327, 2011, Proceedings, Part II 15 (pp. 345\u2013356). Springer Berlin Heidelberg.\u200f 2011.","DOI":"10.1007\/978-3-642-20847-8_29"},{"issue":"27","key":"1137_CR49","doi-asserted-by":"publisher","first-page":"20103","DOI":"10.1007\/s00521-023-08754-z","volume":"35","author":"HI Abdalla","year":"2023","unstructured":"Abdalla HI, Amer AA, Ravana SD. BoW-based neural networks vs. cutting-edge models for single-label text classification. Neural Comput Appl. 2023;35(27):20103\u201316.","journal-title":"Neural Comput Appl"}],"container-title":["Journal of Big Data"],"original-title":[],"language":"en","link":[{"URL":"https:\/\/link.springer.com\/content\/pdf\/10.1186\/s40537-025-01137-2.pdf","content-type":"application\/pdf","content-version":"vor","intended-application":"text-mining"},{"URL":"https:\/\/link.springer.com\/article\/10.1186\/s40537-025-01137-2\/fulltext.html","content-type":"text\/html","content-version":"vor","intended-application":"text-mining"},{"URL":"https:\/\/link.springer.com\/content\/pdf\/10.1186\/s40537-025-01137-2.pdf","content-type":"application\/pdf","content-version":"vor","intended-application":"similarity-checking"}],"deposited":{"date-parts":[[2025,4,11]],"date-time":"2025-04-11T17:09:15Z","timestamp":1744391355000},"score":1,"resource":{"primary":{"URL":"https:\/\/journalofbigdata.springeropen.com\/articles\/10.1186\/s40537-025-01137-2"}},"subtitle":[],"short-title":[],"issued":{"date-parts":[[2025,4,11]]},"references-count":49,"journal-issue":{"issue":"1","published-online":{"date-parts":[[2025,12]]}},"alternative-id":["1137"],"URL":"https:\/\/doi.org\/10.1186\/s40537-025-01137-2","relation":{},"ISSN":["2196-1115"],"issn-type":[{"value":"2196-1115","type":"electronic"}],"subject":[],"published":{"date-parts":[[2025,4,11]]},"assertion":[{"value":"14 May 2024","order":1,"name":"received","label":"Received","group":{"name":"ArticleHistory","label":"Article History"}},{"value":"25 March 2025","order":2,"name":"accepted","label":"Accepted","group":{"name":"ArticleHistory","label":"Article History"}},{"value":"11 April 2025","order":3,"name":"first_online","label":"First Online","group":{"name":"ArticleHistory","label":"Article History"}},{"order":1,"name":"Ethics","group":{"name":"EthicsHeading","label":"Declarations"}},{"value":"Not applicable.","order":2,"name":"Ethics","group":{"name":"EthicsHeading","label":"Ethics approval and consent to participate"}},{"value":"Not applicable.","order":3,"name":"Ethics","group":{"name":"EthicsHeading","label":"Consent for publication"}},{"value":"The authors declare no competing interests.","order":4,"name":"Ethics","group":{"name":"EthicsHeading","label":"Competing interests"}}],"article-number":"86"}}