{"status":"ok","message-type":"work","message-version":"1.0.0","message":{"indexed":{"date-parts":[[2026,3,16]],"date-time":"2026-03-16T10:55:38Z","timestamp":1773658538509,"version":"3.50.1"},"reference-count":44,"publisher":"Springer Science and Business Media LLC","issue":"2","license":[{"start":{"date-parts":[[2026,2,1]],"date-time":"2026-02-01T00:00:00Z","timestamp":1769904000000},"content-version":"tdm","delay-in-days":0,"URL":"https:\/\/www.springernature.com\/gp\/researchers\/text-and-data-mining"},{"start":{"date-parts":[[2026,2,1]],"date-time":"2026-02-01T00:00:00Z","timestamp":1769904000000},"content-version":"vor","delay-in-days":0,"URL":"https:\/\/www.springernature.com\/gp\/researchers\/text-and-data-mining"}],"content-domain":{"domain":["link.springer.com"],"crossmark-restriction":false},"short-container-title":["Int. J. Mach. Learn. &amp; Cyber."],"published-print":{"date-parts":[[2026,2]]},"DOI":"10.1007\/s13042-025-02910-8","type":"journal-article","created":{"date-parts":[[2026,2,2]],"date-time":"2026-02-02T06:19:20Z","timestamp":1770013160000},"update-policy":"https:\/\/doi.org\/10.1007\/springer_crossmark_policy","source":"Crossref","is-referenced-by-count":0,"title":["Optimizing k-anonymity with automated generalization trees: a study on classification utility"],"prefix":"10.1007","volume":"17","author":[{"given":"Taj","family":"Saleh","sequence":"first","affiliation":[],"role":[{"role":"author","vocabulary":"crossref"}]},{"given":"\u00d6mer","family":"Kor\u00e7ak","sequence":"additional","affiliation":[],"role":[{"role":"author","vocabulary":"crossref"}]}],"member":"297","published-online":{"date-parts":[[2026,2,2]]},"reference":[{"issue":"5","key":"2910_CR1","doi-asserted-by":"publisher","first-page":"1489","DOI":"10.1109\/JIOT.2017.2714189","volume":"4","author":"X Cheng","year":"2017","unstructured":"Cheng X, Fang L, Yang L, Cui S (2017) Mobile big data: the fuel for data-driven wireless. IEEE Internet Things J 4(5):1489\u20131516. https:\/\/doi.org\/10.1109\/JIOT.2017.2714189","journal-title":"IEEE Internet Things J"},{"issue":"24","key":"2910_CR2","doi-asserted-by":"publisher","first-page":"10571","DOI":"10.3390\/su122410571","volume":"12","author":"J Koo","year":"2020","unstructured":"Koo J, Kang G, Kim Y-G (2020) Security and privacy in big data life cycle: a survey and open challenges. Sustainability 12(24):10571. https:\/\/doi.org\/10.3390\/su122410571 (https:\/\/www.mdpi.com\/2071-1050\/12\/24\/10571)","journal-title":"Sustainability"},{"key":"2910_CR3","doi-asserted-by":"publisher","first-page":"578","DOI":"10.1016\/j.matpr.2022.05.117","volume":"64","author":"A Kiran","year":"2022","unstructured":"Kiran A, Shirisha N (2022) K-anonymization approach for privacy preservation using data perturbation techniques in data mining. Mater Today Proc 64:578\u2013584. https:\/\/doi.org\/10.1016\/j.matpr.2022.05.117","journal-title":"Mater Today Proc"},{"key":"2910_CR4","unstructured":"Sweeney L (2001) Information explosion, confidentiality, disclosure, and data access: theory and practical applications for statistical agencies. pp 43\u201374"},{"key":"2910_CR5","doi-asserted-by":"publisher","unstructured":"Goldsteen A, Ezov G, Shmelkin R, Moffie M, Farkash A (2022) Anonymizing machine learning models, volume 13140 of lecture notes in computer science, Ch.\u00a01. Springer International Publishing, pp 121\u2013136. https:\/\/doi.org\/10.1007\/978-3-030-93944-1_8","DOI":"10.1007\/978-3-030-93944-1_8"},{"key":"2910_CR6","doi-asserted-by":"publisher","unstructured":"de\u00a0Reus P, Oprescu A, van Elsen K (2023) Energy cost and machine learning accuracy impact of k-anonymisation and synthetic data techniques. In: 2023 international conference on ICT for sustainability (ICT4S). IEEE, pp 57\u201365. https:\/\/doi.org\/10.1109\/ict4s58814.2023.00015","DOI":"10.1109\/ict4s58814.2023.00015"},{"key":"2910_CR7","doi-asserted-by":"publisher","unstructured":"Oprescu A, Misdorp S, van Elsen K (2022) Energy cost and accuracy impact of k-anonymity. In: 2022 international conference on ICT for sustainability (ICT4S). pp 65\u201376. https:\/\/doi.org\/10.1109\/ICT4S55073.2022.00018","DOI":"10.1109\/ICT4S55073.2022.00018"},{"key":"2910_CR8","unstructured":"Turkey Regulation (tr) 2016\/6698 (2016). https:\/\/www.kvkk.gov.tr\/Icerik\/6649\/Personal-Data-Protection-Law"},{"key":"2910_CR9","doi-asserted-by":"publisher","unstructured":"Murthy S, Abu\u00a0Bakar A, Abdul\u00a0Rahim F, Ramli R (2019) A comparative study of data anonymization techniques. In: 2019 IEEE 5th international conference on big data security on cloud (BigDataSecurity), IEEE international conference on high performance and smart computing, (HPSC) and IEEE international conference on intelligent data and security (IDS). pp 306\u2013309. https:\/\/doi.org\/10.1109\/BigDataSecurity-HPSC-IDS.2019.00063","DOI":"10.1109\/BigDataSecurity-HPSC-IDS.2019.00063"},{"key":"2910_CR10","doi-asserted-by":"publisher","first-page":"8512","DOI":"10.1109\/ACCESS.2020.3045700","volume":"9","author":"A Majeed","year":"2021","unstructured":"Majeed A, Lee S (2021) Anonymization techniques for privacy preserving data publishing: a comprehensive survey. IEEE Access 9:8512\u20138545. https:\/\/doi.org\/10.1109\/ACCESS.2020.3045700","journal-title":"IEEE Access"},{"key":"2910_CR11","doi-asserted-by":"publisher","unstructured":"Chicaiza J, Cabrera-Loayza MC, Elizalde R, Piedra N (2020) Application of data anonymization in learning analytics. In: Proceedings of the 3rd international conference on applications of intelligent systems, APPIS 2020. Association for Computing Machinery, New York, pp 1\u20132. https:\/\/doi.org\/10.1145\/3378184.3378229","DOI":"10.1145\/3378184.3378229"},{"issue":"5","key":"2910_CR12","doi-asserted-by":"publisher","first-page":"589","DOI":"10.3390\/electronics10050589","volume":"10","author":"SU Bazai","year":"2021","unstructured":"Bazai SU, Jang-Jaccard J, Alavizadeh H (2021) Scalable, high-performance, and generalized subtree data anonymization approach for apache spark. Electronics 10(5):589. https:\/\/doi.org\/10.3390\/electronics10050589 (https:\/\/www.mdpi.com\/2079-9292\/10\/5\/589)","journal-title":"Electronics"},{"key":"2910_CR13","unstructured":"Samarati P, Sweeney L (1998) Protecting privacy when disclosing information: k-anonymity and its enforcement through generalization and suppression, Tech. rep., institution"},{"issue":"2","key":"2910_CR14","doi-asserted-by":"publisher","first-page":"206","DOI":"10.1109\/TKDE.2008.129","volume":"21","author":"A Gionis","year":"2009","unstructured":"Gionis A, Tassa T (2009) k-anonymization with minimal loss of information. IEEE Trans Knowl Data Eng 21(2):206\u2013219. https:\/\/doi.org\/10.1109\/TKDE.2008.129","journal-title":"IEEE Trans Knowl Data Eng"},{"key":"2910_CR15","doi-asserted-by":"crossref","unstructured":"D\u00edaz JSP, Garc\u00eda AL (2023) Comparison of machine learning models applied on anonymized data with different techniques . arXiv:2305.07415","DOI":"10.1109\/CSR57506.2023.10224917"},{"key":"2910_CR16","doi-asserted-by":"publisher","unstructured":"Lin JL, Wei MC (2008) An efficient clustering method for k-anonymization. In: Booktitle, PAIS \u201908. Association for Computing Machinery, New York, pp 46\u201350. https:\/\/doi.org\/10.1145\/1379287.1379297","DOI":"10.1145\/1379287.1379297"},{"key":"2910_CR17","doi-asserted-by":"publisher","unstructured":"Xu J, Wang W, Pei J, Wang X, Shi B, Fu AWC (2006) Utility-based anonymization using local recoding. In: Proceedings of the 12th ACM SIGKDD international conference on knowledge discovery and data mining, KDD \u201906. Association for Computing Machinery, New York, pp 785\u2013790. https:\/\/doi.org\/10.1145\/1150402.1150504","DOI":"10.1145\/1150402.1150504"},{"key":"2910_CR18","doi-asserted-by":"publisher","unstructured":"LeFevre K, DeWitt D, Ramakrishnan R (2006) Mondrian multidimensional k-anonymity. In: 22nd international conference on data engineering (ICDE\u201906). pp 25\u201325. https:\/\/doi.org\/10.1109\/ICDE.2006.101","DOI":"10.1109\/ICDE.2006.101"},{"issue":"5","key":"2910_CR19","doi-asserted-by":"publisher","first-page":"670","DOI":"10.1197\/jamia.M3144","volume":"16","author":"K El Emam","year":"2009","unstructured":"El Emam K, Dankar FK, Issa R, Jonker E, Amyot D, Cogo E, Corriveau J-P, Walker M, Chowdhury S, Vaillancourt R, Roffey T, Bottomley J (2009) A globally optimal k-anonymity method for the de-identification of health data. J Am Med Inform Assoc 16(5):670\u2013682. https:\/\/doi.org\/10.1197\/jamia.M3144","journal-title":"J Am Med Inform Assoc"},{"key":"2910_CR20","first-page":"155","volume":"5","author":"H Wimmer","year":"2014","unstructured":"Wimmer H, Powell LM (2014) A comparison of the effects of k-anonymity on machine learning algorithms. Int J Adv Comput Sci Appl 5:155\u2013160","journal-title":"Int J Adv Comput Sci Appl"},{"issue":"3","key":"2910_CR21","doi-asserted-by":"publisher","first-page":"334","DOI":"10.1109\/TKDE.2009.91","volume":"22","author":"S Kisilevich","year":"2010","unstructured":"Kisilevich S, Rokach L, Elovici Y, Shapira B (2010) Efficient multidimensional suppression for k-anonymity. IEEE Trans Knowl Data Eng 22(3):334\u2013347. https:\/\/doi.org\/10.1109\/TKDE.2009.91","journal-title":"IEEE Trans Knowl Data Eng"},{"issue":"3","key":"2910_CR22","doi-asserted-by":"publisher","first-page":"622","DOI":"10.1016\/j.datak.2007.03.009","volume":"63","author":"ME Nergiz","year":"2007","unstructured":"Nergiz ME, Clifton C (2007) Thoughts on k-anonymization. Data Knowl Eng 63(3):622\u2013645. https:\/\/doi.org\/10.1016\/j.datak.2007.03.009","journal-title":"Data Knowl Eng"},{"key":"2910_CR23","doi-asserted-by":"publisher","first-page":"571","DOI":"10.1142\/S021848850200165X","volume":"10","author":"L Sweeney","year":"2002","unstructured":"Sweeney L (2002) Achieving k-anonymity privacy protection using generalization and suppression. Int J Uncertain Fuzziness Knowl Based Syst 10:571\u2013588","journal-title":"Int J Uncertain Fuzziness Knowl Based Syst"},{"key":"2910_CR24","doi-asserted-by":"publisher","first-page":"138","DOI":"10.1016\/j.ins.2013.07.034","volume":"256","author":"M Last","year":"2014","unstructured":"Last M, Tassa T, Zhmudyak A, Shmueli E (2014) Improving accuracy of classification models induced from anonymized datasets. Inf Sci 256:138\u2013161. https:\/\/doi.org\/10.1016\/j.ins.2013.07.034","journal-title":"Inf Sci"},{"key":"2910_CR25","doi-asserted-by":"publisher","unstructured":"Chang R-I, Lee C-Y, Chen P-W, Wang C-H (2023) Machine learning of k-anonymity data by using feature importance and margin preservation. In: IEEE global conference on artificial intelligence and internet of things (GCAIoT). pp 91\u201396. https:\/\/doi.org\/10.1109\/GCAIoT61060.2023.10385127","DOI":"10.1109\/GCAIoT61060.2023.10385127"},{"key":"2910_CR26","unstructured":"Slijepcevic D, Henzl M, Klausner LD, Dam T, Kieseberg P, Zeppelzauer M (2021) k-Anonymity in practice: how generalisation and suppression affect machine learning classifiers. arXiv:2102.04763"},{"key":"2910_CR27","doi-asserted-by":"publisher","DOI":"10.1007\/978-0-387-84858-7","volume-title":"The elements of statistical learning: data mining, inference, and prediction","author":"T Hastie","year":"2009","unstructured":"Hastie T, Tibshirani R, Friedman J (2009) The elements of statistical learning: data mining, inference, and prediction. Springer Science & Business Media, Berlin"},{"key":"2910_CR28","volume-title":"C4.5: programs for machine learning","author":"JR Quinlan","year":"1993","unstructured":"Quinlan JR (1993) C4.5: programs for machine learning. Morgan Kaufmann Publishers, New York"},{"issue":"1","key":"2910_CR29","doi-asserted-by":"publisher","first-page":"5","DOI":"10.1023\/A:1010933404324","volume":"45","author":"L Breiman","year":"2001","unstructured":"Breiman L (2001) Random forests. Mach Learn 45(1):5\u201332. https:\/\/doi.org\/10.1023\/A:1010933404324","journal-title":"Mach Learn"},{"key":"2910_CR30","doi-asserted-by":"publisher","unstructured":"Ray S(2019) A quick review of machine learning algorithms. In: 2019 international conference on machine learning, big data, cloud and parallel computing (COMITCon). pp 35\u201339. https:\/\/doi.org\/10.1109\/COMITCon.2019.8862451","DOI":"10.1109\/COMITCon.2019.8862451"},{"issue":"1","key":"2910_CR31","doi-asserted-by":"publisher","first-page":"119","DOI":"10.1006\/jcss.1997.1504","volume":"55","author":"Y Freund","year":"1997","unstructured":"Freund Y, Schapire RE (1997) A decision-theoretic generalization of on-line learning and an application to boosting. J Comput Syst Sci 55(1):119\u2013139. https:\/\/doi.org\/10.1006\/jcss.1997.1504","journal-title":"J Comput Syst Sci"},{"key":"2910_CR32","doi-asserted-by":"publisher","unstructured":"Chen T, Guestrin C (2016) XGBoost. In: Proceedings of the 22nd ACM SIGKDD international conference on knowledge discovery and data mining. ACM, pp 1\u20132. https:\/\/doi.org\/10.1145\/2939672.2939785","DOI":"10.1145\/2939672.2939785"},{"issue":"1","key":"2910_CR33","doi-asserted-by":"publisher","first-page":"785","DOI":"10.1038\/s41597-022-01894-2","volume":"9","author":"J Sainz-Pardo Diaz","year":"2022","unstructured":"Sainz-Pardo Diaz J, Lopez Garcia A (2022) A Python library to check the level of anonymity of a dataset. Sci Data 9(1):785. https:\/\/doi.org\/10.1038\/s41597-022-01894-2 (https:\/\/www.nature.com\/articles\/s41597-022-01894-2)","journal-title":"Sci Data"},{"issue":"2","key":"2910_CR34","doi-asserted-by":"publisher","DOI":"10.2196\/ijmr.2140","volume":"1","author":"S Yoo","year":"2012","unstructured":"Yoo S, Shin M, Lee D (2012) An approach to reducing information loss and achieving diversity of sensitive attributes in k-anonymity methods. Interact J Med Res 1(2):e2140","journal-title":"Interact J Med Res"},{"key":"2910_CR35","doi-asserted-by":"publisher","unstructured":"Machanavajjhala A, Gehrke J, Kifer D, Venkitasubramaniam M (2006) L-diversity: privacy beyond k-anonymity. In: 22nd international conference on data engineering (ICDE\u201906). pp 24\u201324. https:\/\/doi.org\/10.1109\/ICDE.2006.1","DOI":"10.1109\/ICDE.2006.1"},{"key":"2910_CR36","doi-asserted-by":"publisher","unstructured":"Li N, Li T, Venkatasubramanian S (2007) t-closeness: Privacy beyond k-anonymity and l-diversity. In: 2007 IEEE 23rd international conference on data engineering. pp. 106\u2013115. https:\/\/doi.org\/10.1109\/ICDE.2007.367856","DOI":"10.1109\/ICDE.2007.367856"},{"key":"2910_CR37","unstructured":"Jayaraman B, Evans D (2019) Evaluating differentially private machine learning in practice. In: Proceedings of the 28th USENIX conference on security symposium, SEC\u201919. USENIX Association, pp 1895\u20131912"},{"key":"2910_CR38","doi-asserted-by":"publisher","DOI":"10.1016\/j.neucom.2024.127663","volume":"589","author":"K Pan","year":"2024","unstructured":"Pan K, Ong Y-S, Gong M, Li H, Qin A, Gao Y (2024) Differential privacy in deep learning: a literature survey. Neurocomputing 589:127663. https:\/\/doi.org\/10.1016\/j.neucom.2024.127663. (https:\/\/www.sciencedirect.com\/science\/article\/pii\/S092523122400434X)","journal-title":"Neurocomputing"},{"issue":"2","key":"2910_CR39","first-page":"161","volume":"6","author":"C Clifton","year":"2013","unstructured":"Clifton C, Tassa T (2013) On syntactic anonymity and differential privacy. Trans Data Privacy 6(2):161\u2013183","journal-title":"Trans Data Privacy"},{"issue":"7","key":"2910_CR40","doi-asserted-by":"publisher","first-page":"33","DOI":"10.1145\/3433638","volume":"64","author":"J Domingo-Ferrer","year":"2021","unstructured":"Domingo-Ferrer J, S\u00e1nchez D, Blanco-Justicia A (2021) The limits of differential privacy (and its misuse in data release and machine learning). Commun ACM 64(7):33\u201335. https:\/\/doi.org\/10.1145\/3433638","journal-title":"Commun ACM"},{"key":"2910_CR41","doi-asserted-by":"publisher","unstructured":"Kifer D, Machanavajjhala A (2011) No free lunch in data privacy. In: Proceedings of the ACM SIGMOD international conference on management of data, SIGMOD \u201911. Association for Computing Machinery, New York, pp 193\u2013204. https:\/\/doi.org\/10.1145\/1989323.1989345","DOI":"10.1145\/1989323.1989345"},{"issue":"8","key":"2910_CR42","doi-asserted-by":"publisher","first-page":"1","DOI":"10.1145\/3547139","volume":"55","author":"A Blanco-Justicia","year":"2022","unstructured":"Blanco-Justicia A, S\u00e1nchez D, Domingo-Ferrer J, Muralidhar K (2022) A critical review on the use (and misuse) of differential privacy in machine learning. ACM Comput Surv 55(8):1\u201316. https:\/\/doi.org\/10.1145\/3547139","journal-title":"ACM Comput Surv"},{"issue":"5","key":"2910_CR43","doi-asserted-by":"publisher","first-page":"670","DOI":"10.1197\/jamia.m3144","volume":"16","author":"KE Emam","year":"2009","unstructured":"Emam KE, Dankar FK, Issa R, Jonker E, Amyot D, Cogo E, Corriveau J-P, Walker M, Chowdhury S, Vaillancourt R, Roffey T, Bottomley J (2009) A globally optimal k-anonymity method for the de-identification of health data. J Am Med Inform Assoc 16(5):670\u2013682. https:\/\/doi.org\/10.1197\/jamia.m3144 (https:\/\/doi.org\/10.1197%2Fjamia.m3144)","journal-title":"J Am Med Inform Assoc"},{"issue":"11","key":"2910_CR44","doi-asserted-by":"publisher","first-page":"4164","DOI":"10.1118\/1.2786864","volume":"34","author":"M Elter","year":"2007","unstructured":"Elter M, Schulz-Wendtland R, Wittenberg T (2007) The prediction of breast cancer biopsy outcomes using two cad approaches that both emphasize an intelligible decision process. Med Phys 34(11):4164\u20134172. https:\/\/doi.org\/10.1118\/1.2786864","journal-title":"Med Phys"}],"container-title":["International Journal of Machine Learning and Cybernetics"],"original-title":[],"language":"en","link":[{"URL":"https:\/\/link.springer.com\/content\/pdf\/10.1007\/s13042-025-02910-8.pdf","content-type":"application\/pdf","content-version":"vor","intended-application":"text-mining"},{"URL":"https:\/\/link.springer.com\/article\/10.1007\/s13042-025-02910-8","content-type":"text\/html","content-version":"vor","intended-application":"text-mining"},{"URL":"https:\/\/link.springer.com\/content\/pdf\/10.1007\/s13042-025-02910-8.pdf","content-type":"application\/pdf","content-version":"vor","intended-application":"similarity-checking"}],"deposited":{"date-parts":[[2026,3,16]],"date-time":"2026-03-16T09:56:42Z","timestamp":1773655002000},"score":1,"resource":{"primary":{"URL":"https:\/\/link.springer.com\/10.1007\/s13042-025-02910-8"}},"subtitle":[],"short-title":[],"issued":{"date-parts":[[2026,2]]},"references-count":44,"journal-issue":{"issue":"2","published-print":{"date-parts":[[2026,2]]}},"alternative-id":["2910"],"URL":"https:\/\/doi.org\/10.1007\/s13042-025-02910-8","relation":{},"ISSN":["1868-8071","1868-808X"],"issn-type":[{"value":"1868-8071","type":"print"},{"value":"1868-808X","type":"electronic"}],"subject":[],"published":{"date-parts":[[2026,2]]},"assertion":[{"value":"23 November 2024","order":1,"name":"received","label":"Received","group":{"name":"ArticleHistory","label":"Article History"}},{"value":"2 November 2025","order":2,"name":"accepted","label":"Accepted","group":{"name":"ArticleHistory","label":"Article History"}},{"value":"2 February 2026","order":3,"name":"first_online","label":"First Online","group":{"name":"ArticleHistory","label":"Article History"}},{"order":1,"name":"Ethics","group":{"name":"EthicsHeading","label":"Declarations"}},{"value":"The authors have no conflict of interest to declare that are relevant to the content of this article.","order":2,"name":"Ethics","group":{"name":"EthicsHeading","label":"Conflict of interest"}}],"article-number":"73"}}