{"status":"ok","message-type":"work","message-version":"1.0.0","message":{"indexed":{"date-parts":[[2026,2,26]],"date-time":"2026-02-26T15:24:19Z","timestamp":1772119459390,"version":"3.50.1"},"reference-count":28,"publisher":"Springer Science and Business Media LLC","issue":"1","license":[{"start":{"date-parts":[[2024,12,12]],"date-time":"2024-12-12T00:00:00Z","timestamp":1733961600000},"content-version":"tdm","delay-in-days":0,"URL":"https:\/\/www.springernature.com\/gp\/researchers\/text-and-data-mining"},{"start":{"date-parts":[[2024,12,12]],"date-time":"2024-12-12T00:00:00Z","timestamp":1733961600000},"content-version":"vor","delay-in-days":0,"URL":"https:\/\/www.springernature.com\/gp\/researchers\/text-and-data-mining"}],"content-domain":{"domain":["link.springer.com"],"crossmark-restriction":false},"short-container-title":["Knowl Inf Syst"],"published-print":{"date-parts":[[2025,1]]},"DOI":"10.1007\/s10115-024-02302-4","type":"journal-article","created":{"date-parts":[[2024,12,12]],"date-time":"2024-12-12T14:38:57Z","timestamp":1734014337000},"page":"549-578","update-policy":"https:\/\/doi.org\/10.1007\/springer_crossmark_policy","source":"Crossref","is-referenced-by-count":0,"title":["Preserving data distribution in sampling and instance selection with Renyi\u2019s divergence"],"prefix":"10.1007","volume":"67","author":[{"given":"Hadi","family":"Sadoghi-Yazdi","sequence":"first","affiliation":[]},{"given":"Soheila","family":"Ashkezari-Toussi","sequence":"additional","affiliation":[]},{"given":"Abolfazl","family":"Ramezanzadeh-Yazdi","sequence":"additional","affiliation":[]}],"member":"297","published-online":{"date-parts":[[2024,12,12]]},"reference":[{"key":"2302_CR1","doi-asserted-by":"publisher","DOI":"10.1016\/j.strusafe.2022.102292","volume":"101","author":"C Song","year":"2023","unstructured":"Song C, Kawai R (2023) Adaptive stratified sampling for structural reliability analysis. Struct Saf 101:102292","journal-title":"Struct Saf"},{"key":"2302_CR2","doi-asserted-by":"crossref","unstructured":"Parsons VL (2014) Stratified sampling. Wiley StatsRef: Statistics Reference Online, pp 1\u201311","DOI":"10.1002\/9781118445112.stat05999.pub2"},{"issue":"2","key":"2302_CR3","doi-asserted-by":"publisher","first-page":"290","DOI":"10.1080\/15598608.2017.1353456","volume":"12","author":"SA Mostafa","year":"2018","unstructured":"Mostafa SA, Ahmad IA (2018) Recent developments in systematic sampling: a review. J Stat Theory Pract 12(2):290\u2013310","journal-title":"J Stat Theory Pract"},{"key":"2302_CR4","doi-asserted-by":"publisher","first-page":"143","DOI":"10.1016\/j.ins.2022.04.036","volume":"602","author":"S Saha","year":"2022","unstructured":"Saha S, Sarker PS, Al Saud A, Shatabda S, Newton MH (2022) Cluster-oriented instance selection for classification problems. Inform Sci 602:143\u2013158","journal-title":"Inform Sci"},{"key":"2302_CR5","doi-asserted-by":"publisher","DOI":"10.1016\/j.ress.2021.108306","volume":"220","author":"X Zhang","year":"2022","unstructured":"Zhang X, Lu Z, Cheng K (2022) Cross-entropy-based directional importance sampling with von mises-fisher mixture model for reliability analysis. Reliability Eng Syst Saf 220:108306","journal-title":"Reliability Eng Syst Saf"},{"key":"2302_CR6","doi-asserted-by":"publisher","first-page":"1","DOI":"10.1007\/s11227-021-04177-6","volume":"78","author":"J Li","year":"2022","unstructured":"Li J, Wu Y, Fong S, Tall\u00f3n-Ballesteros AJ, Yang XS, Mohammed S, Wu F (2022) A binary PSO-based ensemble under-sampling model for rebalancing imbalanced training data. J Supercomput 78:1\u201336","journal-title":"J Supercomput"},{"key":"2302_CR7","doi-asserted-by":"publisher","first-page":"23","DOI":"10.1016\/j.ins.2021.12.016","volume":"587","author":"M Kordos","year":"2022","unstructured":"Kordos M, Blachnik M, Scherer R (2022) Fuzzy clustering decomposition of genetic algorithm-based instance selection for regression problems. Inform Sci 587:23\u201340","journal-title":"Inform Sci"},{"issue":"4","key":"2302_CR8","doi-asserted-by":"publisher","first-page":"12298","DOI":"10.1002\/eng2.12298","volume":"3","author":"S Susan","year":"2021","unstructured":"Susan S, Kumar A (2021) The balancing trick: optimized sampling of imbalanced datasets\u2014a brief survey of the recent state of the art. Eng Rep 3(4):12298","journal-title":"Eng Rep"},{"key":"2302_CR9","doi-asserted-by":"publisher","first-page":"1","DOI":"10.1155\/2021\/2314520","volume":"2021","author":"F Zhao","year":"2021","unstructured":"Zhao F, Xin Y, Zhang K, Niu X (2021) Representativeness-based instance selection for intrusion detection. Secur Commun Netw 2021:1\u201313","journal-title":"Secur Commun Netw"},{"key":"2302_CR10","doi-asserted-by":"crossref","unstructured":"Chen R, Xiao Q, Zhang Y, Xu J (2015) Differentially private high-dimensional data publication via sampling-based inference. In: Proceedings of the 21th ACM SIGKDD international conference on knowledge discovery and data mining, pp 129\u2013138","DOI":"10.1145\/2783258.2783379"},{"issue":"11","key":"2302_CR11","doi-asserted-by":"publisher","first-page":"3688","DOI":"10.1016\/j.patcog.2015.05.006","volume":"48","author":"L Jing","year":"2015","unstructured":"Jing L, Tian K, Huang JZ (2015) Stratified feature sampling method for ensemble clustering of high dimensional data. Pattern Recognit 48(11):3688\u20133702","journal-title":"Pattern Recognit"},{"key":"2302_CR12","doi-asserted-by":"publisher","first-page":"380","DOI":"10.1016\/j.asoc.2018.12.024","volume":"76","author":"S Maldonado","year":"2019","unstructured":"Maldonado S, L\u00f3pez J, Vairetti C (2019) An alternative smote oversampling strategy for high-dimensional datasets. Appl Soft Comput 76:380\u2013389","journal-title":"Appl Soft Comput"},{"issue":"11","key":"2302_CR13","doi-asserted-by":"publisher","first-page":"0224365","DOI":"10.1371\/journal.pone.0224365","volume":"14","author":"A Vabalas","year":"2019","unstructured":"Vabalas A, Gowen E, Poliakoff E, Casson AJ (2019) Machine learning algorithm validation with a limited sample size. PloS one 14(11):0224365","journal-title":"PloS one"},{"key":"2302_CR14","unstructured":"Yang D, Hong S, Jang Y, Zhao T, Lee H (2019) Diversity-sensitive conditional generative adversarial networks. arXiv preprint arXiv:1901.09024"},{"key":"2302_CR15","doi-asserted-by":"publisher","first-page":"69","DOI":"10.1016\/j.neucom.2022.12.046","volume":"524","author":"A Qin","year":"2023","unstructured":"Qin A, Tan Z, Tan X, Wu Y, Jing C, Tang YY (2023) Distribution preserving-based deep semi-NMF for data representation. Neurocomputing 524:69\u201383","journal-title":"Neurocomputing"},{"key":"2302_CR16","doi-asserted-by":"publisher","DOI":"10.1016\/j.techfore.2021.120796","volume":"169","author":"MSE Shahabadi","year":"2021","unstructured":"Shahabadi MSE, Tabrizchi H, Rafsanjani MK, Gupta B, Palmieri F (2021) A combination of clustering-based under-sampling with ensemble methods for solving imbalanced class problem in intelligent systems. Technol Forecast Soc Change 169:120796","journal-title":"Technol Forecast Soc Change"},{"key":"2302_CR17","doi-asserted-by":"crossref","unstructured":"Lu C, Deng S, Wu Y, Zhou H, Ma W (2022) Federated learning based on optics clustering optimization. Discret Dyn Nat Soc","DOI":"10.1155\/2022\/7151373"},{"key":"2302_CR18","doi-asserted-by":"crossref","unstructured":"Guo H, Guo P, Lu H (2006) A fast mean shift procedure with new iteration strategy and re-sampling. In: 2006 IEEE international conference on systems, man and cybernetics, vol. 3, pp 2385\u20132389. IEEE","DOI":"10.1109\/ICSMC.2006.385220"},{"key":"2302_CR19","doi-asserted-by":"crossref","unstructured":"Schier M, Reinders C, Rosenhahn B (2022) Constrained mean shift clustering. In: Proceedings of the 2022 SIAM international conference on data mining (SDM), pp 235\u2013243. SIAM","DOI":"10.1137\/1.9781611977172.27"},{"key":"2302_CR20","doi-asserted-by":"publisher","first-page":"571","DOI":"10.7717\/peerj-cs.571","volume":"7","author":"NA Saran","year":"2021","unstructured":"Saran NA, Saran M, Nar F (2021) Distribution-preserving data augmentation. Peer J Comput Sci 7:571","journal-title":"Peer J Comput Sci"},{"issue":"7","key":"2302_CR21","doi-asserted-by":"publisher","first-page":"5335","DOI":"10.1007\/s00521-022-07974-z","volume":"35","author":"F Aydin","year":"2023","unstructured":"Aydin F (2023) Unsupervised instance selection via conjectural hyperrectangles. Neural Comput Appl 35(7):5335\u20135349","journal-title":"Neural Comput Appl"},{"issue":"2","key":"2302_CR22","first-page":"853","volume":"26","author":"SO Tovias-Alanis","year":"2022","unstructured":"Tovias-Alanis SO, G\u00f3mez-Flores W, Toscano-Pulido G (2022) Evolutionary instance selection based on preservation of the data probability density function. Comput Sist 26(2):853\u2013866","journal-title":"Comput Sist"},{"issue":"4","key":"2302_CR23","doi-asserted-by":"publisher","first-page":"2047","DOI":"10.1109\/TCYB.2020.3008248","volume":"52","author":"ZZYSWLZXGYS Ji","year":"2020","unstructured":"Ji ZZYSWLZXGYS (2020) Kullback\u2013Leibler divergence metric learning. IEEE Trans Cybern 52(4):2047","journal-title":"IEEE Trans Cybern"},{"key":"2302_CR24","doi-asserted-by":"publisher","first-page":"58","DOI":"10.1016\/j.knosys.2016.10.031","volume":"116","author":"C Liu","year":"2017","unstructured":"Liu C, Wang W, Wang M, Lv F, Konan M (2017) An efficient instance selection algorithm to reconstruct training set for support vector machine. Knowl-Based Syst 116:58\u201373","journal-title":"Knowl-Based Syst"},{"key":"2302_CR25","doi-asserted-by":"publisher","DOI":"10.1016\/j.asoc.2020.106716","volume":"97","author":"M Aslani","year":"2020","unstructured":"Aslani M, Seipel S (2020) A fast instance selection method for support vector machines in building extraction. Appl Soft Comput 97:106716","journal-title":"Appl Soft Comput"},{"key":"2302_CR26","doi-asserted-by":"publisher","first-page":"579","DOI":"10.1016\/j.ins.2021.07.015","volume":"577","author":"M Aslani","year":"2021","unstructured":"Aslani M, Seipel S (2021) Efficient and decision boundary aware instance selection for support vector machines. Inform Sci 577:579\u2013598","journal-title":"Inform Sci"},{"key":"2302_CR27","doi-asserted-by":"publisher","first-page":"558","DOI":"10.1016\/j.ins.2023.01.090","volume":"628","author":"GFA Yeo","year":"2023","unstructured":"Yeo GFA, Akman D, Hudson I, Chan J (2023) A stochastic approximation approach to fixed instance selection. Inform Sci 628:558\u2013579","journal-title":"Inform Sci"},{"key":"2302_CR28","unstructured":"Wah C, Branson S, Welinder P, Perona P, Belongie S (2011) Wahcub. California Institute of Technology (CNS-TR-2011-001)"}],"container-title":["Knowledge and Information Systems"],"original-title":[],"language":"en","link":[{"URL":"https:\/\/link.springer.com\/content\/pdf\/10.1007\/s10115-024-02302-4.pdf","content-type":"application\/pdf","content-version":"vor","intended-application":"text-mining"},{"URL":"https:\/\/link.springer.com\/article\/10.1007\/s10115-024-02302-4\/fulltext.html","content-type":"text\/html","content-version":"vor","intended-application":"text-mining"},{"URL":"https:\/\/link.springer.com\/content\/pdf\/10.1007\/s10115-024-02302-4.pdf","content-type":"application\/pdf","content-version":"vor","intended-application":"similarity-checking"}],"deposited":{"date-parts":[[2025,1,31]],"date-time":"2025-01-31T07:04:53Z","timestamp":1738307093000},"score":1,"resource":{"primary":{"URL":"https:\/\/link.springer.com\/10.1007\/s10115-024-02302-4"}},"subtitle":[],"short-title":[],"issued":{"date-parts":[[2024,12,12]]},"references-count":28,"journal-issue":{"issue":"1","published-print":{"date-parts":[[2025,1]]}},"alternative-id":["2302"],"URL":"https:\/\/doi.org\/10.1007\/s10115-024-02302-4","relation":{"has-preprint":[{"id-type":"doi","id":"10.21203\/rs.3.rs-3333967\/v1","asserted-by":"object"}]},"ISSN":["0219-1377","0219-3116"],"issn-type":[{"value":"0219-1377","type":"print"},{"value":"0219-3116","type":"electronic"}],"subject":[],"published":{"date-parts":[[2024,12,12]]},"assertion":[{"value":"7 September 2023","order":1,"name":"received","label":"Received","group":{"name":"ArticleHistory","label":"Article History"}},{"value":"19 October 2024","order":2,"name":"revised","label":"Revised","group":{"name":"ArticleHistory","label":"Article History"}},{"value":"26 November 2024","order":3,"name":"accepted","label":"Accepted","group":{"name":"ArticleHistory","label":"Article History"}},{"value":"12 December 2024","order":4,"name":"first_online","label":"First Online","group":{"name":"ArticleHistory","label":"Article History"}},{"order":1,"name":"Ethics","group":{"name":"EthicsHeading","label":"Declarations"}},{"value":"The authors have no conflict of interest to declare that are relevant to the content of this article","order":2,"name":"Ethics","group":{"name":"EthicsHeading","label":"Conflict of interest"}}]}}