{"status":"ok","message-type":"work","message-version":"1.0.0","message":{"indexed":{"date-parts":[[2026,1,12]],"date-time":"2026-01-12T21:04:51Z","timestamp":1768251891204,"version":"3.49.0"},"publisher-location":"Cham","reference-count":37,"publisher":"Springer International Publishing","isbn-type":[{"value":"9783030821951","type":"print"},{"value":"9783030821968","type":"electronic"}],"license":[{"start":{"date-parts":[[2021,8,3]],"date-time":"2021-08-03T00:00:00Z","timestamp":1627948800000},"content-version":"tdm","delay-in-days":0,"URL":"https:\/\/www.springer.com\/tdm"},{"start":{"date-parts":[[2021,8,3]],"date-time":"2021-08-03T00:00:00Z","timestamp":1627948800000},"content-version":"vor","delay-in-days":0,"URL":"https:\/\/www.springer.com\/tdm"}],"content-domain":{"domain":["link.springer.com"],"crossmark-restriction":false},"short-container-title":[],"published-print":{"date-parts":[[2022]]},"DOI":"10.1007\/978-3-030-82196-8_15","type":"book-chapter","created":{"date-parts":[[2021,8,2]],"date-time":"2021-08-02T09:04:52Z","timestamp":1627895092000},"page":"199-215","update-policy":"https:\/\/doi.org\/10.1007\/springer_crossmark_policy","source":"Crossref","is-referenced-by-count":5,"title":["Imbalanced Dataset Optimization with New Resampling Techniques"],"prefix":"10.1007","author":[{"ORCID":"https:\/\/orcid.org\/0000-0002-3843-386X","authenticated-orcid":false,"given":"Ivan","family":"Letteri","sequence":"first","affiliation":[],"role":[{"role":"author","vocabulary":"crossref"}]},{"ORCID":"https:\/\/orcid.org\/0000-0002-9070-4663","authenticated-orcid":false,"given":"Antonio Di","family":"Cecco","sequence":"additional","affiliation":[],"role":[{"role":"author","vocabulary":"crossref"}]},{"ORCID":"https:\/\/orcid.org\/0000-0003-0329-2419","authenticated-orcid":false,"given":"Abeer","family":"Dyoub","sequence":"additional","affiliation":[],"role":[{"role":"author","vocabulary":"crossref"}]},{"ORCID":"https:\/\/orcid.org\/0000-0003-2327-9393","authenticated-orcid":false,"given":"Giuseppe Della","family":"Penna","sequence":"additional","affiliation":[],"role":[{"role":"author","vocabulary":"crossref"}]}],"member":"297","published-online":{"date-parts":[[2021,8,3]]},"reference":[{"key":"15_CR1","unstructured":"Ali, K., Brunk, C., Pazzani, M.: On learning multiple descriptions of a concept, pp. 476\u2013483 (1994)"},{"key":"15_CR2","doi-asserted-by":"publisher","first-page":"20","DOI":"10.1145\/1007730.1007735","volume":"6","author":"G Batista","year":"2004","unstructured":"Batista, G., Prati, R., Monard, M.-C.: A study of the behavior of several methods for balancing machine learning training data. SIGKDD Explor. 6, 20\u201329 (2004)","journal-title":"SIGKDD Explor."},{"issue":"6","key":"15_CR3","first-page":"698","volume":"26","author":"OC Nieto","year":"2020","unstructured":"Nieto, O.C., Y\u00e1\u00f1ez-M\u00e1rquez, C., Villuendas-Rey, Y.: Undersampling instance selection for hybrid and incomplete imbalanced data. J. UCS 26(6), 698\u2013719 (2020)","journal-title":"J. UCS"},{"key":"15_CR4","doi-asserted-by":"publisher","first-page":"321","DOI":"10.1613\/jair.953","volume":"16","author":"NV Chawla","year":"2002","unstructured":"Chawla, N.V., Bowyer, K.W., Hall, L.O., Kegelmeyer, W.P.: Smote: synthetic minority over-sampling technique. J. Artif. Intell. Res. 16, 321\u2013357 (2002)","journal-title":"J. Artif. Intell. Res."},{"key":"15_CR5","unstructured":"dos Santos Tanaka, F.H.K., Aranha, C.: Data augmentation using GANs. CoRR, abs\/1904.09135 (2019)"},{"key":"15_CR6","unstructured":"Dyoub, A., Costantini, S., Lisi, F.A., Letteri, I.: Logic-based machine learning for transparent ethical agents. In: Calimeri, F., Perri, S., Zumpano, E. (eds.) Proceedings of the 35th Italian Conference on Computational Logic - CILC 2020, Rende, Italy, 13\u201315 October (2020), volume 2710 of CEUR Workshop Proceedings, pp. 169\u2013183. CEUR-WS.org (2020)"},{"key":"15_CR7","doi-asserted-by":"publisher","first-page":"01","DOI":"10.1007\/978-3-319-10247-4","volume-title":"Data Preprocessing in Data Mining","author":"S Garc\u00eda","year":"2015","unstructured":"Garc\u00eda, S., Luengo, J., Herrera, F.: Data Preprocessing in Data Mining, p. 01. Springer, Cham (2015). https:\/\/doi.org\/10.1007\/978-3-319-10247-4"},{"key":"15_CR8","unstructured":"He, H., Bai, Y., Garcia, E.A., Li, S.: AdaSYN: adaptive synthetic sampling approach for imbalanced learning. In: 2008 IEEE International Joint Conference on Neural Networks (IEEE World Congress on Computational Intelligence), pp. 1322\u20131328 (2008)"},{"issue":"9","key":"15_CR9","doi-asserted-by":"publisher","first-page":"1263","DOI":"10.1109\/TKDE.2008.239","volume":"21","author":"H He","year":"2009","unstructured":"He, H., Garcia, E.A.: Learning from imbalanced data. IEEE Trans. Knowl. Data Eng. 21(9), 1263\u20131284 (2009)","journal-title":"IEEE Trans. Knowl. Data Eng."},{"key":"15_CR10","doi-asserted-by":"crossref","unstructured":"Ivan, T.: An experiment with the edited nearest-neighbor rule. IEEE Trans. Syst. Man Cybern. SMC-6(6), 448\u2013452 (1976)","DOI":"10.1109\/TSMC.1976.4309523"},{"key":"15_CR11","unstructured":"Japkowicz, N.: Class imbalances: are we focusing on the right issue (2003)"},{"key":"15_CR12","doi-asserted-by":"publisher","first-page":"67","DOI":"10.1007\/3-540-45153-6_7","volume-title":"Advances in Artificial Intelligence","author":"N Japkowicz","year":"2001","unstructured":"Japkowicz, N.: Concept-learning in the presence of between-class and within-class imbalances. In: Stroulia, E., Matwin, S. (eds.) Advances in Artificial Intelligence, pp. 67\u201377. Springer, Heidelberg (2001)"},{"issue":"4","key":"15_CR13","doi-asserted-by":"publisher","first-page":"307","DOI":"10.1561\/2200000056","volume":"12","author":"DP Kingma","year":"2019","unstructured":"Kingma, D.P., Welling, M.: An introduction to variational autoencoders. Found. Trends\u00ae Mach. Learn. 12(4), 307\u2013392 (2019)","journal-title":"Found. Trends\u00ae Mach. Learn."},{"key":"15_CR14","unstructured":"Kubat, M., Matwin, S.: Addressing the curse of imbalanced training sets: one-sided selection. In: In: Proceedings of the Fourteenth International Conference on Machine Learning, pp. 179\u2013186. Morgan Kaufmann (1997)"},{"key":"15_CR15","unstructured":"Kukar, M., Kononenko, I.: Cost-sensitive learning with neural networks. In: Prade, H. (eds.) 13th European Conference on Artificial Intelligence, Brighton, UK, 23\u201328 August 1998, Proceedings, pp. 445\u2013449. Wiley (1998)"},{"key":"15_CR16","unstructured":"Last, F., Douzas, G., Ba\u00e7\u00e3o, F.: Oversampling for imbalanced learning based on k-means and SMOTE. CoRR, abs\/1711.00837 (2017)"},{"key":"15_CR17","series-title":"Lecture Notes in Computer Science","doi-asserted-by":"publisher","first-page":"63","DOI":"10.1007\/3-540-48229-6_9","volume-title":"Artificial Intelligence in Medicine","author":"J Laurikkala","year":"2001","unstructured":"Laurikkala, J.: Improving identification of difficult small classes by balancing class distribution. In: Quaglini, S., Barahona, P., Andreassen, S. (eds.) Artificial Intelligence in Medicine. Lecture Notes in Computer Science, vol. 2101, pp. 63\u201366. Springer, Heidelberg (2001). https:\/\/doi.org\/10.1007\/3-540-48229-6_9"},{"key":"15_CR18","unstructured":"Letteri, I.: MTA-KDD\u201919 dataset (2019). https:\/\/github.com\/IvanLetteri\/MTA-KDD-19"},{"key":"15_CR19","unstructured":"Letteri, I., Di Cecco, A., Penna, G.D.: Dataset optimization strategies for malware traffic detection (2020)"},{"key":"15_CR20","doi-asserted-by":"crossref","unstructured":"Letteri, I., Penna, G.D., Caianiello, P.: Feature selection strategies for HTTP botnet traffic detection. In: 2019 IEEE European Symposium on Security and Privacy Workshops, EuroS&P Workshops 2019, Stockholm, Sweden, 17\u201319 June 2019, pp. 202\u2013210. IEEE (2019)","DOI":"10.1109\/EuroSPW.2019.00029"},{"key":"15_CR21","series-title":"Lecture Notes in Computer Science","doi-asserted-by":"publisher","first-page":"49","DOI":"10.1007\/978-3-030-01689-0_4","volume-title":"Cyberspace Safety and Security","author":"I Letteri","year":"2018","unstructured":"Letteri, I., Penna, G.D., De Gasperis, G.: Botnet detection in software defined networks by deep learning techniques. In: Castiglione, A., Pop, F., Ficco, M., Palmieri, F. (eds.) Cyberspace Safety and Security. Lecture Notes in Computer Science, vol. 1161, pp. 49\u201362. Springer, Cham (2018). https:\/\/doi.org\/10.1007\/978-3-030-01689-0_4"},{"key":"15_CR22","doi-asserted-by":"crossref","unstructured":"Letteri, I., Penna, G.D., De Gasperis, G.: Security in the internet of things: botnet detection in software-defined networks by deep learning techniques. In: 2020 IJHPCN International Journal of High Performance Computing and Networking, vol. 15, pp. 170\u2013182. IJHPCN (2020)","DOI":"10.1504\/IJHPCN.2019.106095"},{"key":"15_CR23","unstructured":"Letteri, I., Penna, G.D., Di Vita, L., Grifa, M.D.: MTA-KDD\u201919: a dataset for malware traffic detection. In: Loreti, M., Spalazzi, L. (eds.) Proceedings of the Fourth Italian Conference on Cyber Security, Ancona, Italy, February 4th to 7th, 2020, volume 2597 of CEUR Workshop Proceedings, pp. 153\u2013165. CEUR-WS.org (2020)"},{"key":"15_CR24","first-page":"5","volume":"40","author":"M Lieberman","year":"2014","unstructured":"Lieberman, M., Morris, J.: The precise effect of multicollinearity on classification prediction. Multiple Linear Regress. Viewpoints 40, 5\u201310 (2014)","journal-title":"Multiple Linear Regress. Viewpoints"},{"key":"15_CR25","doi-asserted-by":"publisher","first-page":"191","DOI":"10.1023\/A:1012406528296","volume":"46","author":"Y Lin","year":"2000","unstructured":"Lin, Y., Lee, Y., Wahba, G.: Support vector machines for classification in nonstandard situations. Mach. Learn. 46, 191\u2013202 (2000)","journal-title":"Mach. Learn."},{"key":"15_CR26","doi-asserted-by":"crossref","unstructured":"Liu, B., Ma, Y., Wong, C.: Improving an association rule based classifier. Lecture Notes in Computer Science vol. 504\u2013509, no. 01 (1910) (2000)","DOI":"10.1007\/3-540-45372-5_58"},{"key":"15_CR27","doi-asserted-by":"publisher","first-page":"113","DOI":"10.1016\/j.ins.2013.07.007","volume":"250","author":"V L\u00f3pez","year":"2013","unstructured":"L\u00f3pez, V., Fern\u00edndez, A., Garc\u00e1a, S., Palade, V., Herrera, F.: An insight into classification with imbalanced data: Empirical results and current trends on using data intrinsic characteristics. Inf. Sci. 250, 113\u2013141 (2013)","journal-title":"Inf. Sci."},{"key":"15_CR28","first-page":"07","volume":"46","author":"K Napierala","year":"2015","unstructured":"Napierala, K., Stefanowski, J.: Types of minority class examples and their influence on learning classifiers from imbalanced data. J. Intell. Inf. Syst. 46, 07 (2015)","journal-title":"J. Intell. Inf. Syst."},{"key":"15_CR29","doi-asserted-by":"publisher","first-page":"133","DOI":"10.1007\/s10462-010-9165-y","volume":"34","author":"J Olvera-L\u00f3pez","year":"2010","unstructured":"Olvera-L\u00f3pez, J., Carrasco-Ochoa, J., Mart\u00ednez-Trinidad, J.F., Kittler, J.: A review of instance selection methods. Artif. Intell. Rev. 34, 133\u2013143 (2010)","journal-title":"Artif. Intell. Rev."},{"issue":"5","key":"15_CR30","doi-asserted-by":"publisher","first-page":"1093","DOI":"10.1109\/TEVC.2009.2019829","volume":"13","author":"A Orriols-Puig","year":"2009","unstructured":"Orriols-Puig, A., Bernado-Mansilla, E., Goldberg, D.E., Sastry, K., Lanzi, P.L.: FACETwise analysis of XCS for problems with class imbalances. IEEE Trans. Evol. Comput. 13(5), 1093\u20131119 (2009)","journal-title":"IEEE Trans. Evol. Comput."},{"key":"15_CR31","doi-asserted-by":"crossref","unstructured":"Prusa, J., Khoshgoftaar, T.M., Dittman, D.J., Napolitano, a.: Using random undersampling to alleviate class imbalance on tweet sentiment data. In: 2015 IEEE International Conference on Information Reuse and Integration, pp. 197\u2013202 (2015)","DOI":"10.1109\/IRI.2015.39"},{"issue":"3","key":"15_CR32","doi-asserted-by":"publisher","first-page":"252","DOI":"10.1109\/34.75512","volume":"13","author":"SJ Raudys","year":"1991","unstructured":"Raudys, S.J., Jain, A.K.: Small sample size effects in statistical pattern recognition: recommendations for practitioners. IEEE Trans. Pattern Anal. Mach. Intell. 13(3), 252\u2013264 (1991)","journal-title":"IEEE Trans. Pattern Anal. Mach. Intell."},{"key":"15_CR33","doi-asserted-by":"crossref","unstructured":"S\u00e1ez, J.A., Luengo, J., Herrera, F.: A first study on the noise impact in classes for fuzzy rule based classification systems. In: 2010 IEEE International Conference on Intelligent Systems and Knowledge Engineering, pp. 153\u2013158 (2010)","DOI":"10.1109\/ISKE.2010.5680814"},{"key":"15_CR34","unstructured":"Ting, K.: The problem of small disjuncts: its remedy in decision trees (1994)"},{"key":"15_CR35","doi-asserted-by":"crossref","unstructured":"Van Hulse, J., Khoshgoftaar, T., Napolitano, A.: Experimental perspectives on learning from imbalanced data, vol. 227, pp. 935\u2013942 (2007)","DOI":"10.1145\/1273496.1273614"},{"issue":"1","key":"15_CR36","doi-asserted-by":"publisher","first-page":"7","DOI":"10.1145\/1007730.1007734","volume":"6","author":"GM Weiss","year":"2004","unstructured":"Weiss, G.M.: Mining with rarity: a unifying framework. SIGKDD Explor. Newsl. 6(1), 7\u201319 (2004)","journal-title":"SIGKDD Explor. Newsl."},{"issue":"1","key":"15_CR37","doi-asserted-by":"publisher","first-page":"63","DOI":"10.1109\/TKDE.2006.17","volume":"18","author":"Z-H Zhou","year":"2006","unstructured":"Zhou, Z.-H., Liu, X.-Y.: Training cost-sensitive neural networks with methods addressing the class imbalance problem. IEEE Trans. Knowl. Data Eng. 18(1), 63\u201377 (2006)","journal-title":"IEEE Trans. Knowl. Data Eng."}],"container-title":["Lecture Notes in Networks and Systems","Intelligent Systems and Applications"],"original-title":[],"language":"en","link":[{"URL":"https:\/\/link.springer.com\/content\/pdf\/10.1007\/978-3-030-82196-8_15","content-type":"unspecified","content-version":"vor","intended-application":"similarity-checking"}],"deposited":{"date-parts":[[2022,5,20]],"date-time":"2022-05-20T19:20:37Z","timestamp":1653074437000},"score":1,"resource":{"primary":{"URL":"https:\/\/link.springer.com\/10.1007\/978-3-030-82196-8_15"}},"subtitle":[],"short-title":[],"issued":{"date-parts":[[2021,8,3]]},"ISBN":["9783030821951","9783030821968"],"references-count":37,"URL":"https:\/\/doi.org\/10.1007\/978-3-030-82196-8_15","relation":{},"ISSN":["2367-3370","2367-3389"],"issn-type":[{"value":"2367-3370","type":"print"},{"value":"2367-3389","type":"electronic"}],"subject":[],"published":{"date-parts":[[2021,8,3]]},"assertion":[{"value":"3 August 2021","order":1,"name":"first_online","label":"First Online","group":{"name":"ChapterHistory","label":"Chapter History"}},{"value":"IntelliSys","order":1,"name":"conference_acronym","label":"Conference Acronym","group":{"name":"ConferenceInfo","label":"Conference Information"}},{"value":"Proceedings of SAI Intelligent Systems Conference","order":2,"name":"conference_name","label":"Conference Name","group":{"name":"ConferenceInfo","label":"Conference Information"}},{"value":"Amsterdam","order":3,"name":"conference_city","label":"Conference City","group":{"name":"ConferenceInfo","label":"Conference Information"}},{"value":"2021","order":5,"name":"conference_year","label":"Conference Year","group":{"name":"ConferenceInfo","label":"Conference Information"}},{"value":"2 September 2021","order":7,"name":"conference_start_date","label":"Conference Start Date","group":{"name":"ConferenceInfo","label":"Conference Information"}},{"value":"3 September 2021","order":8,"name":"conference_end_date","label":"Conference End Date","group":{"name":"ConferenceInfo","label":"Conference Information"}},{"value":"intellisys2021","order":10,"name":"conference_id","label":"Conference ID","group":{"name":"ConferenceInfo","label":"Conference Information"}},{"value":"http:\/\/saiconference.com\/IntelliSys","order":11,"name":"conference_url","label":"Conference URL","group":{"name":"ConferenceInfo","label":"Conference Information"}}]}}