{"status":"ok","message-type":"work","message-version":"1.0.0","message":{"indexed":{"date-parts":[[2026,6,17]],"date-time":"2026-06-17T20:00:28Z","timestamp":1781726428190,"version":"3.54.5"},"reference-count":100,"publisher":"Springer Science and Business Media LLC","issue":"7","license":[{"start":{"date-parts":[[2020,2,22]],"date-time":"2020-02-22T00:00:00Z","timestamp":1582329600000},"content-version":"tdm","delay-in-days":0,"URL":"http:\/\/www.springer.com\/tdm"},{"start":{"date-parts":[[2020,2,22]],"date-time":"2020-02-22T00:00:00Z","timestamp":1582329600000},"content-version":"vor","delay-in-days":0,"URL":"http:\/\/www.springer.com\/tdm"}],"content-domain":{"domain":["link.springer.com"],"crossmark-restriction":false},"short-container-title":["Artif Intell Rev"],"published-print":{"date-parts":[[2020,10]]},"DOI":"10.1007\/s10462-020-09814-9","type":"journal-article","created":{"date-parts":[[2020,2,22]],"date-time":"2020-02-22T08:03:17Z","timestamp":1582358597000},"page":"5019-5081","update-policy":"https:\/\/doi.org\/10.1007\/springer_crossmark_policy","source":"Crossref","is-referenced-by-count":138,"title":["Applicability of machine learning in spam and phishing email filtering: review and approaches"],"prefix":"10.1007","volume":"53","author":[{"ORCID":"https:\/\/orcid.org\/0000-0002-0489-9573","authenticated-orcid":false,"given":"Tushaar","family":"Gangavarapu","sequence":"first","affiliation":[],"role":[{"vocabulary":"crossref","role":"author"}]},{"given":"C. D.","family":"Jaidhar","sequence":"additional","affiliation":[],"role":[{"vocabulary":"crossref","role":"author"}]},{"given":"Bhabesh","family":"Chanduka","sequence":"additional","affiliation":[],"role":[{"vocabulary":"crossref","role":"author"}]}],"member":"297","published-online":{"date-parts":[[2020,2,22]]},"reference":[{"key":"9814_CR1","doi-asserted-by":"crossref","unstructured":"Abu-Nimeh S, Nappa D, Wang X, Nair S (2007) A comparison of machine learning techniques for phishing detection. In: Proceedings of the anti-phishing working groups 2nd annual eCrime researchers summit. ACM, pp 60\u201369 (2007)","DOI":"10.1145\/1299015.1299021"},{"key":"9814_CR2","doi-asserted-by":"publisher","DOI":"10.1155\/2014\/425731","author":"AA Akinyelu","year":"2014","unstructured":"Akinyelu AA, Adewumi AO (2014) Classification of phishing email using random forest machine learning technique. J Appl Math. https:\/\/doi.org\/10.1155\/2014\/425731","journal-title":"J Appl Math"},{"key":"9814_CR3","first-page":"2","volume":"11","author":"I Alkaht","year":"2016","unstructured":"Alkaht I, Al-Khatib B (2016) Filtering spam using several stages neural networks. Int Rev Comp Softw 11:2","journal-title":"Int Rev Comp Softw"},{"key":"9814_CR4","doi-asserted-by":"crossref","unstructured":"Almeida TA, Yamakami A (2010) Content-based spam filtering. In: The 2010 international joint conference on neural networks (IJCNN). IEEE, pp 1\u20137 (2010)","DOI":"10.1109\/IJCNN.2010.5596569"},{"key":"9814_CR5","doi-asserted-by":"crossref","unstructured":"Apruzzese G, Colajanni M, Ferretti L, Guido A, Marchetti M (2018) On the effectiveness of machine and deep learning for cyber security. In: 2018 10th International conference on cyber conflict (CyCon). IEEE, pp 371\u2013390 (2018)","DOI":"10.23919\/CYCON.2018.8405026"},{"key":"9814_CR6","doi-asserted-by":"crossref","unstructured":"Auffarth B, L\u00f3pez M, Cerquides J (2010) Comparison of redundancy and relevance measures for feature selection in tissue classification of ct images. In: Industrial conference on data mining. Springer, pp 248\u2013262 (2010)","DOI":"10.1007\/978-3-642-14400-4_20"},{"issue":"1","key":"9814_CR7","first-page":"173","volume":"3","author":"W Awad","year":"2011","unstructured":"Awad W, ELseuofi S (2011) Machine learning methods for spam e-mail classification. Int J Comput Sci Inf Technol 3(1):173\u2013184","journal-title":"Int J Comput Sci Inf Technol"},{"issue":"4","key":"9814_CR8","first-page":"17","volume":"8","author":"M Awad","year":"2016","unstructured":"Awad M, Foqaha M (2016) Email spam classification using hybrid approach of rbf neural network and particle swarm optimization. Int J Netw Secur Appl 8(4):17\u201328","journal-title":"Int J Netw Secur Appl"},{"key":"9814_CR9","unstructured":"Basnet RB, Sung AH (2010) Classifying phishing emails using confidence-weighted linear classifiers. In: International conference on information security and artificial intelligence (ISAI), pp 108\u2013112 (2010)"},{"key":"9814_CR10","unstructured":"Bec scams trends and themes (2019) Bec scams remain a billion-dollar enterprise, targeting 6k businesses monthly. https:\/\/www.symantec.com\/blogs\/threat-intelligence\/bec-scams-trends-and-themes-2019. Accessed 07 May 2019"},{"issue":"1","key":"9814_CR11","doi-asserted-by":"publisher","first-page":"7","DOI":"10.3233\/JCS-2010-0371","volume":"18","author":"A Bergholz","year":"2010","unstructured":"Bergholz A, De Beer J, Glahn S, Moens MF, Paa\u00df G, Strobel S (2010) New filtering approaches for phishing email. J Comput Secur 18(1):7\u201335","journal-title":"J Comput Secur"},{"key":"9814_CR12","unstructured":"Bhagyashri G, Pratap H, Patil D (2013) Auto e-mails classification using bayesian filter. Int J Adv Technol Eng Res 3(4)"},{"key":"9814_CR13","unstructured":"Bhowmick A, Hazarika SM (2016) Machine learning for e-mail spam filtering: review, techniques and trends. arXiv preprint arXiv:1606.01042"},{"key":"9814_CR14","doi-asserted-by":"crossref","unstructured":"Biggio B, Corona I, Fumera G, Giacinto G, Roli F (2011) Bagging classifiers for fighting poisoning attacks in adversarial classification tasks. In: International workshop on multiple classifier systems. Springer, pp 350\u2013359 (2011)","DOI":"10.1007\/978-3-642-21557-5_37"},{"issue":"9","key":"9814_CR15","first-page":"179","volume":"5","author":"SD Bolboaca","year":"2006","unstructured":"Bolboaca SD, J\u00e4ntschi L (2006) Pearson versus spearman, kendall tau correlation analysis on structure\u2013activity relationships of biologic active compounds. Leonardo J Sci 5(9):179\u2013200","journal-title":"Leonardo J Sci"},{"key":"9814_CR16","unstructured":"Breiman L (2002) Manual on setting up, using, and understanding random forests v3. 1. Statistics Department University of California, Berkeley, p 1"},{"issue":"1","key":"9814_CR17","doi-asserted-by":"crossref","first-page":"5","DOI":"10.1023\/A:1010933404324","volume":"45","author":"L Breiman","year":"2001","unstructured":"Breiman L (2001) Random forests. Mach Learn 45(1):5\u201332","journal-title":"Mach Learn"},{"key":"9814_CR18","doi-asserted-by":"publisher","DOI":"10.1201\/9781315139470","volume-title":"Classification and regression trees","author":"L Breiman","year":"2017","unstructured":"Breiman L (2017) Classification and regression trees. Routledge, Abingdon"},{"key":"9814_CR19","unstructured":"Chandrasekaran M, Narayanan K, Upadhyaya S (2006) Phishing email detection based on structural properties. In: NYS cyber security conference, vol\u00a03. Albany, New York (2006)"},{"key":"9814_CR20","first-page":"662","volume-title":"Intelligent systems design and applications","author":"B Chanduka","year":"2018","unstructured":"Chanduka B, Gangavarapu T, Jaidhar CD (2018) A single program multiple data algorithm for feature selection. In: Abraham A, Cherukuri AK, Melin P, Gandhi N (eds) Intelligent systems design and applications. Springer, Cham, pp 662\u2013672"},{"key":"9814_CR21","unstructured":"Choudhary M, Dhaka V (2013) Automatic e-mails classification using genetic algorithm. In: Special conference issue: national conference on cloud computing and big data. Citeseer, pp 42\u201349 (2013)"},{"key":"9814_CR22","first-page":"3126","volume":"2","author":"V Christina","year":"2010","unstructured":"Christina V, Karpagavalli S, Suganya G (2010) Email spam filtering using supervised machine learning techniques. Int J Comput Sci Eng 2:3126\u20133129","journal-title":"Int J Comput Sci Eng"},{"issue":"4","key":"9814_CR23","doi-asserted-by":"publisher","first-page":"335","DOI":"10.1561\/1500000006","volume":"1","author":"GV Cormack","year":"2008","unstructured":"Cormack GV (2008) Email spam filtering: a systematic review. Found Trends Inf Retriev 1(4):335\u2013455","journal-title":"Found Trends Inf Retriev"},{"key":"9814_CR25","doi-asserted-by":"crossref","unstructured":"Dhanaraj S, Karthikeyani V (2013) A study on e-mail image spam filtering techniques. In: 2013 International conference on pattern recognition, informatics and mobile engineering. IEEE, pp 49\u201355 (2013)","DOI":"10.1109\/ICPRIME.2013.6496446"},{"issue":"17","key":"9814_CR24","first-page":"118","volume":"8","author":"KR Dhanaraj","year":"2014","unstructured":"Dhanaraj KR, Palaniswami V (2014) Firefly and bayes classifier for email spam classification in a distributed environment. Aust J Basic Appl Sci 8(17):118\u2013130","journal-title":"Aust J Basic Appl Sci"},{"issue":"1","key":"9814_CR26","doi-asserted-by":"publisher","first-page":"3","DOI":"10.1186\/1471-2105-7-3","volume":"7","author":"R D\u00edaz-Uriarte","year":"2006","unstructured":"D\u00edaz-Uriarte R, De Andres SA (2006) Gene selection and classification of microarray data using random forest. BMC Bioinform 7(1):3","journal-title":"BMC Bioinform"},{"key":"9814_CR27","doi-asserted-by":"crossref","unstructured":"Fette I, Sadeh N, Tomasic A (2007) Learning to detect phishing emails. In: Proceedings of the 16th international conference on world wide web. ACM, pp 649\u2013656 (2007)","DOI":"10.1145\/1242572.1242660"},{"key":"9814_CR28","unstructured":"Gang S (2017) Email overload: research and statistics [with infographic]. https:\/\/blog.sanebox.com\/2016\/02\/18\/email-overload-research-statistics-sanebox\/"},{"key":"9814_CR32","doi-asserted-by":"publisher","DOI":"10.1016\/j.asoc.2019.10553","author":"T Gangavarapu","year":"2019","unstructured":"Gangavarapu T, Patil N (2019) A novel filter-wrapper hybrid greedy ensemble approach optimized using the genetic algorithm to reduce the dimensionality of high-dimensional biomedical datasets. Appl Soft Comput. https:\/\/doi.org\/10.1016\/j.asoc.2019.10553","journal-title":"Appl Soft Comput"},{"key":"9814_CR29","doi-asserted-by":"publisher","first-page":"195","DOI":"10.1007\/978-3-030-23281-8_16","volume-title":"Natural language processing and information systems","author":"T Gangavarapu","year":"2019","unstructured":"Gangavarapu T, Jayasimha A, Krishnan GS, Kamath SS (2019a) TAGS: towards automated classification of unstructured clinical nursing notes. In: M\u00e9tais E, Meziane F, Vadera S, Sugumaran V, Saraee M (eds) Natural language processing and information systems. Springer, Cham, pp 195\u2013207"},{"key":"9814_CR30","doi-asserted-by":"publisher","DOI":"10.1016\/j.knosys.2019.105321","author":"T Gangavarapu","year":"2019","unstructured":"Gangavarapu T, Jayasimha A, Krishnan GS, Kamath S (2019b) Predicting ICD-9 code groups with fuzzy similarity based supervised multi-label classification of unstructured clinical nursing notes. Knowl Based Syst. https:\/\/doi.org\/10.1016\/j.knosys.2019.105321","journal-title":"Knowl Based Syst"},{"key":"9814_CR31","doi-asserted-by":"crossref","unstructured":"Gangavarapu T, Krishnan GS, Kamath S (2019c) Coherence-based modeling of clinical concepts inferred from heterogeneous clinical notes for icu patient risk stratification. In: Proceedings of the 23rd conference on computational natural language learning (CoNLL), pp 1012\u20131022 (2019)","DOI":"10.18653\/v1\/K19-1095"},{"key":"9814_CR33","doi-asserted-by":"crossref","unstructured":"Gansterer WN, P\u00f6lz D (2009) E-mail classification for phishing defense. In: European conference on information retrieval. Springer, pp 449\u2013460 (2009)","DOI":"10.1007\/978-3-642-00958-7_40"},{"issue":"1","key":"9814_CR34","doi-asserted-by":"publisher","first-page":"3","DOI":"10.1007\/s10994-006-6226-1","volume":"63","author":"P Geurts","year":"2006","unstructured":"Geurts P, Ernst D, Wehenkel L (2006) Extremely randomized trees. Mach Learn 63(1):3\u201342. https:\/\/doi.org\/10.1007\/s10994-006-6226-1","journal-title":"Mach Learn"},{"key":"9814_CR35","unstructured":"Guerra PHC, Guedes D, Meira JW, Hoepers C, Chaves M, Steding-Jessen K (2010) Exploring the spam arms race to characterize spam evolution. In: Proceedings of the 7th collaboration, electronic messaging, anti-abuse and spam conference (CEAS), Redmond"},{"issue":"1","key":"9814_CR36","doi-asserted-by":"publisher","first-page":"10","DOI":"10.1145\/1656274.1656278","volume":"11","author":"M Hall","year":"2009","unstructured":"Hall M, Frank E, Holmes G, Pfahringer B, Reutemann P, Witten IH (2009) The weka data mining software: an update. ACM SIGKDD Explor Newsl 11(1):10\u201318","journal-title":"ACM SIGKDD Explor Newsl"},{"key":"9814_CR37","doi-asserted-by":"publisher","first-page":"27","DOI":"10.1016\/j.cose.2014.04.002","volume":"45","author":"IRA Hamid","year":"2014","unstructured":"Hamid IRA, Abawajy JH (2014) An approach for profiling phishing activities. Comput Secur 45:27\u201341","journal-title":"Comput Secur"},{"issue":"7","key":"9814_CR38","doi-asserted-by":"publisher","first-page":"621","DOI":"10.2165\/00002018-200730070-00010","volume":"30","author":"DJ Hand","year":"2007","unstructured":"Hand DJ (2007) Principles of data mining. Drug Saf 30(7):621\u2013622","journal-title":"Drug Saf"},{"key":"9814_CR39","unstructured":"Han J, Liu Y, Sun X (2013) A scalable random forest algorithm based on mapreduce. In: 2013 IEEE 4th International conference on software engineering and service science. IEEE, pp 849\u2013852 (2013)"},{"issue":"20","key":"9814_CR40","first-page":"0975","volume":"122","author":"D Hassan","year":"2015","unstructured":"Hassan D (2015) On determining the most effective subset of features for detecting phishing websites. Int J Comput Appl 122(20):0975\u20138887","journal-title":"Int J Comput Appl"},{"key":"9814_CR41","doi-asserted-by":"crossref","unstructured":"Hassanpour R, Dogdu E, Choupani R, Goker O, Nazli N (2018) Phishing e-mail detection by using deep learning algorithms. In: Proceedings of the ACMSE 2018 conference. ACM, p\u00a045","DOI":"10.1145\/3190645.3190719"},{"issue":"3","key":"9814_CR42","doi-asserted-by":"publisher","first-page":"349","DOI":"10.4310\/SII.2009.v2.n3.a8","volume":"2","author":"T Hastie","year":"2009","unstructured":"Hastie T, Rosset S, Zhu J, Zou H (2009) Multi-class adaboost. Stat Interface 2(3):349\u2013360","journal-title":"Stat Interface"},{"key":"9814_CR43","unstructured":"Idris I, Abdulhamid SM (2014) An improved ais based e-mail classification technique for spam detection. arXiv preprint arXiv:1402.1242"},{"key":"9814_CR44","doi-asserted-by":"crossref","unstructured":"Issac B, Jap WJ (2009) Implementing spam detection using bayesian and porter stemmer keyword stripping approaches. In: TENCON 2009-2009 IEEE region 10 conference. IEEE, pp 1\u20135 (2009)","DOI":"10.1109\/TENCON.2009.5396056"},{"key":"9814_CR45","doi-asserted-by":"crossref","unstructured":"Jayasimha A, Gangavarapu T, Kamath SS, Krishnan GS (2020) Deep neural learning for automated diagnostic code group prediction using unstructured nursing notes. In: Proceedings of the 7th ACM IKDD CoDS and 25th COMAD, pp 152\u2013160 (2020)","DOI":"10.1145\/3371158.3371176"},{"issue":"5","key":"9814_CR46","doi-asserted-by":"publisher","first-page":"2835","DOI":"10.1109\/TIT.2015.2412945","volume":"61","author":"J Jiao","year":"2015","unstructured":"Jiao J, Venkat K, Han Y, Weissman T (2015) Minimax estimation of functionals of discrete distributions. IEEE Trans Inf Theory 61(5):2835\u20132885","journal-title":"IEEE Trans Inf Theory"},{"key":"9814_CR47","first-page":"171","volume":"14","author":"R Karthika","year":"2015","unstructured":"Karthika R, Visalakshi P (2015) A hybrid aco based feature selection method for email spam classification. WSEAS Trans Comput 14:171\u2013177","journal-title":"WSEAS Trans Comput"},{"key":"9814_CR48","doi-asserted-by":"crossref","unstructured":"Khonji M, Jones A, Iraqi Y (2011) A study of feature subset evaluators and feature subset searching methods for phishing classification. In: Proceedings of the 8th annual collaboration, electronic messaging, anti-abuse and spam conference. ACM, pp 135\u2013144 (2011)","DOI":"10.1145\/2030376.2030392"},{"key":"9814_CR49","first-page":"1","volume-title":"Lagrange multipliers without permanent scarring","author":"D Klein","year":"2004","unstructured":"Klein D (2004) Lagrange multipliers without permanent scarring. University of California at Berkeley, Computer Science Division, Berkeley, pp 1\u201311"},{"issue":"4","key":"9814_CR50","doi-asserted-by":"publisher","first-page":"493","DOI":"10.1037\/met0000105","volume":"21","author":"M Kosinski","year":"2016","unstructured":"Kosinski M, Wang Y, Lakkaraju H, Leskovec J (2016) Mining big data to extract patterns and predict real-life outcomes. Psychol Methods 21(4):493","journal-title":"Psychol Methods"},{"issue":"5","key":"9814_CR51","first-page":"874","volume":"23","author":"S Kumar","year":"2015","unstructured":"Kumar S, Arumugam S (2015) A probabilistic neural network based classification of spam mails using particle swarm optimization feature selection. Middle-East J Sci Res 23(5):874\u2013879","journal-title":"Middle-East J Sci Res"},{"key":"9814_CR52","doi-asserted-by":"publisher","first-page":"421","DOI":"10.1016\/j.ins.2014.02.114","volume":"277","author":"C Laorden","year":"2014","unstructured":"Laorden C, Ugarte-Pedrero X, Santos I, Sanz B, Nieves J, Bringas PG (2014) Study on the effectiveness of anomaly detection for spam filtering. Inf Sci 277:421\u2013444","journal-title":"Inf Sci"},{"key":"9814_CR53","unstructured":"Louppe G, Wehenkel L, Sutera A, Geurts P (2013) Understanding variable importances in forests of randomized trees. In: Advances in neural information processing systems, pp 431\u2013439"},{"key":"9814_CR54","doi-asserted-by":"publisher","DOI":"10.1002\/meet.14504201146","author":"CP Lueg","year":"2005","unstructured":"Lueg CP (2005) From spam filtering to information retrieval and back: seeking conceptual foundations for spam filtering. Proc Am Soc Inf Sci Technol. https:\/\/doi.org\/10.1002\/meet.14504201146","journal-title":"Proc Am Soc Inf Sci Technol"},{"key":"9814_CR55","unstructured":"Ma L, Yearwood J, Watters P (2009) Establishing phishing provenance using orthographic features. In: eCrime researchers summit, eCRIME\u201909. IEEE, pp 1\u201310"},{"key":"9814_CR56","doi-asserted-by":"crossref","unstructured":"Mendez JR, Fdez-Riverola F, Diaz F, Iglesias EL, Corchado JM (2006) A comparative performance study of feature selection methods for the anti-spam filtering domain. In: Industrial conference on data mining. Springer, pp 106\u2013120","DOI":"10.1007\/11790853_9"},{"key":"9814_CR57","volume-title":"Machine learning: an artificial intelligence approach","author":"RS Michalski","year":"2013","unstructured":"Michalski RS, Carbonell JG, Mitchell TM (2013) Machine learning: an artificial intelligence approach. Springer, New York"},{"key":"9814_CR58","unstructured":"Mohammad RM, Thabtah F, McCluskey L (2015) Phishing websites features. (Unpublished). http:\/\/eprints.hud.ac.uk\/24330\/6\/RamiPhishing\\_Websites\\_Feature.pdf"},{"key":"9814_CR59","unstructured":"Mousavi A, Ayremlou A (2011) Bayesian spam classifier. http:\/\/cs229.stanford.edu"},{"issue":"3","key":"9814_CR60","doi-asserted-by":"publisher","first-page":"691","DOI":"10.1093\/biomet\/78.3.691","volume":"78","author":"NJ Nagelkerke","year":"1991","unstructured":"Nagelkerke NJ et al (1991) A note on a general definition of the coefficient of determination. Biometrika 78(3):691\u2013692","journal-title":"Biometrika"},{"key":"9814_CR61","unstructured":"Nazario J (2018) Phishing corpus. https:\/\/drive.google.com\/open?id=0B3rX15hRO_71Tl9iOHRkdlEwZVE. Accessed 12 Oct 2018"},{"issue":"5","key":"9814_CR62","doi-asserted-by":"publisher","first-page":"61","DOI":"10.3390\/electronics7050061","volume":"7","author":"S Netsanet","year":"2018","unstructured":"Netsanet S, Zhang J, Zheng D (2018) Bagged decision trees based scheme of microgrid protection using windowed fast fourier and wavelet transforms. Electronics 7(5):61","journal-title":"Electronics"},{"key":"9814_CR63","unstructured":"Norte\u00a0Sosa J (2010) Spam classification using machine learning techniques-sinespam. Master\u2019s thesis, Universitat Polit\u00e8cnica de Catalunya"},{"key":"9814_CR64","unstructured":"Ott M, Choi Y, Cardie C, Hancock JT (2011) Finding deceptive opinion spam by any stretch of the imagination. In: Proceedings of the 49th annual meeting of the association for computational linguistics: human language technologies, vol 1. Association for Computational Linguistics, pp 309\u2013319"},{"key":"9814_CR65","unstructured":"Palanisamy C, Kumaresan T, Varalakshmi S (2016) Combined techniques for detecting email spam using negative selection and particle swarm optimization. Int J Adv Res Trends Eng Technol 3(2)"},{"key":"9814_CR66","doi-asserted-by":"crossref","unstructured":"Pan Y, Ding X (2006) Anomaly based web phishing page detection. In: Null. IEEE, pp 381\u2013392 (2006)","DOI":"10.1109\/ACSAC.2006.13"},{"issue":"11","key":"9814_CR67","doi-asserted-by":"publisher","first-page":"559","DOI":"10.1080\/14786440109462720","volume":"2","author":"K Pearson","year":"1901","unstructured":"Pearson K (1901) Liii on lines and planes of closest fit to systems of points in space. Lond Edinburgh Dublin Philos Mag J Sci 2(11):559\u2013572","journal-title":"Lond Edinburgh Dublin Philos Mag J Sci"},{"issue":"1","key":"9814_CR68","doi-asserted-by":"publisher","first-page":"25","DOI":"10.1093\/biomet\/13.1.25","volume":"13","author":"K Pearson","year":"1920","unstructured":"Pearson K (1920) Notes on the history of correlation. Biometrika 13(1):25\u201345","journal-title":"Biometrika"},{"key":"9814_CR69","doi-asserted-by":"crossref","unstructured":"Pelletier L, Almhana J, Choulakian V (2004) Adaptive filtering of spam. In: Proceedingsm second annual conference on communication networks and services research. IEEE, pp 218\u2013224 (2004)","DOI":"10.1109\/DNSR.2004.1344731"},{"issue":"8","key":"9814_CR70","doi-asserted-by":"publisher","first-page":"1226","DOI":"10.1109\/TPAMI.2005.159","volume":"27","author":"H Peng","year":"2005","unstructured":"Peng H, Long F, Ding C (2005) Feature selection based on mutual information criteria of max-dependency, max-relevance, and min-redundancy. IEEE Trans Pattern Anal Mach Intell 27(8):1226\u20131238","journal-title":"IEEE Trans Pattern Anal Mach Intell"},{"key":"9814_CR71","doi-asserted-by":"crossref","unstructured":"Rajamohana SP, Umamaheswari K, Abirami B (2017) Adaptive binary flower pollination algorithm for feature selection in review spam detection. In: 2017 International conference on innovations in green energy and healthcare technologies (IGEHT). IEEE, pp 1\u20134 (2017)","DOI":"10.1109\/IGEHT.2017.8094094"},{"key":"9814_CR72","unstructured":"Renuka DK, Visalakshi P, Sankar T (2015) Improving e-mail spam classification using ant colony optimization algorithm. Int J Comput Appl 22\u201326"},{"issue":"2","key":"9814_CR73","doi-asserted-by":"publisher","first-page":"215","DOI":"10.1016\/j.chemolab.2005.06.010","volume":"80","author":"F Rossi","year":"2006","unstructured":"Rossi F, Lendasse A, Fran\u00e7ois D, Wertz V, Verleysen M (2006) Mutual information for the selection of relevant variables in spectrometric nonlinear modelling. Chem Intell Lab Syst 80(2):215\u2013226","journal-title":"Chem Intell Lab Syst"},{"key":"9814_CR74","unstructured":"Sah UK, Parmar N (2017) An approach for malicious spam detection in email with comparison of different classifiers"},{"issue":"3","key":"9814_CR75","doi-asserted-by":"publisher","first-page":"e0118432","DOI":"10.1371\/journal.pone.0118432","volume":"10","author":"T Saito","year":"2015","unstructured":"Saito T, Rehmsmeier M (2015) The precision-recall plot is more informative than the roc plot when evaluating binary classifiers on imbalanced datasets. PloS ONE 10(3):e0118432","journal-title":"PloS ONE"},{"key":"9814_CR76","unstructured":"Sakkis G, Androutsopoulos I, Paliouras G, Karkaletsis V, Spyropoulos CD, Stamatopoulos P (2001) Stacking classifiers for anti-spam filtering of e-mail. arXiv preprint cs\/0106040"},{"key":"9814_CR77","doi-asserted-by":"publisher","first-page":"45","DOI":"10.1016\/S0065-2458(08)00603-7","volume":"74","author":"EP Sanz","year":"2008","unstructured":"Sanz EP, Hidalgo JMG, P\u00e9rez JCC (2008) Email spam filtering. Adv Comput 74:45\u2013114","journal-title":"Adv Comput"},{"key":"9814_CR78","doi-asserted-by":"crossref","unstructured":"Sculley D, Wachman GM (2007) Relaxed online svms for spam filtering. In: Proceedings of the 30th annual international ACM SIGIR conference on research and development in information retrieval. ACM, pp 415\u2013422 (2007)","DOI":"10.1145\/1277741.1277813"},{"key":"9814_CR79","doi-asserted-by":"crossref","unstructured":"Shams R, Mercer RE (2013) Classifying spam emails using text and readability features. In: 2013 IEEE 13th international conference on data mining (ICDM). IEEE, pp 657\u2013666","DOI":"10.1109\/ICDM.2013.131"},{"key":"9814_CR80","unstructured":"Sharma AK, Prajapat SK, Aslam M (2014) A comparative study between na\u00efve bayes and neural network (mlp) classifier for spam email detection. Int J Comput Appl"},{"issue":"6","key":"9814_CR81","first-page":"28","volume":"136","author":"A Sharma","year":"2016","unstructured":"Sharma A, Suryawanshi A (2016) A novel method for detecting spam email using knn classification with spearman correlation as distance measure. Int J Comput Appl 136(6):28\u201335","journal-title":"Int J Comput Appl"},{"issue":"8","key":"9814_CR82","first-page":"2956","volume":"4","author":"JN Shrivastava","year":"2013","unstructured":"Shrivastava JN, Bindu MH (2013) E-mail classification using genetic algorithm with heuristic fitness function. Int J Comput Trends Technol 4(8):2956\u20132961","journal-title":"Int J Comput Trends Technol"},{"key":"9814_CR83","unstructured":"Silipo R, Adae I, Hart A, Berthold M (2014) Seven techniques for data dimensionality reduction. Report, KNIME. com AG. Accessed 12 Jan 2018"},{"key":"9814_CR84","unstructured":"Symantec (2018) Internet security threat report. http:\/\/images.mktgassets.symantec.com\/Web\/Symantec\/%7B3a70beb8-c55d-4516-98ed-1d0818a42661%7D_ISTR23_Main-FINAL-APR10.pdf?aid=elq_. Accessed 09 Mar 2018"},{"key":"9814_CR85","doi-asserted-by":"crossref","unstructured":"Toolan F, Carthy J (2009) Phishing detection using classifier ensembles. In: eCrime researchers summit, eCRIME\u201909. IEEE, pp 1\u20139","DOI":"10.1109\/ECRIME.2009.5342607"},{"key":"9814_CR86","doi-asserted-by":"crossref","unstructured":"Toolan F, Carthy J (2010) Feature selection for spam and phishing detection. In: eCrime researchers summit (eCrime). IEEE, pp 1\u201312 (2010)","DOI":"10.1109\/ecrime.2010.5706696"},{"issue":"1","key":"9814_CR87","doi-asserted-by":"publisher","first-page":"3","DOI":"10.1016\/S0164-1212(99)00062-X","volume":"49","author":"CR Turner","year":"1999","unstructured":"Turner CR, Fuggetta A, Lavazza L, Wolf AL (1999) A conceptual basis for feature engineering. J Syst Softw 49(1):3\u201315","journal-title":"J Syst Softw"},{"key":"9814_CR88","unstructured":"Tyagi A (2016) Content based spam classification-a deep learning approach. Ph.D. thesis, University of Calgary"},{"issue":"1","key":"9814_CR89","doi-asserted-by":"publisher","first-page":"175","DOI":"10.1007\/s00521-013-1368-0","volume":"24","author":"JR Vergara","year":"2014","unstructured":"Vergara JR, Est\u00e9vez PA (2014) A review of feature selection methods based on mutual information. Neural Comput Appl 24(1):175\u2013186","journal-title":"Neural Comput Appl"},{"issue":"3","key":"9814_CR90","doi-asserted-by":"publisher","first-page":"1","DOI":"10.2200\/S00861ED1V01Y201806AIM039","volume":"12","author":"Y Vorobeychik","year":"2018","unstructured":"Vorobeychik Y, Kantarcioglu M (2018) Adversarial machine learning. Synth Lect Artifi Intell Mach Learn 12(3):1\u2013169","journal-title":"Synth Lect Artifi Intell Mach Learn"},{"key":"9814_CR91","unstructured":"Wang XL et\u00a0al (2005) Learning to classify email: a survey. In: 2005 International conference on machine learning and cybernetics, vol\u00a09. IEEE, pp 5716\u20135719 (2005)"},{"key":"9814_CR92","unstructured":"Wang Z, Josephson WK, Lv Q, Charikar M, Li K (2007) Filtering image spam with near-duplicate detection. In: CEAS (2007)"},{"issue":"1\u20133","key":"9814_CR93","doi-asserted-by":"publisher","first-page":"37","DOI":"10.1016\/0169-7439(87)80084-9","volume":"2","author":"S Wold","year":"1987","unstructured":"Wold S, Esbensen K, Geladi P (1987) Principal component analysis. Chem Intell Lab Syst 2(1\u20133):37\u201352","journal-title":"Chem Intell Lab Syst"},{"key":"9814_CR94","doi-asserted-by":"crossref","unstructured":"Wu J, Deng T (2008) Research in anti-spam method based on bayesian filtering. In: 2008 IEEE pacific-asia workshop on computational intelligence and industrial application, vol\u00a02. IEEE, pp 887\u2013891 (2008)","DOI":"10.1109\/PACIIA.2008.180"},{"key":"9814_CR95","unstructured":"Yang HH, Moody J (2000) Data visualization and feature selection: new algorithms for nongaussian data. In: Advances in neural information processing systems, pp 687\u2013693 (2000)"},{"issue":"7","key":"9814_CR96","doi-asserted-by":"publisher","first-page":"68","DOI":"10.5815\/ijmecs.2016.07.08","volume":"8","author":"M Zavvar","year":"2016","unstructured":"Zavvar M, Rezaei M, Garavand S (2016) Email spam detection using combination of particle swarm optimization and artificial neural network and support vector machine. Int J Mod Educ Comput Sci 8(7):68","journal-title":"Int J Mod Educ Comput Sci"},{"key":"9814_CR100","doi-asserted-by":"crossref","unstructured":"Zhuang W, Jiang Q, Xiong T (2012) An intelligent anti-phishing strategy model for phishing website detection. In: 32nd International conference on distributed computing systems workshops (ICDCSW). IEEE, pp 51\u201356","DOI":"10.1109\/ICDCSW.2012.66"},{"issue":"7","key":"9814_CR97","doi-asserted-by":"publisher","first-page":"845","DOI":"10.1016\/j.im.2014.08.003","volume":"51","author":"D Zhang","year":"2014","unstructured":"Zhang D, Yan Z, Jiang H, Kim T (2014) A domain-feature enhanced classification model for the detection of chinese phishing e-business websites. Inf Manag 51(7):845\u2013853","journal-title":"Inf Manag"},{"key":"9814_CR98","unstructured":"Zhao W, Zhang Z (2005) An email classification model based on rough set theory. In: Proceedings of the 2005 international conference on active media technology. IEEE, pp 403\u2013408"},{"key":"9814_CR99","doi-asserted-by":"crossref","unstructured":"Zhong N, Liu J, Yao Y, Wu J, Lu S, Qin Y, Li K, Wah B (2006) Spam filtering and email-mediated applications. In: International workshop on web intelligence meets brain informatics. Springer, pp 1\u201331 (2006)","DOI":"10.1007\/978-3-540-77028-2_1"}],"container-title":["Artificial Intelligence Review"],"original-title":[],"language":"en","link":[{"URL":"http:\/\/link.springer.com\/content\/pdf\/10.1007\/s10462-020-09814-9.pdf","content-type":"application\/pdf","content-version":"vor","intended-application":"text-mining"},{"URL":"http:\/\/link.springer.com\/article\/10.1007\/s10462-020-09814-9\/fulltext.html","content-type":"text\/html","content-version":"vor","intended-application":"text-mining"},{"URL":"http:\/\/link.springer.com\/content\/pdf\/10.1007\/s10462-020-09814-9.pdf","content-type":"application\/pdf","content-version":"vor","intended-application":"similarity-checking"}],"deposited":{"date-parts":[[2021,2,21]],"date-time":"2021-02-21T00:40:26Z","timestamp":1613868026000},"score":1,"resource":{"primary":{"URL":"http:\/\/link.springer.com\/10.1007\/s10462-020-09814-9"}},"subtitle":[],"short-title":[],"issued":{"date-parts":[[2020,2,22]]},"references-count":100,"journal-issue":{"issue":"7","published-print":{"date-parts":[[2020,10]]}},"alternative-id":["9814"],"URL":"https:\/\/doi.org\/10.1007\/s10462-020-09814-9","relation":{},"ISSN":["0269-2821","1573-7462"],"issn-type":[{"value":"0269-2821","type":"print"},{"value":"1573-7462","type":"electronic"}],"subject":[],"published":{"date-parts":[[2020,2,22]]},"assertion":[{"value":"22 February 2020","order":1,"name":"first_online","label":"First Online","group":{"name":"ArticleHistory","label":"Article History"}}]}}