{"status":"ok","message-type":"work","message-version":"1.0.0","message":{"indexed":{"date-parts":[[2026,6,17]],"date-time":"2026-06-17T13:06:14Z","timestamp":1781701574536,"version":"3.54.5"},"reference-count":79,"publisher":"Institute of Electrical and Electronics Engineers (IEEE)","license":[{"start":{"date-parts":[[2020,1,1]],"date-time":"2020-01-01T00:00:00Z","timestamp":1577836800000},"content-version":"vor","delay-in-days":0,"URL":"https:\/\/creativecommons.org\/licenses\/by\/4.0\/legalcode"}],"funder":[{"name":"CAPES\u2013Brazilian Higher Education Personnel Improvement Coordination","award":["PROAP\/UnB\/PPGEE"],"award-info":[{"award-number":["PROAP\/UnB\/PPGEE"]}]},{"name":"CAPES\u2013Brazilian Higher Education Personnel Improvement Coordination","award":["23038.007604\/2014-69 FORTE"],"award-info":[{"award-number":["23038.007604\/2014-69 FORTE"]}]},{"name":"CAPES\u2013Brazilian Higher Education Personnel Improvement Coordination","award":["88887.144009\/2017-00 PROBRAL"],"award-info":[{"award-number":["88887.144009\/2017-00 PROBRAL"]}]},{"name":"CNPq\u2013Brazilian National Research Council","award":["312180\/2019-5 PQ-2"],"award-info":[{"award-number":["312180\/2019-5 PQ-2"]}]},{"name":"CNPq\u2013Brazilian National Research Council","award":["303343\/2017-6 PQ-2"],"award-info":[{"award-number":["303343\/2017-6 PQ-2"]}]},{"name":"CNPq\u2013Brazilian National Research Council","award":["BRICS 2017-591 LargEWiN"],"award-info":[{"award-number":["BRICS 2017-591 LargEWiN"]}]},{"name":"CNPq\u2013Brazilian National Research Council","award":["465741\/2014-2 INCT in cybersecurity"],"award-info":[{"award-number":["465741\/2014-2 INCT in cybersecurity"]}]},{"name":"FAP-DF\u2013Brazilian Federal District Research Support Foundation","award":["0193.001366\/2016 UIoT"],"award-info":[{"award-number":["0193.001366\/2016 UIoT"]}]},{"name":"FAP-DF\u2013Brazilian Federal District Research Support Foundation","award":["0193.001365\/2016 SSDDC"],"award-info":[{"award-number":["0193.001365\/2016 SSDDC"]}]},{"name":"Brazilian Ministry of the Economy","award":["005\/2016 DIPLA"],"award-info":[{"award-number":["005\/2016 DIPLA"]}]},{"name":"Brazilian Ministry of the Economy","award":["083\/2016 ENAP"],"award-info":[{"award-number":["083\/2016 ENAP"]}]},{"name":"Institutional Security Office of the Presidency of Brazil","award":["ABIN 002\/2017"],"award-info":[{"award-number":["ABIN 002\/2017"]}]},{"name":"Administrative Council for Economic Defense","award":["CADE 08700.000047\/2019-14"],"award-info":[{"award-number":["CADE 08700.000047\/2019-14"]}]},{"name":"General Attorney of the Union","award":["AGU 697.935\/2019"],"award-info":[{"award-number":["AGU 697.935\/2019"]}]}],"content-domain":{"domain":[],"crossmark-restriction":false},"short-container-title":["IEEE Access"],"published-print":{"date-parts":[[2020]]},"DOI":"10.1109\/access.2020.3043396","type":"journal-article","created":{"date-parts":[[2020,12,10]],"date-time":"2020-12-10T02:30:34Z","timestamp":1607567434000},"page":"223529-223547","source":"Crossref","is-referenced-by-count":49,"title":["The Answer is in the Text: Multi-Stage Methods for Phishing Detection Based on Feature Engineering"],"prefix":"10.1109","volume":"8","author":[{"ORCID":"https:\/\/orcid.org\/0000-0002-2917-3605","authenticated-orcid":false,"given":"Eder Souza","family":"Gualberto","sequence":"first","affiliation":[],"role":[{"vocabulary":"crossref","role":"author"}]},{"ORCID":"https:\/\/orcid.org\/0000-0003-1101-3029","authenticated-orcid":false,"given":"Rafael Timoteo","family":"De Sousa","sequence":"additional","affiliation":[],"role":[{"vocabulary":"crossref","role":"author"}]},{"ORCID":"https:\/\/orcid.org\/0000-0003-0512-374X","authenticated-orcid":false,"given":"Thiago Pereira","family":"De Brito Vieira","sequence":"additional","affiliation":[],"role":[{"vocabulary":"crossref","role":"author"}]},{"ORCID":"https:\/\/orcid.org\/0000-0002-8616-4924","authenticated-orcid":false,"given":"Joao Paulo Carvalho Lustosa","family":"Da Costa","sequence":"additional","affiliation":[],"role":[{"vocabulary":"crossref","role":"author"}]},{"given":"Claudio Gottschalg","family":"Duque","sequence":"additional","affiliation":[],"role":[{"vocabulary":"crossref","role":"author"}]}],"member":"263","reference":[{"key":"ref73","article-title":"How many components should be retained from a multivariate time series PCA?","author":"rea","year":"2016","journal-title":"arXiv 1610 03588"},{"key":"ref72","author":"kim","year":"1978","journal-title":"Factor Analysis Statistical Methods and Practical Issues"},{"key":"ref71","author":"manning","year":"1999","journal-title":"Foundations of Statistical Natural Language Processing"},{"key":"ref70","doi-asserted-by":"publisher","DOI":"10.4169\/amer.math.monthly.119.10.838"},{"key":"ref76","author":"osuna","year":"1997","journal-title":"Support vector machines Training and applications"},{"key":"ref77","doi-asserted-by":"publisher","DOI":"10.1145\/2939672.2939785"},{"key":"ref74","doi-asserted-by":"publisher","DOI":"10.1080\/01638539809545028"},{"key":"ref39","first-page":"10","article-title":"Distributed representation using target classes: Bag of tricks for security and privacy analytics Amrita-Nlpiwspa-2018","volume":"2124","author":"barathi ganesh","year":"2018","journal-title":"Proc CEUR Workshop Proceedings"},{"key":"ref75","doi-asserted-by":"publisher","DOI":"10.1162\/089976698300017197"},{"key":"ref38","author":"vazhayil","year":"2017","journal-title":"Ped-ML Phishing Email Detection Using Classical Machine Learning Techniques Censec Amrita"},{"key":"ref78","first-page":"40","article-title":"Deepanti-phishnet: Applying deep neural networks for phishing email detection cen-aisecurity@iwspa-2018","author":"kb","year":"2010","journal-title":"Proc IWSPA"},{"key":"ref79","first-page":"1","article-title":"Anti-phishing shared task pilot at the 4th ACM IWSPA","author":"baki","year":"2018","journal-title":"Proc IWSPA-AP"},{"key":"ref33","doi-asserted-by":"publisher","DOI":"10.1109\/ISI.2010.5484762"},{"key":"ref32","doi-asserted-by":"publisher","DOI":"10.5815\/ijieeb.2015.02.08"},{"key":"ref31","doi-asserted-by":"publisher","DOI":"10.1155\/2014\/425731"},{"key":"ref30","doi-asserted-by":"publisher","DOI":"10.1007\/978-3-642-33167-1_47"},{"key":"ref37","first-page":"21","article-title":"A machine learning approach towards phishing email detection cen-security Iwspa 2018","volume":"2124","author":"harikrishnan","year":"2018","journal-title":"Proc CEUR Workshop Proceedings"},{"key":"ref36","first-page":"64","article-title":"Machine learning based phishing e-mail detection security-ceneamrita","author":"unnithan","year":"2018","journal-title":"Proc CEUR Workshop Proceedings"},{"key":"ref35","doi-asserted-by":"publisher","DOI":"10.1016\/j.cose.2012.12.002"},{"key":"ref34","doi-asserted-by":"publisher","DOI":"10.1186\/1687-417X-2012-1"},{"key":"ref60","first-page":"1157","article-title":"An introduction to variable and feature selection","volume":"3","author":"guyon","year":"2003","journal-title":"J Mach Learn Res"},{"key":"ref62","author":"alpaydin","year":"2014","journal-title":"Introduction to Machine Learning"},{"key":"ref61","first-page":"1","article-title":"Feature selection and feature extraction in pattern analysis: A literature review","volume":"abs 1905 2845","author":"ghojogh","year":"2019","journal-title":"CoRR"},{"key":"ref28","doi-asserted-by":"publisher","DOI":"10.1109\/ecrime.2010.5706696"},{"key":"ref63","doi-asserted-by":"publisher","DOI":"10.5769\/J201202001"},{"key":"ref27","doi-asserted-by":"publisher","DOI":"10.1016\/j.jnca.2012.05.009"},{"key":"ref64","doi-asserted-by":"publisher","DOI":"10.1016\/j.jnca.2017.04.012"},{"key":"ref65","author":"shlens","year":"2005","journal-title":"A Tutorial on Principal Component Analysis"},{"key":"ref29","doi-asserted-by":"publisher","DOI":"10.5121\/ijnsa.2016.8405"},{"key":"ref66","author":"jolliffe","year":"2002","journal-title":"Principal Component Analysis"},{"key":"ref67","doi-asserted-by":"publisher","DOI":"10.1037\/0033-295X.104.2.211"},{"key":"ref68","doi-asserted-by":"publisher","DOI":"10.1002\/(SICI)1097-4571(199009)41:6<391::AID-ASI1>3.0.CO;2-9"},{"key":"ref2","year":"2020","journal-title":"Cisco Annual Internet Report (2018-2023) White Paper"},{"key":"ref69","doi-asserted-by":"publisher","DOI":"10.4324\/9780203936399"},{"key":"ref1","author":"stats","year":"2020","journal-title":"Internet Usage Statistics&#x2014;The Internet Big Picture World Internet Users and 2020 Population Stats"},{"key":"ref20","doi-asserted-by":"publisher","DOI":"10.3115\/1613715.1613831"},{"key":"ref22","doi-asserted-by":"publisher","DOI":"10.1007\/s11036-017-0839-4"},{"key":"ref21","doi-asserted-by":"publisher","DOI":"10.1186\/s40537-014-0007-7"},{"key":"ref24","doi-asserted-by":"publisher","DOI":"10.1145\/1242572.1242660"},{"key":"ref23","doi-asserted-by":"publisher","DOI":"10.5769\/C2013007"},{"key":"ref26","first-page":"1","article-title":"Multi stage phishing email classification","volume":"83","author":"daeef","year":"2016","journal-title":"J Theor Appl Inf Technol"},{"key":"ref25","doi-asserted-by":"publisher","DOI":"10.24846\/v22i1y201307"},{"key":"ref50","doi-asserted-by":"publisher","DOI":"10.1109\/ACCESS.2017.2702187"},{"key":"ref51","doi-asserted-by":"publisher","DOI":"10.1007\/s10462-020-09814-9"},{"key":"ref59","author":"bishop","year":"2006","journal-title":"Pattern Recognition and Machine Learning"},{"key":"ref58","author":"duda","year":"2001","journal-title":"Pattern Classification"},{"key":"ref57","doi-asserted-by":"publisher","DOI":"10.5120\/ijca2016908317"},{"key":"ref56","first-page":"1","article-title":"Using TF-IDF to determine word relevance in document queries","author":"ramos","year":"2003","journal-title":"Proc 1st Instruct Conf Mach Learn"},{"key":"ref55","doi-asserted-by":"publisher","DOI":"10.1007\/978-3-319-72347-1"},{"key":"ref54","doi-asserted-by":"publisher","DOI":"10.18653\/v1\/2020.acl-demos.14"},{"key":"ref53","doi-asserted-by":"publisher","DOI":"10.1017\/CBO9780511809071"},{"key":"ref52","doi-asserted-by":"publisher","DOI":"10.1007\/978-3-642-36530-0_11"},{"key":"ref10","doi-asserted-by":"publisher","DOI":"10.1109\/TDSC.2018.2864993"},{"key":"ref11","doi-asserted-by":"publisher","DOI":"10.1145\/1299015.1299021"},{"key":"ref40","first-page":"39","article-title":"Deepanti-phishnet: Applying deep neural networks for phishing email detection cen-aisecurityiwspa ?2018","volume":"2124","author":"vinayakumar","year":"2018","journal-title":"Proc CEUR Workshop Proceedings"},{"key":"ref12","first-page":"51","article-title":"Detecting phishing e-mail using machine learning techniques","author":"nidhin a unnithan","year":"2018","journal-title":"Proc ACM Conf Data Appl Secur Privacy"},{"key":"ref13","doi-asserted-by":"publisher","DOI":"10.1145\/3190645.3190719"},{"key":"ref14","doi-asserted-by":"publisher","DOI":"10.2200\/S00762ED1V01Y201703HLT037"},{"key":"ref15","article-title":"Speech and language processing: An introduction to natural language processing","author":"jurafsky","year":"2009","journal-title":"Computational Linguistics and Speech Recognition"},{"key":"ref16","doi-asserted-by":"publisher","DOI":"10.1613\/jair.2934"},{"key":"ref17","doi-asserted-by":"publisher","DOI":"10.1007\/978-3-319-56991-8_77"},{"key":"ref18","doi-asserted-by":"publisher","DOI":"10.1007\/11494669_93"},{"key":"ref19","first-page":"653","article-title":"Similarity learning for high-dimensional sparse data","volume":"38","author":"liu","year":"2015","journal-title":"Proc Int Conf Artif Intell Statist"},{"key":"ref4","doi-asserted-by":"publisher","DOI":"10.1016\/j.eswa.2018.03.050"},{"key":"ref3","year":"2020","journal-title":"Phishing Activity Trends Reports 1st Quarter 2020 Plus Covid-19 Coverage"},{"key":"ref6","doi-asserted-by":"publisher","DOI":"10.1016\/j.cose.2017.04.006"},{"key":"ref5","first-page":"547","article-title":"Detection of phishing e-mail","volume":"2","author":"singh","year":"2011","journal-title":"Int J Comput Sci Technol"},{"key":"ref8","doi-asserted-by":"publisher","DOI":"10.1109\/ICCS45141.2019.9065639"},{"key":"ref7","doi-asserted-by":"publisher","DOI":"10.1109\/SURV.2013.030713.00020"},{"key":"ref49","year":"2020","journal-title":"The Apache Spamassassin Public Corpus"},{"key":"ref9","doi-asserted-by":"publisher","DOI":"10.1007\/s13042-018-00906-1"},{"key":"ref46","doi-asserted-by":"publisher","DOI":"10.1109\/ACCESS.2019.2913705"},{"key":"ref45","doi-asserted-by":"publisher","DOI":"10.1007\/978-3-030-39303-8_17"},{"key":"ref48","author":"nazario","year":"2020","journal-title":"Phishing Corpus"},{"key":"ref47","doi-asserted-by":"publisher","DOI":"10.1109\/ACCESS.2020.2989126"},{"key":"ref42","doi-asserted-by":"publisher","DOI":"10.1007\/978-3-030-50420-5_18"},{"key":"ref41","doi-asserted-by":"publisher","DOI":"10.1109\/SAI.2017.8252096"},{"key":"ref44","doi-asserted-by":"publisher","DOI":"10.1109\/ACCESS.2018.2837889"},{"key":"ref43","doi-asserted-by":"publisher","DOI":"10.1007\/s10462-020-09814-9"}],"container-title":["IEEE Access"],"original-title":[],"link":[{"URL":"http:\/\/xplorestaging.ieee.org\/ielx7\/6287639\/8948470\/09288667.pdf?arnumber=9288667","content-type":"unspecified","content-version":"vor","intended-application":"similarity-checking"}],"deposited":{"date-parts":[[2021,12,17]],"date-time":"2021-12-17T19:55:27Z","timestamp":1639770927000},"score":1,"resource":{"primary":{"URL":"https:\/\/ieeexplore.ieee.org\/document\/9288667\/"}},"subtitle":[],"short-title":[],"issued":{"date-parts":[[2020]]},"references-count":79,"URL":"https:\/\/doi.org\/10.1109\/access.2020.3043396","relation":{},"ISSN":["2169-3536"],"issn-type":[{"value":"2169-3536","type":"electronic"}],"subject":[],"published":{"date-parts":[[2020]]}}}