{"status":"ok","message-type":"work","message-version":"1.0.0","message":{"indexed":{"date-parts":[[2025,10,12]],"date-time":"2025-10-12T20:19:37Z","timestamp":1760300377027,"version":"3.28.0"},"reference-count":51,"publisher":"IEEE","license":[{"start":{"date-parts":[[2019,12,1]],"date-time":"2019-12-01T00:00:00Z","timestamp":1575158400000},"content-version":"vor","delay-in-days":0,"URL":"https:\/\/ieeexplore.ieee.org\/Xplorehelp\/downloads\/license-information\/IEEE.html"},{"start":{"date-parts":[[2019,12,1]],"date-time":"2019-12-01T00:00:00Z","timestamp":1575158400000},"content-version":"stm-asf","delay-in-days":0,"URL":"https:\/\/doi.org\/10.15223\/policy-029"},{"start":{"date-parts":[[2019,12,1]],"date-time":"2019-12-01T00:00:00Z","timestamp":1575158400000},"content-version":"stm-asf","delay-in-days":0,"URL":"https:\/\/doi.org\/10.15223\/policy-037"}],"content-domain":{"domain":[],"crossmark-restriction":false},"short-container-title":[],"published-print":{"date-parts":[[2019,12]]},"DOI":"10.1109\/bigdata47090.2019.9006282","type":"proceedings-article","created":{"date-parts":[[2020,2,25]],"date-time":"2020-02-25T06:05:34Z","timestamp":1582610734000},"page":"4299-4308","source":"Crossref","is-referenced-by-count":13,"title":["Detecting Web Spam in Webgraphs with Predictive Model Analysis"],"prefix":"10.1109","author":[{"given":"Naw Safrin","family":"Sattar","sequence":"first","affiliation":[],"role":[{"role":"author","vocabulary":"crossref"}]},{"given":"Shaikh","family":"Arifuzzaman","sequence":"additional","affiliation":[],"role":[{"role":"author","vocabulary":"crossref"}]},{"given":"Minhaz F.","family":"Zibran","sequence":"additional","affiliation":[],"role":[{"role":"author","vocabulary":"crossref"}]},{"given":"Md Mohiuddin","family":"Sakib","sequence":"additional","affiliation":[],"role":[{"role":"author","vocabulary":"crossref"}]}],"member":"263","reference":[{"key":"ref39","first-page":"41","article-title":"An empirical study of the naive bayes classifier","volume":"3","author":"rish","year":"2001","journal-title":"IJCAI 2001 Workshop on Empirical Methods in Artificial Intelligence"},{"journal-title":"Introduction to Naive Bayes Classification Algorithm in Python and R","year":"0","author":"jain","key":"ref38"},{"journal-title":"Scikit- Learn Support Vector Machines","year":"0","key":"ref33"},{"journal-title":"Kernel functions-introduction to svm kernel & examples","year":"0","key":"ref32"},{"key":"ref31","first-page":"1","article-title":"Cs229 lecture notes","volume":"1","author":"ng","year":"2000","journal-title":"CS229 Lecture Notes"},{"journal-title":"How to use classification machine learning algorithms in weka","year":"0","author":"brownlee","key":"ref30"},{"key":"ref37","doi-asserted-by":"publisher","DOI":"10.1016\/j.eswa.2006.09.004"},{"journal-title":"K-nearest Neighbor Algorithm","year":"0","key":"ref36"},{"key":"ref35","first-page":"986","article-title":"Knn model-based approach in classification","author":"guo","year":"2003","journal-title":"OTM Confederated InternationalConferences&#x201D; On the Move to Meaningful Internet Systems&#x201D;"},{"journal-title":"Understanding Support Vector Machine algorithm from examples (along with code)","year":"0","author":"ray","key":"ref34"},{"key":"ref28","doi-asserted-by":"publisher","DOI":"10.1016\/j.procs.2015.10.069"},{"key":"ref27","doi-asserted-by":"publisher","DOI":"10.1109\/GLOCOM.2018.8647294"},{"key":"ref29","doi-asserted-by":"publisher","DOI":"10.1007\/978-1-4302-5990-9_3"},{"key":"ref2","article-title":"Using rank propagation and probabilistic counting for link-based spam detection","volume":"6","author":"becchetti","year":"2006","journal-title":"Proc of WebKDD"},{"key":"ref1","doi-asserted-by":"publisher","DOI":"10.1145\/1401890.1401898"},{"key":"ref20","doi-asserted-by":"publisher","DOI":"10.1145\/1135777.1135794"},{"key":"ref22","doi-asserted-by":"publisher","DOI":"10.1145\/1326561.1326563"},{"key":"ref21","first-page":"1","article-title":"Blocking blog spam with language model disagreement","volume":"5","author":"mishne","year":"2005","journal-title":"AIRWeb"},{"key":"ref24","article-title":"Web spam detection using multiple kernels in twin support vector machine","author":"mohammadi","year":"2016","journal-title":"arXiv preprint arXiv 1605 09090"},{"key":"ref23","doi-asserted-by":"publisher","DOI":"10.1145\/1277741.1277814"},{"journal-title":"Classification of malicious web pages through a j48 decision tree a na&#x00EF;ve bayes a rbf network and a random forest classifier for webspam detection","year":"2017","author":"iqbal","key":"ref26"},{"key":"ref25","doi-asserted-by":"publisher","DOI":"10.1155\/2019\/6587020"},{"key":"ref50","article-title":"Api design for machine learning software: experiences from the scikit-learn project","author":"buitinck","year":"2013","journal-title":"arXiv preprint arXiv 1309 0238"},{"key":"ref51","article-title":"The weka workbench. online appendix for&#x201D; data mining: Practical machine learning tools and techniques","author":"eibe","year":"2016","journal-title":"Morgan Kaufmann"},{"key":"ref10","doi-asserted-by":"publisher","DOI":"10.1145\/792550.792553"},{"key":"ref11","doi-asserted-by":"publisher","DOI":"10.1109\/MC.2005.352"},{"journal-title":"Decision Trees and Random Forests for Classification and Regression","year":"0","author":"lan","key":"ref40"},{"key":"ref12","article-title":"Web spam taxonomy","author":"gyongyi","year":"2005","journal-title":"First International Workshop on Adversarial Information Retrieval on the Web (AIRWeb 2005)"},{"key":"ref13","first-page":"335","article-title":"Detecting spam bots in online social networking sites: a machine learning approach","author":"wang","year":"2010","journal-title":"IFIP Annual Conference on Data and Applications Security and Privacy"},{"key":"ref14","doi-asserted-by":"publisher","DOI":"10.1109\/TNSE.2018.2866066"},{"key":"ref15","doi-asserted-by":"crossref","first-page":"16","DOI":"10.3390\/s18010016","article-title":"Warcprocessor: An integrative tool for building and management of web spam corpora","volume":"18","author":"call\u00f3n","year":"2018","journal-title":"SENSORS"},{"key":"ref16","first-page":"2825","article-title":"Scikit-learn: Machine learning in python","volume":"12","author":"pedregosa","year":"2011","journal-title":"Journal of Machine Learning Research"},{"key":"ref17","doi-asserted-by":"publisher","DOI":"10.1145\/1656274.1656278"},{"key":"ref18","doi-asserted-by":"publisher","DOI":"10.1145\/1964114.1964121"},{"key":"ref19","doi-asserted-by":"publisher","DOI":"10.1145\/1552303.1552306"},{"key":"ref4","doi-asserted-by":"publisher","DOI":"10.1145\/1189740.1189744"},{"key":"ref3","doi-asserted-by":"publisher","DOI":"10.1145\/1189702.1189703"},{"key":"ref6","first-page":"17","article-title":"Improving cloaking detection using search query popularity and monetizability","author":"chellapilla","year":"2006","journal-title":"AIRWeb"},{"key":"ref5","first-page":"23","article-title":"Recognizing nepotistic links on the web","author":"davisons","year":"2000","journal-title":"Artificial Intelligence for Web search"},{"key":"ref8","doi-asserted-by":"publisher","DOI":"10.1145\/1531914.1531918"},{"key":"ref7","doi-asserted-by":"publisher","DOI":"10.1145\/1531914.1531928"},{"key":"ref49","doi-asserted-by":"publisher","DOI":"10.1145\/2567948.2577304"},{"key":"ref9","doi-asserted-by":"publisher","DOI":"10.1145\/1076034.1076037"},{"journal-title":"Webspam-uk2007 (current dataset)","year":"0","author":"castillo","key":"ref46"},{"key":"ref45","doi-asserted-by":"publisher","DOI":"10.1093\/bioinformatics\/btg419"},{"key":"ref48","doi-asserted-by":"publisher","DOI":"10.1145\/1963405.1963488"},{"key":"ref47","first-page":"595","article-title":"The WebGraph framework I: Compression techniques","author":"boldi","year":"2004","journal-title":"Proc of the Thirteenth International World Wide Web Conference (WWW 2004)"},{"journal-title":"Train\/test split and cross validation in python towards data science","year":"0","author":"bronshtein","key":"ref42"},{"key":"ref41","first-page":"18","article-title":"Classification and regression by randomforest","volume":"2","author":"liaw","year":"2002","journal-title":"R News"},{"key":"ref44","volume":"112","author":"james","year":"2013","journal-title":"An Introduction to Statistical Learning with Applications in R (Springer Texts in Statistics)"},{"journal-title":"A Gentle Introduction to k-fold Cross-Validation","year":"0","author":"brownlee","key":"ref43"}],"event":{"name":"2019 IEEE International Conference on Big Data (Big Data)","start":{"date-parts":[[2019,12,9]]},"location":"Los Angeles, CA, USA","end":{"date-parts":[[2019,12,12]]}},"container-title":["2019 IEEE International Conference on Big Data (Big Data)"],"original-title":[],"link":[{"URL":"http:\/\/xplorestaging.ieee.org\/ielx7\/8986695\/9005444\/09006282.pdf?arnumber=9006282","content-type":"unspecified","content-version":"vor","intended-application":"similarity-checking"}],"deposited":{"date-parts":[[2022,7,17]],"date-time":"2022-07-17T21:47:57Z","timestamp":1658094477000},"score":1,"resource":{"primary":{"URL":"https:\/\/ieeexplore.ieee.org\/document\/9006282\/"}},"subtitle":[],"short-title":[],"issued":{"date-parts":[[2019,12]]},"references-count":51,"URL":"https:\/\/doi.org\/10.1109\/bigdata47090.2019.9006282","relation":{},"subject":[],"published":{"date-parts":[[2019,12]]}}}