{"status":"ok","message-type":"work","message-version":"1.0.0","message":{"indexed":{"date-parts":[[2026,6,17]],"date-time":"2026-06-17T17:22:00Z","timestamp":1781716920215,"version":"3.54.5"},"publisher-location":"Berlin, Heidelberg","reference-count":35,"publisher":"Springer Berlin Heidelberg","isbn-type":[{"value":"9783540360360","type":"print"},{"value":"9783540360377","type":"electronic"}],"content-domain":{"domain":[],"crossmark-restriction":false},"short-container-title":[],"published-print":{"date-parts":[[2006]]},"DOI":"10.1007\/11790853_9","type":"book-chapter","created":{"date-parts":[[2006,7,12]],"date-time":"2006-07-12T04:22:02Z","timestamp":1152678122000},"page":"106-120","source":"Crossref","is-referenced-by-count":51,"title":["A Comparative Performance Study of Feature Selection Methods for the Anti-spam Filtering Domain"],"prefix":"10.1007","author":[{"given":"J. R.","family":"M\u00e9ndez","sequence":"first","affiliation":[],"role":[{"vocabulary":"crossref","role":"author"}]},{"given":"F.","family":"Fdez-Riverola","sequence":"additional","affiliation":[],"role":[{"vocabulary":"crossref","role":"author"}]},{"given":"F.","family":"D\u00edaz","sequence":"additional","affiliation":[],"role":[{"vocabulary":"crossref","role":"author"}]},{"given":"E. L.","family":"Iglesias","sequence":"additional","affiliation":[],"role":[{"vocabulary":"crossref","role":"author"}]},{"given":"J. M.","family":"Corchado","sequence":"additional","affiliation":[],"role":[{"vocabulary":"crossref","role":"author"}]}],"member":"297","reference":[{"key":"9_CR1","unstructured":"Spam statistics, http:\/\/www.theregister.co.uk\/security\/spam\/"},{"key":"9_CR2","doi-asserted-by":"publisher","first-page":"141","DOI":"10.1023\/A:1008287121180","volume":"7","author":"D.W. Oard","year":"1997","unstructured":"Oard, D.W.: The state of the art in text filtering. User Modeling and User-Adapted Interaction\u00a07, 141\u2013178 (1997)","journal-title":"User Modeling and User-Adapted Interaction"},{"key":"9_CR3","unstructured":"Wittel, G.L., Wu, S.F.: On Attacking Statistical Spam Filters. In: Proc. of the First Conference on E-mail and Anti-Spam CEAS (2004)"},{"key":"9_CR4","unstructured":"Androutsopoulos, I., Paliouras, G., Michelakis, E.: Learning to Filter Unsolicited Commercial E-Mail. Technical Report 2004\/2, NCSR Demokritos (2004)"},{"key":"9_CR5","unstructured":"M\u00e9ndez, J.R., Iglesias, E.L., Fdez-Riverola, F., D\u00edaz, F., Corchado, J.M.: Analyzing the Impact of Corpus Preprocessing on Anti-Spam Filtering Software. Research on Computing Science (to appear, 2005)"},{"key":"9_CR6","series-title":"Lecture Notes in Computer Science","doi-asserted-by":"publisher","first-page":"107","DOI":"10.1007\/3-540-45006-8_11","volume-title":"Case-Based Reasoning Research and Development","author":"J.M. Corchado","year":"2003","unstructured":"Corchado, J.M., Corchado, E.S., Aiken, J., Fyfe, C., Fdez-Riverola, F., Glez-Bedia, M.: Maximum Likelihood Hebbian Learning Based Retrieval Method for CBR Systems. In: Ashley, K.D., Bridge, D.G. (eds.) ICCBR 2003. LNCS, vol.\u00a02689, pp. 107\u2013121. Springer, Heidelberg (2003)"},{"key":"9_CR7","series-title":"Lecture Notes in Computer Science","doi-asserted-by":"publisher","first-page":"533","DOI":"10.1007\/978-3-540-28631-8_39","volume-title":"Advances in Case-Based Reasoning","author":"J.M. Corchado","year":"2004","unstructured":"Corchado, J.M., Aiken, J., Corchado, E., Lefevre, N., Smyth, T.: Quantifying the ocean\u2019s CO2 budget with a coHeL-IBR system. In: Funk, P., Gonz\u00e1lez Calero, P.A. (eds.) ECCBR 2004. LNCS, vol.\u00a03155, pp. 533\u2013546. Springer, Heidelberg (2004)"},{"key":"9_CR8","doi-asserted-by":"crossref","unstructured":"Fdez-Riverola, F., Lorenzo, E.L., D\u00edaz, F., M\u00e9ndez, J.R., Corchado, J.M.: SpamHunting: An Instance-Based Reasoning System for Spam Labelling and Filtering. Decision Support Systems (to appear, 2006)","DOI":"10.1016\/j.dss.2006.11.012"},{"key":"9_CR9","unstructured":"Sahami, M., Dumais, S., Heckerman, D., Horvitz, E.: A Bayesian approach to filtering junk e-mail. In: Learning for Text Categorization \u2013 Papers from the AAAI Workshop, Technical Report WS-98-05, pp. 55\u201362 (1998)"},{"key":"9_CR10","unstructured":"Carreras, X., M\u00e0rquez, L.: Boosting trees for anti-spam e-mail filtering. In: Proc. of the 4th International Conference on Recent Advances in Natural Language Processing, pp. 58\u201364 (2001)"},{"key":"9_CR11","doi-asserted-by":"crossref","unstructured":"Vapnik, V.: The Nature of Statistical Learning Theory, 2nd edn. Statistics for Engineering and Information Science (1999)","DOI":"10.1007\/978-1-4757-3264-1"},{"key":"9_CR12","unstructured":"Delany, S.J., Cunningham, P., Coyle, L.: An Assessment of Case-base Reasoning for Spam Filtering. In: Proc. of Fifteenth Irish Conference on Artificial Intelligence and Cognitive Science: AICS 2004, pp. 9\u201318 (2004)"},{"key":"9_CR13","unstructured":"Yang, Y., Pedersen, J.O.: A comparative study on feature selection in text categorization. In: Proc. of the Fourteenth International Conference on Machine Learning: ICML 1997, pp. 412\u2013420 (1997)"},{"key":"9_CR14","volume-title":"Machine Learning","author":"T. Mitchell","year":"1996","unstructured":"Mitchell, T.: Machine Learning. Mc Graw Hill, New York (1996)"},{"key":"9_CR15","doi-asserted-by":"crossref","unstructured":"Dumais, S., Platt, J., Heckerman, D., Sahami, M.: Inductive learning algorithms and representations for text categorization. In: Proc. of the 7th International Conference on Information and Knowledge Management, pp. 229\u2013237 (1998)","DOI":"10.1145\/288627.288651"},{"key":"9_CR16","doi-asserted-by":"crossref","unstructured":"Church, K.W., Hanks, P.: Word association norms, mutual information and lexicography. In: Proc. of the ACL, vol.\u00a027, pp. 76\u201383 (1989)","DOI":"10.3115\/981623.981633"},{"issue":"1","key":"9_CR17","doi-asserted-by":"publisher","first-page":"1","DOI":"10.1145\/505282.505283","volume":"34","author":"F. Sebastiani","year":"2002","unstructured":"Sebastiani, F.: Machine Learning in Automated Text Categorization. ACM Computing Surveys\u00a034(1), 1\u201347 (2002)","journal-title":"ACM Computing Surveys"},{"issue":"5","key":"9_CR18","doi-asserted-by":"publisher","first-page":"1048","DOI":"10.1109\/72.788645","volume":"10","author":"H.D. Drucker","year":"1999","unstructured":"Drucker, H.D., Wu, D., Vapnik, V.: Support Vector Machines for spam categorization. IEEE Transactions on Neural Networks\u00a010(5), 1048\u20131054 (1999)","journal-title":"IEEE Transactions on Neural Networks"},{"key":"9_CR19","doi-asserted-by":"crossref","unstructured":"Platt, J.: Fast training of Support Vector Machines using Sequential Minimal Optimization. In: Sholkopf, B., Burges, C., Smola, A. (eds.) Advances in Kernel Methods \u2013 Support Vector Learning, pp. 185\u2013208 (1999)","DOI":"10.7551\/mitpress\/1130.003.0016"},{"issue":"2\/3","key":"9_CR20","doi-asserted-by":"publisher","first-page":"135","DOI":"10.1023\/A:1007649029923","volume":"39","author":"R.E. Schapire","year":"2000","unstructured":"Schapire, R.E., Singer, Y.: BoosTexter: a boosting-based system for text categorization. Machine Learning\u00a039(2\/3), 135\u2013168 (2000)","journal-title":"Machine Learning"},{"key":"9_CR21","unstructured":"Tsymbal, A.: The problem of concept drift: definitions and related work, available at: http:\/\/www.cs.tcd.ie"},{"key":"9_CR22","unstructured":"Graham, P.: Better Bayesian filtering. In: Proc. of the MIT Spam Conference (2003)"},{"key":"9_CR23","unstructured":"Kolcz, A., Alspector, J.: SVM-based filtering of e-mail spam with content specific misclassification costs. In: Proc. of the ICDM Workshop on Text Mining (2001)"},{"key":"9_CR24","unstructured":"Hovold, J.: Na\u00efve Bayes Spam Filtering Using Word-Position-Based Attributes. In: Proc. of the Second Conference on Email and Anti-Spam CEAS 2005, http:\/\/www.ceas.cc\/papers-2005\/144.pdf"},{"key":"9_CR25","series-title":"Lecture Notes in Computer Science","doi-asserted-by":"publisher","first-page":"765","DOI":"10.1007\/3-540-36131-6_78","volume-title":"Advances in Artificial Intelligence - IBERAMIA 2002","author":"J. Gama","year":"2002","unstructured":"Gama, J., Castillo, G.: Adaptive Bayes. In: Garijo, F.J., Riquelme, J.-C., Toro, M. (eds.) IBERAMIA 2002. LNCS, vol.\u00a02527, pp. 765\u2013774. Springer, Heidelberg (2002)"},{"key":"9_CR26","unstructured":"Scholz, M., Klinkenberg, R.: An Ensemble Classifier for Drifting Concepts. In: Proc. of the Second International Workshop on Knowledge Discovery from Data Streams, pp. 53\u201364 (2005)"},{"key":"9_CR27","doi-asserted-by":"crossref","unstructured":"Syed, N.A., Liu, H., Sung, K.K.: Handling Concept Drifts in Incremental Learning with Support Vector Machines. In: Proc. of the fifth ACM SIGKDD international conference on Knowledge discovery and data mining, pp. 317\u2013321 (1999)","DOI":"10.1145\/312129.312267"},{"key":"9_CR28","series-title":"Lecture Notes in Artificial Intelligence","doi-asserted-by":"publisher","first-page":"1","DOI":"10.1007\/3-540-45372-5_1","volume-title":"Principles of Data Mining and Knowledge Discovery","author":"I. Androutsopoulos","year":"2000","unstructured":"Androutsopoulos, I., Paliouras, G., Karkaletsis, V., Sakkis, G., Spyropoulos, C.D., Stamatopoulos, P.: Learning to Filter Spam E-Mail: A Comparison of a Na\u00efve Bayesian and a Memory-Based Approach. In: Zighed, A.D.A., Komorowski, J., \u017bytkow, J.M. (eds.) PKDD 2000. LNCS (LNAI), vol.\u00a01910, pp. 1\u201313. Springer, Heidelberg (2000)"},{"key":"9_CR29","unstructured":"Daelemans, W., Jakub, Z., Sloot, K., Bosh, A.: TiMBL. Tilburg Memory Based Learning, version 5.1, Reference Guide. ILK, Computational Linguistics, Tilburg University, http:\/\/ilk.uvt.nl\/software.html#timbl"},{"key":"9_CR30","series-title":"Lecture Notes in Computer Science","doi-asserted-by":"publisher","first-page":"51","DOI":"10.1007\/3-540-69351-3_3","volume-title":"Case-Based Reasoning Technology","author":"M. Lenz","year":"1998","unstructured":"Lenz, M., Auriol, E., Manago, M.: Diagnosis and Decision Support. In: Lenz, M., Bartsch-Sp\u00f6rl, B., Burkhard, H.-D., Wess, S. (eds.) Case-Based Reasoning Technology. LNCS, vol.\u00a01400, pp. 51\u201390. Springer, Heidelberg (1998)"},{"key":"9_CR31","volume-title":"Information Retrieval: Data Structures & Algorithms","author":"B. Frakes","year":"2000","unstructured":"Frakes, B., Baeza-Yates, R.: Information Retrieval: Data Structures & Algorithms. Prentice-Hall, Englewood Cliffs (2000)"},{"key":"9_CR32","unstructured":"NIST: National Institute of Science and Technology. Reuters corpora (2004), http:\/\/trec.nist.gov\/data\/reuters\/reuters.html"},{"key":"9_CR33","volume-title":"Introduction to modern information retrieval","author":"G. Salton","year":"1983","unstructured":"Salton, G., McGill, M.: Introduction to modern information retrieval. McGraw-Hill, New York (1983)"},{"issue":"1","key":"9_CR34","doi-asserted-by":"publisher","first-page":"49","DOI":"10.1023\/A:1022948414856","volume":"6","author":"G. Sakkis","year":"2003","unstructured":"Sakkis, G., Androutsopoulos, I., Paliouras, G., Karkaletsis, V., Spyropoulos, C., Stamatopoulos, P.: A Memory-Based Approach to Anti-Spam Filtering for Mailing Lists. Information Retrieval\u00a06(1), 49\u201373 (2003)","journal-title":"Information Retrieval"},{"key":"9_CR35","unstructured":"Kohavi, R.: A study of cross-validation and bootstrap for accuracy estimation and model selection. In: Proc. of the 14th International Joint Conference on Artificial Intelligence: IJCAI 1995, pp. 1137\u20131143 (1995)"}],"container-title":["Lecture Notes in Computer Science","Advances in Data Mining. Applications in Medicine, Web Mining, Marketing, Image and Signal Mining"],"original-title":[],"link":[{"URL":"http:\/\/link.springer.com\/content\/pdf\/10.1007\/11790853_9.pdf","content-type":"unspecified","content-version":"vor","intended-application":"similarity-checking"}],"deposited":{"date-parts":[[2023,5,7]],"date-time":"2023-05-07T21:16:51Z","timestamp":1683494211000},"score":1,"resource":{"primary":{"URL":"http:\/\/link.springer.com\/10.1007\/11790853_9"}},"subtitle":[],"short-title":[],"issued":{"date-parts":[[2006]]},"ISBN":["9783540360360","9783540360377"],"references-count":35,"URL":"https:\/\/doi.org\/10.1007\/11790853_9","relation":{},"ISSN":["0302-9743","1611-3349"],"issn-type":[{"value":"0302-9743","type":"print"},{"value":"1611-3349","type":"electronic"}],"subject":[],"published":{"date-parts":[[2006]]}}}