{"status":"ok","message-type":"work","message-version":"1.0.0","message":{"indexed":{"date-parts":[[2024,9,4]],"date-time":"2024-09-04T23:56:51Z","timestamp":1725494211565},"publisher-location":"Berlin, Heidelberg","reference-count":25,"publisher":"Springer Berlin Heidelberg","isbn-type":[{"type":"print","value":"9783540769927"}],"content-domain":{"domain":[],"crossmark-restriction":false},"short-container-title":[],"DOI":"10.1007\/978-3-540-76993-4_14","type":"book-chapter","created":{"date-parts":[[2007,11,6]],"date-time":"2007-11-06T11:30:45Z","timestamp":1194348645000},"page":"159-170","source":"Crossref","is-referenced-by-count":4,"title":["Adaptive Email Spam Filtering Based on Information Theory"],"prefix":"10.1007","author":[{"given":"Xin","family":"Zhang","sequence":"first","affiliation":[]},{"given":"Wenyuan","family":"Dai","sequence":"additional","affiliation":[]},{"given":"Gui-Rong","family":"Xue","sequence":"additional","affiliation":[]},{"given":"Yong","family":"Yu","sequence":"additional","affiliation":[]}],"member":"297","reference":[{"key":"14_CR1","unstructured":"Androutsopoulos, I., Koutsias, J., Chandrinos, K.V., Paliouras, G., Spyropoulos, C.D.: An Evaluation of Naive Bayesian Anti-Spam Filtering. In: Proceedings of the Workshop on Machine Learning in the New Information Age, 11th European Conference on Machine Learning (2000)"},{"key":"14_CR2","doi-asserted-by":"crossref","unstructured":"Androutsopoulos, I., Koutsias, J., Chandrinos, K.V., Spyropoulos, C.D.: An Experimental Comparison of Naive Bayesian and Keyword-Based Anti-Spam Filtering with Encrypted Person-al E-mail Messages. In: Proceedings of the 23rd Annual International ACM SIGIR Conference on Research and Development in Information Retrieval (2000)","DOI":"10.1145\/345508.345569"},{"key":"14_CR3","unstructured":"Bickel, S.: ECML-PKDD Discovery Challenge 2006 Overview. In: Proceedings of the ECML\/PKDD Discovery Challenge Workshop (2006)"},{"key":"14_CR4","doi-asserted-by":"crossref","unstructured":"Bickel, S., Scheffer, T.: Dirichlet-Enhanced Spam Filtering based on Biased Samples. Advances in Neural Information Processing Systems (2006)","DOI":"10.7551\/mitpress\/7503.003.0025"},{"key":"14_CR5","doi-asserted-by":"crossref","unstructured":"Boser, B.E., Guyon, I., Vapnik, V.: A Training Algorithm for Optimal Margin Classifiers. In: Proceedings of the Fifth Annual Workshop on Computational Learning Theory (1992)","DOI":"10.1145\/130385.130401"},{"key":"14_CR6","unstructured":"Carreras, X., Mrquez, L.: Boosting Trees for Anti-spam Email Filtering. In: Proceedings of the 2001 International Conference on Recent Advances in Natural Language Processing (2001)"},{"key":"14_CR7","doi-asserted-by":"crossref","DOI":"10.1002\/0471200611","volume-title":"Elements of information theory","author":"T.M. Cover","year":"1991","unstructured":"Cover, T.M., Thomas, J.A.: Elements of information theory. Wiley-Interscience, New York, NY, USA (1991)"},{"key":"14_CR8","doi-asserted-by":"crossref","unstructured":"Dhillon, I.S., Mallela, S., Kumar, R.: Enhanced Word Clustering for Hierarchical Text Classifi-cation. In: Proceedings of the Eighth ACM SIGKDD International Conference on Knowledge Dis-covery and Data Mining (2002)","DOI":"10.1145\/775047.775076"},{"key":"14_CR9","doi-asserted-by":"crossref","unstructured":"Dhillon, I.S., Mallela, S., Modha, D.S.: Information-Theoretic Co-clustering. In: Proceedings of the Ninth ACM SIGKDD International Conference on Knowledge Discovery and Data Mining (2003)","DOI":"10.1145\/956750.956764"},{"key":"14_CR10","unstructured":"Frank, E., Witten, I.H.: Generating accurate rule sets without global optimization. In: Proceedings of the Fifteenth International Conference on Machine Learning (1998)"},{"key":"14_CR11","doi-asserted-by":"crossref","unstructured":"Hidalgo, J.G.: Evaluating cost-sensitive unsolicited bulk email categorization. In: Proceedings of 17th ACM Symposium on Applied Computing (2002)","DOI":"10.1145\/508791.508911"},{"key":"14_CR12","doi-asserted-by":"crossref","unstructured":"Joachims, T.: Learning to classify text using support vector machines. Dissertation, Kluwer (2002)","DOI":"10.1007\/978-1-4615-0907-3"},{"key":"14_CR13","doi-asserted-by":"crossref","unstructured":"Junejo, K., Yousaf, M., Karim, A.: A Two-Pass Statistical Approach for Automatic Persona-lized Spam Filtering. In: Proceedings of the ECML\/PKDD Discovery Challenge Workshop (2006)","DOI":"10.1109\/WI.2007.47"},{"key":"14_CR14","doi-asserted-by":"crossref","unstructured":"Klimt, F., Yang, Y.: The Enron corpus: A new dataset for email classification research. In: Proceedings of the European Conference on Machine Learning (2004)","DOI":"10.1007\/978-3-540-30115-8_22"},{"issue":"1","key":"14_CR15","doi-asserted-by":"crossref","first-page":"79","DOI":"10.1214\/aoms\/1177729694","volume":"22","author":"S. Kullback","year":"1951","unstructured":"Kullback, S., Leibler, R.A.: On information and sufficiency. Annals of Mathematical Statis-tics\u00a022(1), 79\u201386 (1951)","journal-title":"Annals of Mathematical Statis-tics"},{"key":"14_CR16","doi-asserted-by":"crossref","first-page":"839","DOI":"10.1148\/radiology.148.3.6878708","volume":"148","author":"J. Hanley","year":"1983","unstructured":"Hanley, J., McNeil, B.: A Method of Comparing the Areas under Receiver Operating Characteristic Curves Derived from the Same Cases. Radiology\u00a0148, 839\u2013843 (1983)","journal-title":"Radiology"},{"key":"14_CR17","unstructured":"Lewis, D.D.: Representation and Learning in Information Retrieval. Doctoral dissertation, Amherst, MA, USA (1992)"},{"key":"14_CR18","unstructured":"Metsis, V., Androutsopoulos, I., Paliouras, G.: Spam Filtering with Naive Bayes? Which Naive Bayes? In: Proceedings of the 3rd Conference on Email and Anti-Spam (2006)"},{"key":"14_CR19","unstructured":"Michelakis, E., Androutsopoulos, I., Paliouras, G., Sakkis, G., Stamatopoulos, P.: Filtron: A Learning-Based Anti-Spam Filter. In: Proceedings of the 1st Conference on Email and Anti-Spam (2004)"},{"key":"14_CR20","volume-title":"C4.5: Programs for Machine Learning","author":"J.R. Quinlan","year":"1993","unstructured":"Quinlan, J.R.: C4.5: Programs for Machine Learning. Morgan Kaufmann, San Mateo, CA (1993)"},{"key":"14_CR21","unstructured":"Rocchio, J.J.: Relevance Feedback in Information Retrieval. In: The SMART Retrieval System: Experiments in Automatics Document Processing (1971)"},{"key":"14_CR22","unstructured":"Sahami, M., Dumais, S., Heckerman, D., Horvitz, E.: A Bayesian Approach to Filtering Junk E-mail. In: AAAI 1998 Workshop on Learning for Text Categorization (1998)"},{"key":"14_CR23","doi-asserted-by":"crossref","unstructured":"Slonim, N., Tishby, N.: Document Clustering using Word Clusters via the Information Bottle-neck Method. In: Proceedings of the Twenty-Third Annual International ACM SIGIR Conference on Research and Development in Information Retrieval (2000)","DOI":"10.1145\/345508.345578"},{"key":"14_CR24","unstructured":"Yang, Y., Pedersen, J.O.: A Comparative Study on Feature Selection in Text Categorization. In: Proceedings of Fourteenth International Conference on Machine Learning (1997)"},{"key":"14_CR25","unstructured":"Zhang, L., Yao, T.: Filtering Junk Mail with a Maximum Entropy Model. In: Proceedings of the 20th International Conference on Computer Processing of Oriental Languages (2003)"}],"container-title":["Lecture Notes in Computer Science","Web Information Systems Engineering \u2013 WISE 2007"],"original-title":[],"language":"en","link":[{"URL":"http:\/\/link.springer.com\/content\/pdf\/10.1007\/978-3-540-76993-4_14.pdf","content-type":"unspecified","content-version":"vor","intended-application":"similarity-checking"}],"deposited":{"date-parts":[[2024,2,18]],"date-time":"2024-02-18T21:43:07Z","timestamp":1708292587000},"score":1,"resource":{"primary":{"URL":"http:\/\/link.springer.com\/10.1007\/978-3-540-76993-4_14"}},"subtitle":[],"short-title":[],"issued":{"date-parts":[[null]]},"ISBN":["9783540769927"],"references-count":25,"URL":"https:\/\/doi.org\/10.1007\/978-3-540-76993-4_14","relation":{},"subject":[]}}