{"status":"ok","message-type":"work","message-version":"1.0.0","message":{"indexed":{"date-parts":[[2025,5,4]],"date-time":"2025-05-04T04:06:27Z","timestamp":1746331587271,"version":"3.40.4"},"publisher-location":"Cham","reference-count":31,"publisher":"Springer International Publishing","isbn-type":[{"type":"print","value":"9783319089751"},{"type":"electronic","value":"9783319089768"}],"content-domain":{"domain":[],"crossmark-restriction":false},"short-container-title":[],"published-print":{"date-parts":[[2014]]},"DOI":"10.1007\/978-3-319-08976-8_4","type":"book-chapter","created":{"date-parts":[[2014,7,17]],"date-time":"2014-07-17T14:03:29Z","timestamp":1405605809000},"page":"39-54","source":"Crossref","is-referenced-by-count":10,"title":["Analysis and Evaluation of Web Pages Classification Techniques for Inappropriate Content Blocking"],"prefix":"10.1007","author":[{"given":"Igor","family":"Kotenko","sequence":"first","affiliation":[],"role":[{"role":"author","vocabulary":"crossref"}]},{"given":"Andrey","family":"Chechulin","sequence":"additional","affiliation":[],"role":[{"role":"author","vocabulary":"crossref"}]},{"given":"Andrey","family":"Shorov","sequence":"additional","affiliation":[],"role":[{"role":"author","vocabulary":"crossref"}]},{"given":"Dmitry","family":"Komashinsky","sequence":"additional","affiliation":[],"role":[{"role":"author","vocabulary":"crossref"}]}],"member":"297","reference":[{"unstructured":"Agrwal, R., Srikant, R.: First algorithms for mining association rules. In: Proc. of the 20th Very Large Data Bases Conference, pp. 487\u2013499 (1994)","key":"4_CR1"},{"doi-asserted-by":"crossref","unstructured":"Baykan, E., Henzinger, M., Marian, L., Weber, I.: Purely URL-based topic classification. In: Proc. of the WWW 2009, New York, USA, pp. 1109\u20131110 (2009)","key":"4_CR2","DOI":"10.1145\/1526709.1526880"},{"doi-asserted-by":"crossref","unstructured":"Calado, P., Cristo, M., Moura, E., Ziviani, N., Ribeiro-Neto, B., Goncalves, M.A.: Combining link-based and content-based methods for web document classification. In: Proc. of the CIKM 2003, New York, USA, pp. 394\u2013401 (2003)","key":"4_CR3","DOI":"10.1145\/956863.956938"},{"issue":"3","key":"4_CR4","doi-asserted-by":"publisher","first-page":"163","DOI":"10.1007\/s007780050061","volume":"7","author":"S. Chakrabarti","year":"1998","unstructured":"Chakrabarti, S., Dom, B., Agrawal, R., Raghavan, P.: Scalable feature selection, classification and signature generation for organizing large text databases into hierarchical topic taxonomies. The Intern. Journ. on Very Large Data Bases\u00a07(3), 163\u2013178 (1998)","journal-title":"The Intern. Journ. on Very Large Data Bases"},{"doi-asserted-by":"crossref","unstructured":"Cooley, R., Mobasher, B., Srivastava, J.: Web mining: Information and pattern discovery on the world wide web. In: Proc. of the ICTAI 1997, pp. 558\u2013567 (1997)","key":"4_CR5","DOI":"10.1109\/TAI.1997.632303"},{"key":"4_CR6","first-page":"256","volume-title":"Proc. of the SIGIR 2000","author":"S. Dumais","year":"2000","unstructured":"Dumais, S., Chen, H.: Hierarchical classification of Web content. In: Proc. of the SIGIR 2000, pp. 256\u2013263. ACM, New York (2000)"},{"doi-asserted-by":"crossref","unstructured":"Dumais, S.T., Platt, J., Heckermann, D., Sahami, M.: Inductive learning algorithms and representations for text categorization. In: Proc. of the CIKM 1998, pp. 148\u2013155 (1998)","key":"4_CR7","DOI":"10.1145\/288627.288651"},{"unstructured":"F-Secure company, http:\/\/www.f-secure.com\/","key":"4_CR8"},{"unstructured":"Java HTML Parser, http:\/\/jsoup.org\/","key":"4_CR9"},{"key":"4_CR10","series-title":"Lecture Notes in Computer Science","doi-asserted-by":"crossref","first-page":"137","DOI":"10.1007\/BFb0026683","volume-title":"Machine Learning: ECML-98","author":"T. Joachims","year":"1998","unstructured":"Joachims, T.: Text categorization with support vector machines: learning with many relevant features. In: N\u00e9dellec, C., Rouveirol, C. (eds.) ECML 1998. LNCS, vol.\u00a01398, pp. 137\u2013142. Springer, Heidelberg (1998)"},{"doi-asserted-by":"crossref","unstructured":"Kan, M.Y., Thi, H.O.N.: Fast webpage classification using url features. In: Proc. of the CIKM 2005, New York, USA, pp. 325\u2013326 (2005)","key":"4_CR11","DOI":"10.1145\/1099554.1099649"},{"doi-asserted-by":"crossref","unstructured":"Kan, M.Y.: Web page classification without the web page. In: Proc. of the WWW Alt. 2004, New York, USA, pp. 262\u2013263 (2004)","key":"4_CR12","DOI":"10.1145\/1013367.1013426"},{"key":"4_CR13","series-title":"Lecture Notes in Computer Science","doi-asserted-by":"publisher","first-page":"1","DOI":"10.1007\/3-540-48686-0_1","volume-title":"Computing and Combinatorics","author":"J.M. Kleinberg","year":"1999","unstructured":"Kleinberg, J.M., Kumar, R., Raghavan, P., Rajagopalan, S., Tomkins, A.S.: The Web as a Graph: Measurements, Models, and Methods. In: Asano, T., Imai, H., Lee, D.T., Nakano, S., Tokuyama, T. (eds.) COCOON 1999. LNCS, vol.\u00a01627, pp. 1\u201317. Springer, Heidelberg (1999)"},{"unstructured":"Komashinskiy, D.V., Kotenko, I.V., Chechulin, A.A.: Categorization of web sites for inadmissible web pages blocking. High Availability Systems\u00a0(2), 102\u2013106 (2011)","key":"4_CR14"},{"unstructured":"Kotenko, I.V., Chechulin, A.A., Shorov, A.V., Komashinkiy, D.V.: Automatic system for categorization of websites for blocking web pages with inappropriate. High Availability Systems\u00a0(3), 119\u2013127 (2013)","key":"4_CR15"},{"issue":"1","key":"4_CR16","doi-asserted-by":"publisher","first-page":"25","DOI":"10.1016\/S0306-4573(02)00022-5","volume":"29","author":"O.W. Kwon","year":"2003","unstructured":"Kwon, O.W., Lee, J.H.: Text categorization based on k-nearest neighbor approach for web site classification. Information Processing and Management: an International Journal\u00a029(1), 25\u201344 (2003)","journal-title":"Information Processing and Management: an International Journal"},{"doi-asserted-by":"crossref","unstructured":"Kwon, O.W., Lee, J.H.: Web page classification based on k-nearest neighbor approach. In: Proc. of the IRAL 2000, New York, USA, pp. 9\u201315 (2000)","key":"4_CR17","DOI":"10.1145\/355214.355216"},{"issue":"1","key":"4_CR18","doi-asserted-by":"publisher","first-page":"34","DOI":"10.1145\/595576.595579","volume":"1","author":"Y.S. Lai","year":"2002","unstructured":"Lai, Y.S., Wu, C.H.: Meaningful term extraction and discriminative term selection in text categorization via unknown-word methodology. ACM Transactions on Asian Language Information Processing (TALIP)\u00a01(1), 34\u201364 (2002)","journal-title":"ACM Transactions on Asian Language Information Processing (TALIP)"},{"doi-asserted-by":"crossref","unstructured":"Lam, W., Ho, C.Y.: Using a generalized instance set for automatic text categorization. In: Proc. of the SIGIR 1998, Melbourne, Australia, pp. 81\u201389 (1998)","key":"4_CR19","DOI":"10.1145\/290941.290961"},{"doi-asserted-by":"crossref","unstructured":"Lewis, D.D.: An evaluation of phrasal and clustered representations on a text categorization task. In: Proc. of the SIGIR 1992, Copenhagen, Denmark, pp. 37\u201350 (1992)","key":"4_CR20","DOI":"10.1145\/133160.133172"},{"unstructured":"McCallum, A., Nigam, K.: A comparison of event models for naive Bayes text classification. In: Proc. of the AAAI\/ICML 1998, pp. 41\u201348. AAAI Press (1998)","key":"4_CR21"},{"unstructured":"Patil, A., Pawar, B.: Automated Classification of Web Sites using Naive Bayessian Algorithm. In: Proc. of the IMECS 2012, vol.\u00a01, p. 466 (2012)","key":"4_CR22"},{"doi-asserted-by":"crossref","unstructured":"Qi, X., Davison, B.D.: Knowing a Web Page by the Company It Keeps. In: Proc. of the CIKM 2006, pp. 228\u2013237 (2006)","key":"4_CR23","DOI":"10.1145\/1183614.1183650"},{"doi-asserted-by":"crossref","unstructured":"Qi, X., Davison, B.D.: Web Page Classification: Features and algorithms. ACM Computing Surveys (CSUR)\u00a041(2), article No.12 (2009)","key":"4_CR24","DOI":"10.1145\/1459352.1459357"},{"unstructured":"RapidMiner, http:\/\/rapid-i.com\/content\/view\/181\/190\/","key":"4_CR25"},{"key":"4_CR26","series-title":"The Springer International Series in Engineering and Computer Science","doi-asserted-by":"publisher","first-page":"49","DOI":"10.1007\/978-1-4615-6163-7","volume-title":"Multimedia Information Retrieval: Content-Based Information Retrieval from Large Text and Audio Databases","author":"P. Schauble","year":"1997","unstructured":"Schauble, P.: Multimedia Information Retrieval: Content-Based Information Retrieval from Large Text and Audio Databases. The Springer International Series in Engineering and Computer Science, pp. 49\u201359. Kluwer Academic Publishers, Norwell (1997)"},{"issue":"6","key":"4_CR27","doi-asserted-by":"publisher","first-page":"897","DOI":"10.7763\/IJCTE.2010.V2.259","volume":"2","author":"S. Shibu","year":"2010","unstructured":"Shibu, S., Vishwakarma, A., Bhargava, N.: A combination approach for Web Page Classification using Page Rank and Feature Selection Technique. International Journal of Computer Theory and Engineering\u00a02(6), 897\u2013900 (2010)","journal-title":"International Journal of Computer Theory and Engineering"},{"key":"4_CR28","series-title":"LNAI","doi-asserted-by":"crossref","first-page":"303","DOI":"10.1007\/3-540-45490-X_36","volume-title":"Web Intelligence: Research and Development","author":"M. Tsukada","year":"2001","unstructured":"Tsukada, M., Washio, T., Motoda, H.: Automatic Web-Page Classification by Using Machine Learning Methods. In: Zhong, N., Yao, Y., Ohsuga, S., Liu, J. (eds.) WI 2001. LNCS (LNAI), vol.\u00a02198, pp. 303\u2013313. Springer, Heidelberg (2001)"},{"doi-asserted-by":"crossref","unstructured":"Xu, Z., Yan, F., Qin, J., Zhu, H.: A Web Page Classification Algorithm Based on Link Information. In: Proc. of the DCABES 2011, pp. 82\u201386. IEEE Computer Society (2011)","key":"4_CR29","DOI":"10.1109\/DCABES.2011.19"},{"unstructured":"Yandex. Translate API: http:\/\/api.yandex.com\/translate\/","key":"4_CR30"},{"doi-asserted-by":"crossref","unstructured":"Yang, Y., Liu, X.: A re-examination of text categorization methods. In: Proc. of the SIGIR 1999, Berkeley, CA, pp. 42\u201349 (1999)","key":"4_CR31","DOI":"10.1145\/312624.312647"}],"container-title":["Lecture Notes in Computer Science","Advances in Data Mining. Applications and Theoretical Aspects"],"original-title":[],"link":[{"URL":"http:\/\/link.springer.com\/content\/pdf\/10.1007\/978-3-319-08976-8_4","content-type":"unspecified","content-version":"vor","intended-application":"similarity-checking"}],"deposited":{"date-parts":[[2025,5,3]],"date-time":"2025-05-03T21:10:11Z","timestamp":1746306611000},"score":1,"resource":{"primary":{"URL":"http:\/\/link.springer.com\/10.1007\/978-3-319-08976-8_4"}},"subtitle":[],"short-title":[],"issued":{"date-parts":[[2014]]},"ISBN":["9783319089751","9783319089768"],"references-count":31,"URL":"https:\/\/doi.org\/10.1007\/978-3-319-08976-8_4","relation":{},"ISSN":["0302-9743","1611-3349"],"issn-type":[{"type":"print","value":"0302-9743"},{"type":"electronic","value":"1611-3349"}],"subject":[],"published":{"date-parts":[[2014]]}}}