{"status":"ok","message-type":"work","message-version":"1.0.0","message":{"indexed":{"date-parts":[[2024,9,5]],"date-time":"2024-09-05T00:17:36Z","timestamp":1725495456199},"publisher-location":"Berlin, Heidelberg","reference-count":20,"publisher":"Springer Berlin Heidelberg","isbn-type":[{"type":"print","value":"9783540001300"},{"type":"electronic","value":"9783540361282"}],"content-domain":{"domain":[],"crossmark-restriction":false},"short-container-title":[],"published-print":{"date-parts":[[2002]]},"DOI":"10.1007\/3-540-36128-6_25","type":"book-chapter","created":{"date-parts":[[2007,11,13]],"date-time":"2007-11-13T22:20:41Z","timestamp":1194992441000},"page":"420-434","source":"Crossref","is-referenced-by-count":3,"title":["Mining HTML Pages to Support Document Sharing in a Cooperative System"],"prefix":"10.1007","author":[{"given":"Donato","family":"Malerba","sequence":"first","affiliation":[]},{"given":"Floriana","family":"Esposito","sequence":"additional","affiliation":[]},{"given":"Michelangelo","family":"Ceci","sequence":"additional","affiliation":[]}],"member":"297","published-online":{"date-parts":[[2002,11,8]]},"reference":[{"issue":"3","key":"25_CR1","doi-asserted-by":"publisher","first-page":"233","DOI":"10.1145\/183422.183423","volume":"12","author":"C. Apt\u00e9","year":"1994","unstructured":"C. Apt\u00e9, F. Damerau, & S.M. Weiss (1994). Automated learning of decision rules for text categorization. ACM Transactions on Information Systems, 12(3), 233\u2013251.","journal-title":"ACM Transactions on Information Systems"},{"unstructured":"G. Attardi, S. DMarco, D. Salvi, & F. Sebastiani (1998). Categorisation by context. Online Proceedings of the 1\n                           \n                    st\n                  \n                           International Workshop on Innovative Internet Information Systems, \n                    \n                      http:\/\/www.idt.ntnu.no\/~monica\/iii-98\/proceedinas on line.html","key":"25_CR2"},{"unstructured":"R. Baumgartner, S. Flesca, G. Gottlob (2001). Supervised Wrapper Generation with Lixto. Proc. of the 27\n                           \n                    th\n                  \n                           Int. Conf. on Very Large Data Bases, 715\u2013716.","key":"25_CR3"},{"key":"25_CR4","doi-asserted-by":"crossref","first-page":"37","DOI":"10.3233\/ISU-1984-41-204","volume":"4","author":"C. Cleverdon","year":"1984","unstructured":"C. Cleverdon (1984). Optimizing convenient online access to bibliographic databases. Information Services and Use, 4, 37\u201347.","journal-title":"Information Services and Use"},{"key":"25_CR5","volume-title":"Proc. of the 6th Int. Conf. on Document Analysis and Recognition ICDAR\u201901","author":"M. Diligenti","year":"2001","unstructured":"M. Diligenti, M. Gori, M. Maggini & F. Scarselli (2001). Classification of HTML Documents by Hidden Tree-Markov Models. Proc. of the 6\n                           \n                    th\n                  \n                           Int. Conf. on Document Analysis and Recognition ICDAR\u201901, IEEE Computer Society Press, Los Vaqueros, CA."},{"key":"25_CR6","series-title":"Lecture Notes in Artificial Intelligence","doi-asserted-by":"publisher","first-page":"190","DOI":"10.1007\/3-540-46238-4_17","volume-title":"AI*IA 99: Advances in Artificial Intelligence","author":"F. Esposito","year":"2000","unstructured":"F. Esposito, D. Malerba, L. Di Pace, & P. Leo (2000). A Machine Learning Approach to Web Mining, In E. Lamma & P. Mello (Eds.), AI*IA 99: Advances in Artificial Intelligence, Lecture Notes in Artificial Intelligence, Vol. 1792, 190\u2013201, Berlin: Springer."},{"unstructured":"T. Joachims (1997). A probabilistic analysis of the Rocchio algorithm with TFIDF for text categorization. Proc. of the 14\n                           \n                    th\n                  \n                           Int. Conf. on Machine Learning, 143\u2013151.","key":"25_CR7"},{"unstructured":"D. Koller & M. Sahami (1996). Toward optimal feature selection. Proc. of the 13\n                           \n                    th\n                  \n                           Int. Conf. on Machine Learning ICML\u201996, 284\u2013292.","key":"25_CR8"},{"doi-asserted-by":"crossref","unstructured":"D.D. Lewis, R.E. Schapire, J.P. Callan, & R. Papka (1996). Training algorithms for linear text classifiers. In H.-P. Frei, D. Harman, P. Schauble, & R. Wilkinson, (ed.), Proc. of the 19\n                           \n                    th\n                  \n                           Annual Int. ACM SIGIR Conf. on Research and Development in Information Retrieval, 298\u2013306.","key":"25_CR9","DOI":"10.1145\/243199.243277"},{"issue":"2","key":"25_CR10","doi-asserted-by":"publisher","first-page":"159","DOI":"10.1147\/rd.22.0159","volume":"2","author":"H. Luhn","year":"1958","unstructured":"H. Luhn (1958). The automatic creation of literature abstracts. IBM Journal of Research and Development, 2(2): 159\u2013165.","journal-title":"IBM Journal of Research and Development"},{"key":"25_CR11","first-page":"59","volume":"92","author":"B. Masand","year":"1992","unstructured":"B. Masand, G. Linoff, & D. Waltz (1992). Classifying new stories using memory based reasoning. Proc. SIGIR\u201992, 59\u201365.","journal-title":"Proc. SIGIR\u2019"},{"key":"25_CR12","series-title":"Lecture Notes in Artificial Intelligence","doi-asserted-by":"publisher","first-page":"95","DOI":"10.1007\/BFb0026677","volume-title":"Machine Learning: ECML-98","author":"D. Mladenic","year":"1998","unstructured":"D. Mladenic (1998). Feature subset selection in text-learning. In C. N\u00e9dellec, & C. Rouveirol (Eds.), Machine Learning: ECML-98, Lecture Notes in Artificial Intelligence, 1398, 95\u2013100, Berlin: Springer."},{"key":"25_CR13","doi-asserted-by":"publisher","first-page":"1","DOI":"10.1007\/BF00871744","volume":"2","author":"S.K. Murthy","year":"1994","unstructured":"S.K. Murthy, S. Kasif & S. Salzberg (1994). A system for induction of oblique decision trees. Journal of Artificial Intelligence Research, 2, 1\u201332.","journal-title":"Journal of Artificial Intelligence Research"},{"key":"25_CR14","doi-asserted-by":"publisher","first-page":"313","DOI":"10.1023\/A:1007369909943","volume":"23","author":"M. Pazzani","year":"1997","unstructured":"M. Pazzani & D. Billsus (1997). Learning and revising user profiles: The identification of interesting web sites. Machine Learning Journal, 23, 313\u2013331.","journal-title":"Machine Learning Journal"},{"issue":"3","key":"25_CR15","doi-asserted-by":"crossref","first-page":"130","DOI":"10.1108\/eb046814","volume":"14","author":"M. F. Porter","year":"1980","unstructured":"M. F. Porter (1980). An algorithm for suffix stripping. Program, 14(3): 130\u2013137.","journal-title":"Program"},{"key":"25_CR16","volume-title":"Automatic text processing: The transformation, analysis, and retrieval of information by computer","author":"G. Salton","year":"1989","unstructured":"G. Salton (1989). Automatic text processing: The transformation, analysis, and retrieval of information by computer. Reading, MA: Addison-Wesley."},{"issue":"5","key":"25_CR17","doi-asserted-by":"publisher","first-page":"513","DOI":"10.1016\/0306-4573(88)90021-0","volume":"24","author":"G. Salton","year":"1988","unstructured":"G. Salton & C. Buckley (1988). Term weighting approaches in automatic text retrieval. Information Processing and Management, 24(5), 513\u2013523.","journal-title":"Information Processing and Management"},{"issue":"4","key":"25_CR18","doi-asserted-by":"publisher","first-page":"491","DOI":"10.1016\/0306-4573(95)00011-5","volume":"31","author":"W.M. Shaw Jr","year":"1995","unstructured":"W.M. Shaw Jr (1995). Term-relevance computations and perfect retrieval performance. Information Processing & Management, 31(4), 491\u2013498.","journal-title":"Information Processing & Management"},{"unstructured":"Y. Yang & J.O. Pedersen (1997). A Comparative Study on Feature Selection in Text Categorization. Proc. of the 14\n                           \n                    th\n                  \n                           Int. Conf. on Machine Learning ICML-97, 412\u2013420.","key":"25_CR19"},{"key":"25_CR20","volume-title":"Human Behavior and the Principle of Least Effort","author":"G.K. Zipf","year":"1949","unstructured":"G.K. Zipf (1949). Human Behavior and the Principle of Least Effort. Reading, MA: Addison-Wesley."}],"container-title":["Lecture Notes in Computer Science","XML-Based Data Management and Multimedia Engineering \u2014 EDBT 2002 Workshops"],"original-title":[],"link":[{"URL":"http:\/\/link.springer.com\/content\/pdf\/10.1007\/3-540-36128-6_25","content-type":"unspecified","content-version":"vor","intended-application":"similarity-checking"}],"deposited":{"date-parts":[[2019,2,25]],"date-time":"2019-02-25T07:20:05Z","timestamp":1551079205000},"score":1,"resource":{"primary":{"URL":"http:\/\/link.springer.com\/10.1007\/3-540-36128-6_25"}},"subtitle":[],"short-title":[],"issued":{"date-parts":[[2002]]},"ISBN":["9783540001300","9783540361282"],"references-count":20,"URL":"https:\/\/doi.org\/10.1007\/3-540-36128-6_25","relation":{},"ISSN":["0302-9743"],"issn-type":[{"type":"print","value":"0302-9743"}],"subject":[],"published":{"date-parts":[[2002]]}}}