{"status":"ok","message-type":"work","message-version":"1.0.0","message":{"indexed":{"date-parts":[[2025,5,2]],"date-time":"2025-05-02T04:16:28Z","timestamp":1746159388801,"version":"3.40.4"},"publisher-location":"Berlin, Heidelberg","reference-count":16,"publisher":"Springer Berlin Heidelberg","isbn-type":[{"type":"print","value":"9783642543401"},{"type":"electronic","value":"9783642543418"}],"content-domain":{"domain":[],"crossmark-restriction":false},"short-container-title":[],"published-print":{"date-parts":[[2014]]},"DOI":"10.1007\/978-3-642-54341-8_42","type":"book-chapter","created":{"date-parts":[[2014,2,21]],"date-time":"2014-02-21T11:39:00Z","timestamp":1392982740000},"page":"404-413","source":"Crossref","is-referenced-by-count":0,"title":["Chinese Web Content Extraction Based on Na\u00efve Bayes Model"],"prefix":"10.1007","author":[{"given":"Wang","family":"Jinbo","sequence":"first","affiliation":[]},{"given":"Wang","family":"Lianzhi","sequence":"additional","affiliation":[]},{"given":"Gao","family":"Wanlin","sequence":"additional","affiliation":[]},{"given":"Yu","family":"Jian","sequence":"additional","affiliation":[]},{"given":"Cui","family":"Yuntao","sequence":"additional","affiliation":[]}],"member":"297","reference":[{"key":"42_CR1","unstructured":"Li, X.: Harmonious man-machine environment, vol.\u00a01, pp. 101\u2013107. Tsinghua University press, Beijing (January 1, 2008)"},{"issue":"4","key":"42_CR2","first-page":"32","volume":"39","author":"Q. Wu","year":"2011","unstructured":"Wu, Q., Chen, X., Tan, J.: Content Extraction Algorithm of HTML Pages Based on Optimized Weight. Journal of South China University of Technology (natural science edition)\u00a039(4), 32\u201337 (2011)","journal-title":"Journal of South China University of Technology (natural science edition)"},{"key":"42_CR3","unstructured":"Hsu, C.-H.: Initial Results on Wrapping Semi-structured Web Pages with Finite-State Transducers and Contextual Rules. In: Workshop on AI and Information Integration, in Conjunction with the 15\u2019th National Conference on Artificial Intelligence (AAAI 1998), Madison, Wisconsin (July 1998)"},{"key":"42_CR4","doi-asserted-by":"crossref","unstructured":"Bar-Yossef, Z., Rajagopalan, S.: Template detection via data mining and its applications. In: 11th World Wide Web Conference (WWW 2002), Hawaii, USA (2002)","DOI":"10.1145\/511519.511522"},{"issue":"5","key":"42_CR5","first-page":"1077","volume":"45","author":"J. Yang","year":"2008","unstructured":"Yang, J., Li, Z.: DOM-based information extraction for WEB-pages topic. DOM-based Information Extraction for WEB-pages Topic\u00a045(5), 1077\u20131080 (2008)","journal-title":"DOM-based Information Extraction for WEB-pages Topic"},{"key":"42_CR6","unstructured":"Deng, C., Yu, S.P., Wen, J.R., VIPS: A Vision-Based Page Segmentation [MSR-TR-2003-79] (2003)"},{"key":"42_CR7","unstructured":"Manning, C.D., Raghavan, P., Schutze, H.: Introduction to Information Retrieval, vol.\u00a01, pp. 175\u2013182. People\u2019s Posts and Telecommunications Press, Beijing (January 01, 2010)"},{"key":"42_CR8","unstructured":"Shoubin, D., Hua, Y.: The network information retrieval, vol.\u00a01, pp. 93\u201399. Xi\u2019an Electronic and Science University press, Xi\u2019an (April 01, 2010)"},{"key":"42_CR9","unstructured":"MacDonald, M.: WPF Programming book, vol.\u00a01, pp. 694\u2013698. Tsinghua University Press, Beijing (June 1, 2011)"},{"key":"42_CR10","unstructured":"HTML resolve [EB\/OL] , http:\/\/litertiger.blog.163.com\/blog\/static\/824538200693093340410\/"},{"key":"42_CR11","unstructured":"Borenstein, M.: Meta. Analysis: An Introduction. Science Press, Beijing (January 2013)"},{"key":"42_CR12","unstructured":"Zhao, Y., Xie, X., Xun, Y.: Application of Naive Bias classification. Electronic Production, 7 (2013)"},{"key":"42_CR13","doi-asserted-by":"crossref","unstructured":"Kupiec, J., Pedersen, J., Chen, F.: A Trainable Document Summarizer in Proceedings of the Eighth Annual International ACM SIGIR Conference on Research and Development in Information Retrieval, Seattle,Washington, pp. 68\u201373 (July 1995)","DOI":"10.1145\/215206.215333"},{"key":"42_CR14","unstructured":"Wu, Q., Chen, X., Tan, J.: Webpage content extraction algorithm based on optimized weight. Journal of South China University of Technology (Natural Science Edition)\u00a0(4) (2011)"},{"key":"42_CR15","unstructured":"Wang, C., Xu, J.: Webpage blocks and blocks of text extraction research based on the CURE algorithm. Microcomputer and its Application\u00a0(12) (2012)"},{"key":"42_CR16","doi-asserted-by":"crossref","unstructured":"Guo, Y., Tang, H., Song, L., Wang, Y., Ding, G.: In: Source: Advances in Web Technologies and Applications - Proceedings of the 12th Asia-Pacific Web Conference, APWeb 2010, pp. 314\u2013320 (2010)","DOI":"10.1109\/APWeb.2010.11"}],"container-title":["IFIP Advances in Information and Communication Technology","Computer and Computing Technologies in Agriculture VII"],"original-title":[],"link":[{"URL":"http:\/\/link.springer.com\/content\/pdf\/10.1007\/978-3-642-54341-8_42","content-type":"unspecified","content-version":"vor","intended-application":"similarity-checking"}],"deposited":{"date-parts":[[2025,5,1]],"date-time":"2025-05-01T22:15:07Z","timestamp":1746137707000},"score":1,"resource":{"primary":{"URL":"http:\/\/link.springer.com\/10.1007\/978-3-642-54341-8_42"}},"subtitle":[],"short-title":[],"issued":{"date-parts":[[2014]]},"ISBN":["9783642543401","9783642543418"],"references-count":16,"URL":"https:\/\/doi.org\/10.1007\/978-3-642-54341-8_42","relation":{},"ISSN":["1868-4238","1868-422X"],"issn-type":[{"type":"print","value":"1868-4238"},{"type":"electronic","value":"1868-422X"}],"subject":[],"published":{"date-parts":[[2014]]}}}