{"status":"ok","message-type":"work","message-version":"1.0.0","message":{"indexed":{"date-parts":[[2024,9,7]],"date-time":"2024-09-07T06:36:54Z","timestamp":1725691014059},"publisher-location":"Berlin, Heidelberg","reference-count":13,"publisher":"Springer Berlin Heidelberg","isbn-type":[{"type":"print","value":"9783642315756"},{"type":"electronic","value":"9783642315763"}],"content-domain":{"domain":[],"crossmark-restriction":false},"short-container-title":[],"published-print":{"date-parts":[[2012]]},"DOI":"10.1007\/978-3-642-31576-3_5","type":"book-chapter","created":{"date-parts":[[2012,7,6]],"date-time":"2012-07-06T15:24:28Z","timestamp":1341588268000},"page":"35-42","source":"Crossref","is-referenced-by-count":2,"title":["Research on New Algorithm of Topic-Oriented Crawler and Duplicated Web Pages Detection"],"prefix":"10.1007","author":[{"given":"Yong-Heng","family":"Zhang","sequence":"first","affiliation":[],"role":[{"role":"author","vocabulary":"crossref"}]},{"given":"Feng","family":"Zhang","sequence":"additional","affiliation":[],"role":[{"role":"author","vocabulary":"crossref"}]}],"member":"297","reference":[{"issue":"1","key":"5_CR1","doi-asserted-by":"crossref","first-page":"109","DOI":"10.1177\/0920203X07075083","volume":"21","author":"H.J. Yu","year":"2007","unstructured":"Yu, H.J., Liu, Y.Q., Zhang, M., Ru, L.Y., Ma, S.P.: Research in Search Engine User Behavior Based on Log Analysis. Journal of Chinese Information Processing\u00a021(1), 109\u2013114 (2007) (in Chinese with English abstract)","journal-title":"Journal of Chinese Information Processing"},{"key":"5_CR2","unstructured":"Bra, P.D., Houdben, G., Kornatzky, Y.: Information Retrieval in Distributed Hypertexts. In: Proc of the 4th RIAO Conference, New York, pp. 481\u2013 491 (1994)"},{"key":"5_CR3","unstructured":"Gant, G., Srinivasan, P.: Topic-Driven Crawlers: Machine Learningissues. In: Proc of ACM TOIT (2004)"},{"issue":"2","key":"5_CR4","first-page":"97","volume":"28","author":"N. Angkawattanawit","year":"2005","unstructured":"Angkawattanawit, N., Rungsawang, A.: Learnable Topic- Specific Web Crawler. Massive Information & Knowledge Engineering\u00a028(2), 97\u2013114 (2005)","journal-title":"Massive Information & Knowledge Engineering"},{"issue":"4","key":"5_CR5","doi-asserted-by":"publisher","first-page":"378","DOI":"10.1145\/1031114.1031117","volume":"4","author":"F. Menczer","year":"2004","unstructured":"Menczer, F., Pant, G., Srinivasan, P.: Topic Web Crawlers: Evaluating Adaptive Algorithm. ACM Transactions on Internet Technology\u00a04(4), 378\u2013419 (2004)","journal-title":"ACM Transactions on Internet Technology"},{"key":"5_CR6","doi-asserted-by":"publisher","first-page":"217","DOI":"10.1007\/s10115-007-0071-9","volume":"14","author":"S.Z. Ye","year":"2007","unstructured":"Ye, S.Z., Ji, R.W., Ma, W.Y.: A Systematic Study on Parameter Correlations in Large-Scale Duplicate Document Detection. Knowledge and Information Systems\u00a014, 217\u2013232 (2007)","journal-title":"Knowledge and Information Systems"},{"key":"5_CR7","unstructured":"Hosseini, S., Cox, J.R.: Optimal Solution of Off-line And On-Line Generalized Caching. Technical Report, WUCS-96-20, washington University at St. Louis (1996)"},{"key":"5_CR8","series-title":"Lecture Notes in Computer Science","doi-asserted-by":"publisher","first-page":"355","DOI":"10.1007\/3-540-45691-0_34","volume-title":"Evaluation of Cross-Language Information Retrieval Systems","author":"E.M. Voorhees","year":"2002","unstructured":"Voorhees, E.M.: The Philosophy of Information Retrieval Evaluation. In: Peters, C., Braschler, M., Gonzalo, J., Kluck, M. (eds.) CLEF 2001. LNCS, vol.\u00a02406, pp. 355\u2013370. Springer, Heidelberg (2002)"},{"key":"5_CR9","doi-asserted-by":"crossref","unstructured":"Scholer, F., Williams, H.E., Yiannis, J., Zobel, J.: Compression of Inverted Indexes for Fast Query Evaluation. In: Proceedings of the 25th Annual International ACM SIGIR Conference on Research and Development in Information Retrieval, pp. 222\u2013229 (2002)","DOI":"10.1145\/564376.564416"},{"key":"5_CR10","doi-asserted-by":"crossref","unstructured":"Cockburn, A., Jones, S.: Which way now? Analysing and easing inadequacies in WWW navigation. International Journal of Human-Computer Studies\u00a045, 105\u2013129","DOI":"10.1006\/ijhc.1996.0044"},{"issue":"1","key":"5_CR11","doi-asserted-by":"publisher","first-page":"6","DOI":"10.1145\/331403.331405","volume":"33","author":"C. Silverstein","year":"1998","unstructured":"Silverstein, C., Henzinger, M., Marais, H.: Analysis of A Very Large Web Search Engine Query Log. SIGIR Forum\u00a033(1), 6\u201312 (1998)","journal-title":"SIGIR Forum"},{"key":"5_CR12","doi-asserted-by":"crossref","unstructured":"Andrei, B.: A Taxonomy of Web Search. SIGIR Forum\u00a036(2) (2002)","DOI":"10.1145\/792550.792552"},{"key":"5_CR13","doi-asserted-by":"crossref","unstructured":"Voorhees, E.M., Lori, P., Buckland, E.: The Eleventh Text Retrieval Conference (TREC 2002), vol. 11. National Institute of Standards and Technology, NIST (2003)","DOI":"10.6028\/NIST.SP.500-251"}],"container-title":["Lecture Notes in Computer Science","Intelligent Computing Theories and Applications"],"original-title":[],"link":[{"URL":"http:\/\/link.springer.com\/content\/pdf\/10.1007\/978-3-642-31576-3_5.pdf","content-type":"unspecified","content-version":"vor","intended-application":"similarity-checking"}],"deposited":{"date-parts":[[2021,5,4]],"date-time":"2021-05-04T12:13:06Z","timestamp":1620130386000},"score":1,"resource":{"primary":{"URL":"http:\/\/link.springer.com\/10.1007\/978-3-642-31576-3_5"}},"subtitle":[],"short-title":[],"issued":{"date-parts":[[2012]]},"ISBN":["9783642315756","9783642315763"],"references-count":13,"URL":"https:\/\/doi.org\/10.1007\/978-3-642-31576-3_5","relation":{},"ISSN":["0302-9743","1611-3349"],"issn-type":[{"type":"print","value":"0302-9743"},{"type":"electronic","value":"1611-3349"}],"subject":[],"published":{"date-parts":[[2012]]}}}