{"status":"ok","message-type":"work","message-version":"1.0.0","message":{"indexed":{"date-parts":[[2024,9,7]],"date-time":"2024-09-07T17:48:46Z","timestamp":1725731326757},"publisher-location":"New York, NY","reference-count":18,"publisher":"Springer New York","isbn-type":[{"type":"print","value":"9781461468790"},{"type":"electronic","value":"9781461468806"}],"license":[{"start":{"date-parts":[[2013,1,1]],"date-time":"2013-01-01T00:00:00Z","timestamp":1356998400000},"content-version":"tdm","delay-in-days":0,"URL":"http:\/\/www.springer.com\/tdm"}],"content-domain":{"domain":["link.springer.com"],"crossmark-restriction":false},"short-container-title":[],"published-print":{"date-parts":[[2013]]},"DOI":"10.1007\/978-1-4614-6880-6_30","type":"book-chapter","created":{"date-parts":[[2013,6,12]],"date-time":"2013-06-12T12:08:16Z","timestamp":1371038896000},"page":"345-355","update-policy":"http:\/\/dx.doi.org\/10.1007\/springer_crossmark_policy","source":"Crossref","is-referenced-by-count":0,"title":["Research on Indexing Page Collection Selection Method for Search Engine"],"prefix":"10.1007","author":[{"given":"Liyun","family":"Ru","sequence":"first","affiliation":[]},{"given":"Zhichao","family":"Li","sequence":"additional","affiliation":[]},{"given":"Yingying","family":"Wu","sequence":"additional","affiliation":[]},{"given":"Shaoping","family":"Ma","sequence":"additional","affiliation":[]}],"member":"297","published-online":{"date-parts":[[2013,5,2]]},"reference":[{"issue":"8","key":"30_CR00301","first-page":"22","volume":"17","author":"A. Agrawal","year":"2011","unstructured":"Agrawal, A., Husain, M., Tiwari, R.G., et al.: A novel technique for database selection and document selection. Int. J. Comput. Appl. 17(8), 22\u201326 (2011)","journal-title":"Int. J. Comput. Appl."},{"key":"30_CR00302","doi-asserted-by":"crossref","unstructured":"Lin, H., Zhang, Y., Davis, J.: Best document selection based on approximate utility optimization. In: Proceedings of the 34th International ACM SIGIR Conference on Research and Development in Information Retrieval, pp. 1215\u20131216. ACM, New York (2011)","DOI":"10.1145\/2009916.2010126"},{"key":"30_CR00303","doi-asserted-by":"crossref","unstructured":"Welch, M.J., Cho, J., Olston, C.: Search result diversity for informational queries. In: Proceedings of the 20th International Conference on World Wide Web, pp. 237\u2013246. ACM, New York (2011)","DOI":"10.1145\/1963405.1963441"},{"key":"30_CR00304","unstructured":"Broder, A.Z.: Identifying and filtering near-duplicate documents. In: Proceedings of the 11th Annual Symposium on Combinatorial Pattern Matching, 2000, pp. 1\u201310"},{"key":"30_CR00305","unstructured":"Broder, A.Z., Classman, S.C., Manasse, M.S.: Syntactic clustering of the Web. In: Proceedings of the 6th International Web Conference, 1997, pp. 11\u201320"},{"issue":"7","key":"30_CR00306","first-page":"16","volume":"19","author":"M. Mathew","year":"2011","unstructured":"Mathew, M., Shine, N.D., Lakshmi, T.R., et al.: A novel approach for near-duplicate detection of Web pages using TDW matrix. Int. J. Comput. Appl. 19(7), 16\u201321 (2011)","journal-title":"Int. J. Comput. Appl."},{"key":"30_CR00307","unstructured":"Dubes, R.C., Jain, A.K.: Algorithms for Clustering Data. Prentice Hall, New York (1988)"},{"key":"30_CR00308","unstructured":"Salloum, M., Tsotras, V.J., Srivastava, D., et al.: Selection and ordering of candidate documents for effective query answering in XML databases. In: Fifth International Workshop on Ranking in Databases, pp. 201\u2013207. ACM, New York (2011)"},{"key":"30_CR00309","first-page":"45","volume":"3","author":"Z. Ding","year":"2008","unstructured":"Ding, Z., Wu, B., Xin, Y.: Research of large-scale URL filter based on bloom filter. New Technol. Lib. Inform. Serv., 3, 45\u201350 (2008)","journal-title":"New Technol. Lib. Inform. Serv."},{"key":"30_CR003010","doi-asserted-by":"crossref","unstructured":"Charikar, M.S.: Similarity estimation techniques from rounding algorithms. In: Proceedings of the Thirty-Fourth Annual ACM Symposium on Theory of Computing, pp. 388\u2013397. ACM, New York (2002)","DOI":"10.1145\/509907.509965"},{"key":"30_CR003011","unstructured":"Page, L., Brin, S., Motwani, R., et al.: The PageRank Citation Ranking: Bringing Order to the Web. Stanford Digital Libraries, Stanford (1998)"},{"issue":"5","key":"30_CR003012","first-page":"3","volume":"25","author":"C. Wei","year":"2011","unstructured":"Wei, C., Chen, F., Xu, D., et al.: A framework for web page quality evaluation. J. Chin. Inform. Process. (AD of Publication, Beijing, China) 25(5), 3\u20138 (2011)","journal-title":"J. Chin. Inform. Process. (AD of Publication, Beijing, China)"},{"key":"30_CR003013","doi-asserted-by":"publisher","first-page":"516","DOI":"10.1007\/11562382_43","volume":"3689","author":"C Wang","year":"2005","unstructured":"Wang, C., Liu, Y., Zhang, M., et al.: Topic-independent web high-quality page selection based on K-means clustering. Lect. Notes Comput. Sci. 3689, 516\u2013521 (2005)","journal-title":"Lect. Notes Comput. Sci."},{"issue":"2","key":"30_CR003014","doi-asserted-by":"crossref","first-page":"50","DOI":"10.1145\/2207243.2207252","volume":"13","author":"N. Spirin","year":"2012","unstructured":"Spirin, N., Han, J.: Survey on web spam detection: principles and algorithms. ACM SIGKDD Explorations Newslett., 13(2), 50\u201364 (2012)","journal-title":"ACM SIGKDD Explorations Newslett."},{"key":"30_CR003015","first-page":"576","volume-title":"Proceedings of the 30th International Conference on Very Large Databases (VLDB)","author":"Z Gyngyi","year":"2004","unstructured":"Gyngyi, Z., Garcia-Molina, H., Pedersen, J.: Combating web spam with TrustRank. In: Proceedings of the 30th International Conference on Very Large Databases (VLDB), pp. 576\u2013587. ACM, New York (2004)"},{"key":"30_CR003016","doi-asserted-by":"crossref","unstructured":"Rivest, R.: MIT Laboratory for Computer Science and RSA Data Security Inc. The MD5 message-digest algorithm[J], (1992)","DOI":"10.17487\/rfc1321"},{"key":"30_CR003017","unstructured":"Singh, D.: Improving web search ranking through user behavior information. Int. J. Inform. Technol. Knowl. Manag (Serials Publications, New Delhi, India) 4(2), 635\u2013638 (2011)"},{"issue":"1","key":"30_CR003018","first-page":"3","volume":"3","author":"M. Chen","year":"2011","unstructured":"Chen, M., Yamada, S., Takama, Y.: Investigating user behavior in document similarity judgment for interactive clustering-based search engines. J. Emerg. Technol. Web Intell. (Academy Publisher, Oulu, Finland) 3(1), 3\u201310 (2011)","journal-title":"J. Emerg. Technol. Web Intell. (Academy Publisher, Oulu, Finland)"}],"container-title":["Springer Proceedings in Complexity","Semantic Web and Web Science"],"original-title":[],"language":"en","link":[{"URL":"http:\/\/link.springer.com\/content\/pdf\/10.1007\/978-1-4614-6880-6_30","content-type":"unspecified","content-version":"vor","intended-application":"similarity-checking"}],"deposited":{"date-parts":[[2019,5,21]],"date-time":"2019-05-21T08:39:09Z","timestamp":1558427949000},"score":1,"resource":{"primary":{"URL":"http:\/\/link.springer.com\/10.1007\/978-1-4614-6880-6_30"}},"subtitle":[],"short-title":[],"issued":{"date-parts":[[2013]]},"ISBN":["9781461468790","9781461468806"],"references-count":18,"URL":"https:\/\/doi.org\/10.1007\/978-1-4614-6880-6_30","relation":{},"ISSN":["2213-8684","2213-8692"],"issn-type":[{"type":"print","value":"2213-8684"},{"type":"electronic","value":"2213-8692"}],"subject":[],"published":{"date-parts":[[2013]]},"assertion":[{"value":"2 May 2013","order":1,"name":"first_online","label":"First Online","group":{"name":"ChapterHistory","label":"Chapter History"}}]}}