{"status":"ok","message-type":"work","message-version":"1.0.0","message":{"indexed":{"date-parts":[[2025,3,25]],"date-time":"2025-03-25T15:50:57Z","timestamp":1742917857433,"version":"3.40.3"},"publisher-location":"London","reference-count":24,"publisher":"Springer London","isbn-type":[{"type":"print","value":"9781447123170"},{"type":"electronic","value":"9781447123187"}],"license":[{"start":{"date-parts":[[2011,1,1]],"date-time":"2011-01-01T00:00:00Z","timestamp":1293840000000},"content-version":"tdm","delay-in-days":0,"URL":"https:\/\/www.springernature.com\/gp\/researchers\/text-and-data-mining"},{"start":{"date-parts":[[2011,1,1]],"date-time":"2011-01-01T00:00:00Z","timestamp":1293840000000},"content-version":"vor","delay-in-days":0,"URL":"https:\/\/www.springernature.com\/gp\/researchers\/text-and-data-mining"}],"content-domain":{"domain":["link.springer.com"],"crossmark-restriction":false},"short-container-title":[],"published-print":{"date-parts":[[2011]]},"DOI":"10.1007\/978-1-4471-2318-7_20","type":"book-chapter","created":{"date-parts":[[2011,11,11]],"date-time":"2011-11-11T18:59:10Z","timestamp":1321037950000},"page":"255-268","update-policy":"https:\/\/doi.org\/10.1007\/springer_crossmark_policy","source":"Crossref","is-referenced-by-count":1,"title":["Web-Site Boundary Detection Using Incremental RandomWalk Clustering"],"prefix":"10.1007","author":[{"given":"Ayesh","family":"Alshukri","sequence":"first","affiliation":[]},{"given":"Frans","family":"Coenen","sequence":"additional","affiliation":[]},{"given":"Michele","family":"Zito","sequence":"additional","affiliation":[]}],"member":"297","published-online":{"date-parts":[[2011,10,14]]},"reference":[{"key":"20_CR1","doi-asserted-by":"crossref","unstructured":"S. Abiteboul, G. Cobena, J. Masan\u00e9s, and G. Sedrati. A First Experience in Archiving the French Web. In ECDL \u201902 Proceedings of the 6th European Conference on Research and Advanced Technology for Digital Libraries, volume 2458 of Lecture Notes in Computer Science, pages 1\u201315. Springer, 2002.","DOI":"10.1007\/3-540-45747-X_1"},{"key":"20_CR2","doi-asserted-by":"crossref","unstructured":"R. Albert, H. Jeong, and A-l. Barab\u00e1si. Diameter of the world wide web. Computing Research Repository, 1999.","DOI":"10.1038\/43601"},{"key":"20_CR3","unstructured":"D. Aldous and J. Fill. Reversible Markov chains and random walks on graphs. Monograph in preparation, 2002."},{"key":"20_CR4","doi-asserted-by":"crossref","unstructured":"R. Aleliunas, R.M. Karp, R.J. Lipton, L. Lovasz, and C. Rackoff. Random walks, universal traversal sequences, and the complexity of maze problems. 20th Annual Symp. on Foundations of Computer Science, pages 218\u2013223, 1979.","DOI":"10.1109\/SFCS.1979.34"},{"key":"20_CR5","doi-asserted-by":"crossref","unstructured":"A Alshukri, F. Coenen, and M. Zito. Web-Site Boundary Detection. In Proceedings of the 10th Industrial Conference on Data Mining, pages 529\u2013543, Berlin, Germany, 2010. Springer.","DOI":"10.1007\/978-3-642-14400-4_41"},{"key":"20_CR6","doi-asserted-by":"crossref","unstructured":"Albert-Laszloand Barabasi and Reka Albert. Emergence of scaling in random networks. Science, 1999.","DOI":"10.1126\/science.286.5439.509"},{"key":"20_CR7","doi-asserted-by":"crossref","unstructured":"K. Bharat, B-W. Chang, M. Henzinger, and M. Ruhl. Who links to whom: mining linkage between Web sites. In Proceedings 2001 IEEE International Conference on Data Mining, pages 51\u201358, Washington, DC, USA, 2001. IEEE Computer Society.","DOI":"10.1109\/ICDM.2001.989500"},{"issue":"1-6","key":"20_CR8","doi-asserted-by":"publisher","first-page":"309","DOI":"10.1016\/S1389-1286(00)00083-9","volume":"33","author":"A. Z Broder","year":"2000","unstructured":"A. Z Broder. Graph structure in the Web. Computer Networks, 33(1-6):309\u2013320, June 2000.","journal-title":"Computer Networks"},{"key":"20_CR9","doi-asserted-by":"crossref","unstructured":"A. Z Broder, M Najork, and J. LWiener. Efficient URL caching for world wide web crawling. In WWW\u201903 Proceedings of the 12th international conference on World Wide Web, pages 679\u2013689, Budapest, Hungary., 2003. ACM.","DOI":"10.1145\/775152.775247"},{"key":"20_CR10","doi-asserted-by":"crossref","unstructured":"P. Dmitriev. As we may perceive: finding the boundaries of compound documents on the web. In WWW\u201908 Proceeding of the 17th international conference on World Wide Web, pages 1029\u20131030, Beijing, China, 2008. ACM.","DOI":"10.1145\/1367497.1367640"},{"key":"20_CR11","volume-title":"Data Mining: Introductory and Advanced Topics","author":"M. H. Dunham","year":"2002","unstructured":"M. H. Dunham. Data Mining: Introductory and Advanced Topics. Prentice Hall PTR Upper Saddle River, NJ, USA, 2002."},{"key":"20_CR12","unstructured":"W. Feller. Introduction to probability theory and its applications. WSS, vol. 1, 1968."},{"key":"20_CR13","unstructured":"J. Han and M. Kamber. Data Mining: Concepts and Techniques. Morgan Kaufmann, 2001."},{"key":"20_CR14","doi-asserted-by":"crossref","unstructured":"M. Henzinger. Finding near-duplicate web pages: a large-scale evaluation of algorithms. In Proceedings of the 29th annual international ACM SIGIR conference on Research and development in information retrieval, pages 284\u2013291. ACM, 2006.","DOI":"10.1145\/1148170.1148222"},{"issue":"11-16","key":"20_CR15","doi-asserted-by":"publisher","first-page":"1481","DOI":"10.1016\/S1389-1286(99)00040-7","volume":"31","author":"R. Kumar","year":"1999","unstructured":"R. Kumar. Trawling the Web for emerging cyber-communities. Computer Networks, 31(11-16):1481\u20131493, May 1999.","journal-title":"Computer Networks"},{"key":"20_CR16","doi-asserted-by":"crossref","unstructured":"R. Kumar, P. Raghavan, S. Rajagopalan, D. Sivakumar, A. Tomkins, and E. Upfal. Stochastic models for the Web graph. In Proceedings 41st Annual Symposium on Foundations of Computer Science, pages 57\u201365, Washington, DC, USA, 2000. IEEE Computer Society.","DOI":"10.1109\/SFCS.2000.892065"},{"key":"20_CR17","volume-title":"Web Data Mining: Exploring Hyperlinks, Contents, and Usage Data","author":"B. Liu","year":"2007","unstructured":"B. Liu. Web Data Mining: Exploring Hyperlinks, Contents, and Usage Data. Springer, Springer-Verlag New York, Inc., 2007."},{"key":"20_CR18","first-page":"1","volume":"2","author":"L. Lov\u00e1sz","year":"1994","unstructured":"L. Lov\u00e1sz. Random walks on graphs: A survey. YaleU\/DCS\/TR-1029, 2:1\u201346, 1994.","journal-title":"YaleU\/DCS\/TR-1029"},{"issue":"10","key":"20_CR19","doi-asserted-by":"publisher","first-page":"1027","DOI":"10.1016\/S0167-8655(99)00069-0","volume":"20","author":"J.M Pe\u00f1a","year":"1999","unstructured":"J.M Pe\u00f1a, J.A Lozano, and P Larra\u00f1aga. An empirical comparison of four initialization methods for the K-Means algorithm. Pattern Recognition Letters, 20(10):1027\u20131040, October 1999.","journal-title":"Pattern Recognition Letters"},{"issue":"4","key":"20_CR20","doi-asserted-by":"publisher","first-page":"43","DOI":"10.1109\/MCSE.2004.24","volume":"6","author":"J. Pokorn","year":"2004","unstructured":"J. Pokorn. Web Searching and Information Retrieval. Computing in Science and Engineering, 6(4):43\u201348, 2004.","journal-title":"Computing in Science and Engineering"},{"key":"20_CR21","doi-asserted-by":"crossref","unstructured":"P. Senellart. Identifying Websites with Flow Simulation. In David Lowe and Martin Gaedke, editors, ICWE, volume 3579 of Lecture Notes in Computer Science, Orsay, France., 2005. Gemo, INRIA Futurs., Springer.","DOI":"10.1007\/11531371_18"},{"key":"20_CR22","unstructured":"P. N. Tan, M. Steinbach, and V. Kumar. Introduction to Data Mining. Pearson International Edition, 2006."},{"key":"20_CR23","unstructured":"B. Meck Thiesson, C. Chickering, and D. Heckerman. Learning mixtures of Bayesian networks. Technical report, Microsoft Research Technical Report TR-97-30, Redmond, WA, 1997."},{"key":"20_CR24","unstructured":"I. H. Witten and E. Frank. Data Mining: practical machine learning tools and techniques. Morgan Kaufman, 2005."}],"container-title":["Research and Development in Intelligent Systems XXVIII"],"original-title":[],"language":"en","link":[{"URL":"https:\/\/link.springer.com\/content\/pdf\/10.1007\/978-1-4471-2318-7_20","content-type":"unspecified","content-version":"vor","intended-application":"similarity-checking"}],"deposited":{"date-parts":[[2025,3,14]],"date-time":"2025-03-14T00:35:34Z","timestamp":1741912534000},"score":1,"resource":{"primary":{"URL":"https:\/\/link.springer.com\/10.1007\/978-1-4471-2318-7_20"}},"subtitle":[],"short-title":[],"issued":{"date-parts":[[2011]]},"ISBN":["9781447123170","9781447123187"],"references-count":24,"URL":"https:\/\/doi.org\/10.1007\/978-1-4471-2318-7_20","relation":{},"subject":[],"published":{"date-parts":[[2011]]},"assertion":[{"value":"14 October 2011","order":1,"name":"first_online","label":"First Online","group":{"name":"ChapterHistory","label":"Chapter History"}}]}}