{"status":"ok","message-type":"work","message-version":"1.0.0","message":{"indexed":{"date-parts":[[2025,5,30]],"date-time":"2025-05-30T14:47:10Z","timestamp":1748616430020,"version":"3.33.0"},"publisher-location":"Berlin, Heidelberg","reference-count":83,"publisher":"Springer Berlin Heidelberg","isbn-type":[{"type":"print","value":"9783540720782"}],"content-domain":{"domain":[],"crossmark-restriction":false},"short-container-title":[],"DOI":"10.1007\/978-3-540-72079-9_7","type":"book-chapter","created":{"date-parts":[[2007,5,14]],"date-time":"2007-05-14T09:40:58Z","timestamp":1179135658000},"page":"231-262","source":"Crossref","is-referenced-by-count":19,"title":["Adaptive Focused Crawling"],"prefix":"10.1007","author":[{"given":"Alessandro","family":"Micarelli","sequence":"first","affiliation":[]},{"given":"Fabio","family":"Gasparetti","sequence":"additional","affiliation":[]}],"member":"297","reference":[{"key":"7_CR1","doi-asserted-by":"crossref","unstructured":"Aggarwal, C.C., Al-Garawi, F., Yu, P.S.: Intelligent Crawling on the World Wide Web with Arbitrary Predicates. In: Proceedings of the 10th World Wide Web Conference. WWW10, Hong Kong, pp. 96\u2013105 (2001), http:\/\/www10.org\/cdrom\/papers\/110\/","DOI":"10.1145\/371920.371955"},{"issue":"1","key":"7_CR2","doi-asserted-by":"publisher","first-page":"2","DOI":"10.1145\/383034.383035","volume":"1","author":"A. Arasu","year":"2001","unstructured":"Arasu, A., Cho, J., Garcia-Molina, H., Paepcke, A., Raghavan, S.: Searching the Web. ACM Transactions on Internet Technology (TOIT)\u00a01(1), 2\u201343 (2001)","journal-title":"ACM Transactions on Internet Technology (TOIT)"},{"key":"7_CR3","unstructured":"Bailey, P., Craswell, N., Hawking, D.: Dark matter on the Web. In: Poster Proceedings of the 9th World Wide Web Conference, WWW9, Amsterdam, Netherlands (2000), http:\/\/www9.org\/final-posters\/poster30.html"},{"issue":"6","key":"7_CR4","doi-asserted-by":"publisher","first-page":"853","DOI":"10.1016\/S0306-4573(02)00084-5","volume":"39","author":"P. Bailey","year":"2003","unstructured":"Bailey, P., Craswell, N., Hawking, D.: Engineering a multi-purpose test collection for web retrieval experiments. Information Processing and Management\u00a039(6), 853\u2013871 (2003)","journal-title":"Information Processing and Management"},{"issue":"1-2","key":"7_CR5","doi-asserted-by":"publisher","first-page":"71","DOI":"10.1023\/A:1008205606173","volume":"8","author":"M.. Balabanovi\u0107","year":"1998","unstructured":"Balabanovi\u0107, M.: Exploring versus exploiting when learning user models for text recommendation. User Modeling and User-Adapted Interaction\u00a08(1-2), 71\u2013102 (1998)","journal-title":"User Modeling and User-Adapted Interaction"},{"issue":"3","key":"7_CR6","doi-asserted-by":"publisher","first-page":"66","DOI":"10.1145\/245108.245124","volume":"40","author":"M. Balabanovi\u0107","year":"1997","unstructured":"Balabanovi\u0107, M., Shoham, Y.: Fab: content-based, collaborative recommendation. Communications of the ACM\u00a040(3), 66\u201372 (1997), doi:10.1145\/245108.245124","journal-title":"Communications of the ACM"},{"key":"7_CR7","doi-asserted-by":"publisher","first-page":"321","DOI":"10.1145\/1008992.1009048","volume-title":"SIGIR \u201904: Proceedings of the 27th annual international conference on Research and development in information","author":"S.M. Beitzel","year":"2004","unstructured":"Beitzel, S.M., Jensen, E.C., Chowdhury, A., Grossman, D., Frieder, O.: Hourly analysis of a very large topically categorized web query log. In: SIGIR \u201904: Proceedings of the 27th annual international conference on Research and development in information, pp. 321\u2013328. ACM Press, New York (2004)"},{"key":"7_CR8","doi-asserted-by":"crossref","unstructured":"Bergman, M.K.: The Deep Web: Surfacing Hidden Value. The Journal of Electronic Publishing\u00a07(1) (2001)","DOI":"10.3998\/3336451.0007.104"},{"key":"7_CR9","series-title":"Lecture Notes in Computer Science","doi-asserted-by":"crossref","first-page":"91","DOI":"10.1007\/3-540-45747-X_7","volume-title":"Research and Advanced Technology for Digital Libraries","author":"D. Bergmark","year":"2002","unstructured":"Bergmark, D., Lagoze, C., Sbityakov, A.: Focused Crawls, Tunneling, and Digital Libraries. In: Agosti, M., Thanos, C. (eds.) ECDL 2002. LNCS, vol.\u00a02458, pp. 91\u2013106. Springer, Heidelberg (2002), http:\/\/citeseer.ist.psu.edu\/bergmark02focused.html"},{"issue":"5","key":"7_CR10","doi-asserted-by":"publisher","first-page":"349","DOI":"10.1007\/s005300050098","volume":"6","author":"K. Bharat","year":"1998","unstructured":"Bharat, K., Kamba, T., Albers, M.: Personalized, interactive news on the Web. Multimedia Systems\u00a06(5), 349\u2013358 (1998), doi:10.1007\/s005300050098","journal-title":"Multimedia Systems"},{"issue":"8","key":"7_CR11","doi-asserted-by":"publisher","first-page":"711","DOI":"10.1002\/spe.587","volume":"34","author":"P. Boldi","year":"2004","unstructured":"Boldi, P., Codenotti, B., Santini, M., Vigna, S.: UbiCrawler: a scalable fully distributed web crawler. Software, Practice and Experience\u00a034(8), 711\u2013726 (2004), doi:10.1002\/spe.587","journal-title":"Software, Practice and Experience"},{"key":"7_CR12","doi-asserted-by":"publisher","first-page":"39","DOI":"10.1038\/35017500","volume":"406","author":"E. Bonabeau","year":"2000","unstructured":"Bonabeau, E., Dorigo, M., Theraulaz, G.: Inspiration for optimization from social insect behavior. Nature\u00a0406, 39\u201342 (2000)","journal-title":"Nature"},{"key":"7_CR13","unstructured":"de Bra, P., Houben, G.-J., Kornatzky, Y.: Information Retrieval in Distributed Hypertexts. In: Proceedings of the 4th RIAO, Intelligent Multimedia, Information Retrieval Systems and Management, New York, NY, USA, pp. 481\u2013491 (1994), http:\/\/citeseer.ist.psu.edu\/debra94information.html"},{"key":"7_CR14","unstructured":"de Bra, P., Post, R.: Searching for arbitrary information in the WWW: The fish-search for Mosaic. In: Proceedings of the 2nd World Wide Web Conference. WWW2, Chicago, USA (1994), http:\/\/citeseer.ist.psu.edu\/172936.html"},{"key":"7_CR15","doi-asserted-by":"publisher","first-page":"107","DOI":"10.1016\/S0169-7552(98)00110-X","volume":"30","author":"S. Brin","year":"1998","unstructured":"Brin, S., Page, L.: The Anatomy of a Large-Scale Hypertextual Web Search Engine. Computer Networks and ISDN Systems\u00a030, 107\u2013117 (1998)","journal-title":"Computer Networks and ISDN Systems"},{"key":"7_CR16","doi-asserted-by":"crossref","unstructured":"Broder, A., Kumar, R., Maghoul, F., Raghavan, P., Rajagopalan, S., Stata, R., Tomkins, A., Wiener, J.: Graph structure in the web. In: Proceedings of the 9th World Wide Web Conference. WWW9, Amsterdam, Netherlands, pp. 309\u2013320 (2000), http:\/\/www9.org\/w9cdrom\/160\/160.html","DOI":"10.1016\/S1389-1286(00)00083-9"},{"issue":"4es","key":"7_CR17","doi-asserted-by":"publisher","first-page":"17","DOI":"10.1145\/345966.346007","volume":"31","author":"S. Chakrabarti","year":"1999","unstructured":"Chakrabarti, S.: Recent results in automatic Web resource discovery. ACM Computing Surveys\u00a031(4es), 17 (1999), doi:10.1145\/345966.346007","journal-title":"ACM Computing Surveys"},{"key":"7_CR18","doi-asserted-by":"publisher","first-page":"148","DOI":"10.1145\/511446.511466","volume-title":"Proceedings of the 11th international conference on World Wide Web","author":"S. Chakrabarti","year":"2002","unstructured":"Chakrabarti, S., Punera, K., Subramanyam, M.: Accelerated focused crawling through online relevance feedback. In: Proceedings of the 11th international conference on World Wide Web. WWW \u201902, pp. 148\u2013159. ACM Press, New York (2002), http:\/\/www2002.org\/CDROM\/refereed\/336\/"},{"key":"7_CR19","first-page":"375","volume-title":"Proceedings of the 25th International Conference on Very Large Data Bases","author":"S. Chakrabarti","year":"1999","unstructured":"Chakrabarti, S., van den Berg, M., Dom, B.: Distributed hypertext resource discovery through examples. In: Proceedings of the 25th International Conference on Very Large Data Bases. VLDB \u201999, pp. 375\u2013386. Morgan Kaufmann Publishers Inc, San Francisco (1999), http:\/\/www.vldb.org\/conf\/1999\/P37.pdf"},{"key":"7_CR20","doi-asserted-by":"crossref","unstructured":"Chakrabarti, S., van den Berg, M., Dom, B.: Focused Crawling: A New Approach to Topic-Specific Web Resource Discovery. In: Proceedings of the 8th World Wide Web Conference. WWW8, Toronto, Canada, pp. 1623\u20131640 (1999), http:\/\/www8.org\/w8-papers\/5a-search-query\/crawling\/index.html","DOI":"10.1016\/S1389-1286(99)00052-3"},{"issue":"7","key":"7_CR21","doi-asserted-by":"publisher","first-page":"604","DOI":"10.1002\/(SICI)1097-4571(19980515)49:7<604::AID-ASI3>3.0.CO;2-T","volume":"49","author":"H. Chen","year":"1998","unstructured":"Chen, H., Chung, Y.-M., Ramsey, M., Yang, C.C.: A smart itsy bitsy spider for the web. Journal of the American Society for Information Science\u00a049(7), 604\u2013618 (1998)","journal-title":"Journal of the American Society for Information Science"},{"key":"7_CR22","doi-asserted-by":"publisher","first-page":"490","DOI":"10.1145\/365024.365325","volume-title":"Proceedings of the ACM Conference on Human Factors in Computing Systems (CHI2001)","author":"E.H. Chi","year":"2001","unstructured":"Chi, E.H., Pirolli, P., Chen, K., Pitkow, J.: Using information scent to model user information needs and actions on the Web. In: Proceedings of the ACM Conference on Human Factors in Computing Systems (CHI2001), Seattle, WA, USA, pp. 490\u2013497. ACM Press, New York (2001)"},{"key":"7_CR23","first-page":"200","volume-title":"VLDB \u201900: Proceedings of the 26th International Conference on Very Large Data Bases","author":"J. Cho","year":"2000","unstructured":"Cho, J., Garcia-Molina, H.: The evolution of the web and implications for an incremental crawler. In: VLDB \u201900: Proceedings of the 26th International Conference on Very Large Data Bases, pp. 200\u2013209. Morgan Kaufmann, San Francisco (2000)"},{"key":"7_CR24","doi-asserted-by":"publisher","first-page":"117","DOI":"10.1145\/342009.335391","volume-title":"SIGMOD \u201900: Proceedings of the 2000 ACM SIGMOD international conference on Management of data","author":"J. Cho","year":"2000","unstructured":"Cho, J., Garcia-Molina, H.: Synchronizing a database to improve freshness. In: SIGMOD \u201900: Proceedings of the 2000 ACM SIGMOD international conference on Management of data, Dallas, Texas, United States, pp. 117\u2013128. ACM Press, New York (2000), doi:10.1145\/342009.335391"},{"key":"7_CR25","doi-asserted-by":"publisher","first-page":"124","DOI":"10.1145\/511446.511464","volume-title":"WWW \u201902: Proceedings of the 11th international conference on World Wide Web","author":"J. Cho","year":"2002","unstructured":"Cho, J., Garcia-Molina, H.: Parallel crawlers. In: WWW \u201902: Proceedings of the 11th international conference on World Wide Web, Honolulu, Hawaii, USA, pp. 124\u2013135. ACM Press, New York (2002), http:\/\/www2002.org\/CDROM\/refereed\/108\/index.html , doi:10.1145\/511446.511464"},{"issue":"3","key":"7_CR26","doi-asserted-by":"publisher","first-page":"256","DOI":"10.1145\/857166.857170","volume":"3","author":"J. Cho","year":"2003","unstructured":"Cho, J., Garcia-Molina, H.: Estimating frequency of change. ACM Transactions on Internet Technology (TOIT)\u00a03(3), 256\u2013290 (2003)","journal-title":"ACM Transactions on Internet Technology (TOIT)"},{"issue":"1\u20137","key":"7_CR27","doi-asserted-by":"publisher","first-page":"161","DOI":"10.1016\/S0169-7552(98)00108-1","volume":"30","author":"J. Cho","year":"1998","unstructured":"Cho, J., Garcia-Molina, H., Page, L.: Efficient Crawling Through URL Ordering. Computer Networks and ISDN Systems\u00a030(1\u20137), 161\u2013172 (1998)","journal-title":"Computer Networks and ISDN Systems"},{"key":"7_CR28","doi-asserted-by":"publisher","first-page":"34","DOI":"10.1145\/584792.584802","volume-title":"CIKM \u201902: Proceedings of the eleventh international conference on Information and knowledge management","author":"C. Chung","year":"2002","unstructured":"Chung, C., Clarke, C.L.A.: Topic-oriented collaborative crawling. In: CIKM \u201902: Proceedings of the eleventh international conference on Information and knowledge management, McLean, Virginia, USA, pp. 34\u201342. ACM Press, New York (2002), doi:10.1145\/584792.584802"},{"key":"7_CR29","doi-asserted-by":"publisher","first-page":"272","DOI":"10.1145\/345508.345597","volume-title":"SIGIR \u201900: Proceedings of the 23rd annual international ACM SIGIR conference on Research and development in information retrieval","author":"B.D. Davison","year":"2000","unstructured":"Davison, B.D.: Topical locality in the Web. In: SIGIR \u201900: Proceedings of the 23rd annual international ACM SIGIR conference on Research and development in information retrieval, Athens, Greece, pp. 272\u2013279. ACM Press, New York (2000), doi:10.1145\/345508.345597"},{"key":"7_CR30","doi-asserted-by":"publisher","first-page":"9","DOI":"10.1145\/1031453.1031457","volume-title":"WIDM \u201904: Proceedings of the 6th annual ACM international workshop on Web information and data management","author":"A. Carvalho Fontes de","year":"2004","unstructured":"de Carvalho Fontes, A., Silva, F.S.: SmartCrawl: a new strategy for the exploration of the hidden web. In: WIDM \u201904: Proceedings of the 6th annual ACM international workshop on Web information and data management, Washington DC, USA, pp. 9\u201315. ACM Press, New York (2004), doi:10.1145\/1031453.1031457"},{"key":"7_CR31","doi-asserted-by":"publisher","first-page":"208","DOI":"10.1145\/900051.900097","volume-title":"HYPERTEXT \u201903: Proceedings of the fourteenth ACM conference on Hypertext and hypermedia","author":"J.-Y. Delort","year":"2003","unstructured":"Delort, J.-Y., Bouchon-Meunier, B., Rifqi, M.: Enhanced web document summarization using hyperlinks. In: HYPERTEXT \u201903: Proceedings of the fourteenth ACM conference on Hypertext and hypermedia, Nottingham, UK, pp. 208\u2013215. ACM Press, New York (2003), doi:10.1145\/900051.900097"},{"key":"7_CR32","first-page":"527","volume-title":"VLDB \u201900: Proceedings of the 26th International Conference on Very Large Data Bases","author":"M. Diligenti","year":"2000","unstructured":"Diligenti, M., Coetzee, F., Lawrence, S., Giles, C.L., Gori, M.: Focused Crawling Using Context Graphs. In: VLDB \u201900: Proceedings of the 26th International Conference on Very Large Data Bases, pp. 527\u2013534. Morgan Kaufmann, San Francisco (2000), http:\/\/www.vldb.org\/conf\/2000\/P527.pdf"},{"key":"7_CR33","doi-asserted-by":"publisher","first-page":"292","DOI":"10.1145\/1013367.1013441","volume-title":"WWW Alt. \u201904: Proceedings of the 13th international World Wide Web conference on Alternate track papers & posters","author":"M. Diligenti","year":"2004","unstructured":"Diligenti, M., Maggini, M., Pucci, F.M., Scarselli, F.: Design of a crawler with bounded bandwidth. In: WWW Alt. \u201904: Proceedings of the 13th international World Wide Web conference on Alternate track papers & posters, pp. 292\u2013293. ACM Press, New York (2004), http:\/\/www2004.org\/proceedings\/docs\/2p292.pdf , doi:10.1145\/1013367.1013441"},{"key":"7_CR34","doi-asserted-by":"publisher","first-page":"39","DOI":"10.1145\/267658.267666","volume-title":"AGENTS \u201997: Proceedings of the first international conference on Autonomous agents","author":"R.B. Doorenbos","year":"1997","unstructured":"Doorenbos, R.B., Etzioni, O., Weld, D.S.: A scalable comparison-shopping agent for the World-Wide Web. In: AGENTS \u201997: Proceedings of the first international conference on Autonomous agents, pp. 39\u201348. ACM Press, New York (1997), doi:10.1145\/267658.267666"},{"key":"7_CR35","first-page":"1174","volume-title":"SAC \u201903: Proceedings of the 2003 ACM symposium on Applied computing","author":"M. Ehrig","year":"2004","unstructured":"Ehrig, M., Maedche, A.: Ontology-focused crawling of web documents. In: SAC 2003, pp. 1174\u20131178. ACM, New York (2004)"},{"key":"7_CR36","doi-asserted-by":"publisher","first-page":"669","DOI":"10.1145\/775152.775246","volume-title":"WWW \u201903: Proceedings of the 12th international conference on World Wide Web","author":"D. Fetterly","year":"2003","unstructured":"Fetterly, D., Manasse, M., Najork, M., Wiener, J.: A large-scale study of the evolution of web pages. In: WWW \u201903: Proceedings of the 12th international conference on World Wide Web, pp. 669\u2013678. ACM Press, New York (2003), http:\/\/www2003.org\/cdrom\/papers\/refereed\/p097\/P97%20sources\/p97-fetterly.html , doi:10.1145\/775152.775246"},{"key":"7_CR37","doi-asserted-by":"publisher","first-page":"367","DOI":"10.1145\/258549.258800","volume-title":"CHI \u201997: Proceedings of the SIGCHI conference on Human factors in computing systems","author":"G.W. Furnas","year":"1997","unstructured":"Furnas, G.W.: Effective view navigation. In: CHI \u201997: Proceedings of the SIGCHI conference on Human factors in computing systems, pp. 367\u2013374. ACM Press, New York (1997), doi:10.1145\/258549.258800"},{"issue":"11","key":"7_CR38","doi-asserted-by":"publisher","first-page":"964","DOI":"10.1145\/32206.32212","volume":"30","author":"G.W. Furnas","year":"1987","unstructured":"Furnas, G.W., Landauer, T.K., Gomez, L.M., Dumais, S.T.: The vocabulary problem in human-system communication. Communications of the ACM\u00a030(11), 964\u2013971 (1987), doi:10.1145\/32206.32212","journal-title":"Communications of the ACM"},{"key":"7_CR39","series-title":"Lecture Notes in Artificial Intelligence","doi-asserted-by":"crossref","first-page":"168","DOI":"10.1007\/978-3-540-45217-1_13","volume-title":"Cooperative Information Agents VII","author":"F. Gasparetti","year":"2003","unstructured":"Gasparetti, F., Micarelli, A.: Adaptive web search based on a colony of cooperative distributed agents. In: Klusch, M., Omicini, A., Ossowski, S., Laamanen, H. (eds.) CIA 2003. LNCS (LNAI), vol.\u00a02782, pp. 168\u2013183. Springer, Heidelberg (2003)"},{"key":"7_CR40","unstructured":"Gasparetti, F., Micarelli, A.: Swarm Intelligence: Agents for Adaptive Web Search. In: Proceedings of the 16th European Conference on Artificial Intelligence (ECAI 2004), pp. 1019\u20131020 (2004), http:\/\/citeseer.ist.psu.edu\/738711.html"},{"key":"7_CR41","doi-asserted-by":"crossref","unstructured":"Gasparetti, F., Micarelli, A.: User profile generation based on a memory retrieval theory. In: Proc. 1st International Workshop on Web Personalization, Recommender Systems and Intelligent User Interfaces (WPRSIUI\u201905), pp. 59\u201368 (2005), http:\/\/citeseer.ist.psu.edu\/gasparetti05user.html","DOI":"10.5220\/0001422500590068"},{"key":"7_CR42","series-title":"Lecture Notes in Computer Science","doi-asserted-by":"crossref","first-page":"54","DOI":"10.1007\/978-3-540-72079-9_2","volume-title":"The Adaptive Web: Methods and Strategies of Web Personalization","author":"S. Gauch","year":"2007","unstructured":"Gauch, S., Speretta, M., Chandramouli, A., Micarelli, A.: User profiles for personalized information access. In: Brusilovsky, P., Kobsa, A., Nejdl, W. (eds.) The Adaptive Web: Methods and Strategies of Web Personalization. LNCS, vol.\u00a04321, pp. 54\u201389. Springer, Heidelberg (2007)"},{"key":"7_CR43","doi-asserted-by":"publisher","first-page":"902","DOI":"10.1145\/1062745.1062789","volume-title":"WWW \u201905: Special interest tracks and posters of the 14th international conference on World Wide Web","author":"A. Gulli","year":"2005","unstructured":"Gulli, A., Signorini, A.: The indexable web is more than 11.5 billion pages. In: WWW \u201905: Special interest tracks and posters of the 14th international conference on World Wide Web, pp. 902\u2013903. ACM Press, New York (2005), http:\/\/www.cs.uiowa.edu\/~asignori\/web-size\/ , doi:10.1145\/1062745.1062789"},{"key":"7_CR44","doi-asserted-by":"crossref","unstructured":"Hersovicia, M., Jacovia, M., Maareka, Y.S., Pellegb, D., Shtalhaima, M., Ura, S.: The shark-search algorithm \u2013 An application: tailored Web site mapping. In: Proceedings of the 7th World Wide Web Conference (WWW7), Brisbane, Australia, pp. 317\u2013326 (1998), http:\/\/www7.scu.edu.au\/1849\/com1849.htm","DOI":"10.1016\/S0169-7552(98)00038-5"},{"issue":"4","key":"7_CR45","doi-asserted-by":"publisher","first-page":"219","DOI":"10.1023\/A:1019213109274","volume":"2","author":"A. Heydon","year":"1999","unstructured":"Heydon, A., Najork, M.: Mercator: A scalable, extensible Web crawler. World Wide Web.\u00a02(4), 219\u2013229 (1999)","journal-title":"World Wide Web"},{"key":"7_CR46","unstructured":"Joachims, T., Freitag, D., Mitchell, T.M.: WebWatcher: A Tour Guide for the World Wide Web. In: Proceedings of the 15h International Conference on Artificial Intelligence (IJCAI1997), pp. 770\u2013777 (1997), http:\/\/citeseer.ist.psu.edu\/16829.html"},{"key":"7_CR47","first-page":"668","volume-title":"Proceedings of the 9th annual ACM-SIAM symposium on Discrete algorithms","author":"J. Kleinberg","year":"1998","unstructured":"Kleinberg, J.: Authoritative Sources in a Hyperlinked Environment. In: Proceedings of the 9th annual ACM-SIAM symposium on Discrete algorithms, San Francisco, CA, USA, pp. 668\u2013677. ACM Press, New York (1998), http:\/\/www.cs.cornell.edu\/home\/kleinber\/auth.pdf"},{"key":"7_CR48","doi-asserted-by":"publisher","first-page":"272","DOI":"10.1145\/354756.354829","volume-title":"CIKM \u201900: Proceedings of the ninth international conference on Information and knowledge management","author":"A. Kruger","year":"2000","unstructured":"Kruger, A., Giles, C.L., Coetzee, F.M., Glover, E., Flake, G.W., Lawrence, S., Omlin, C.: DEADLINER: building a new niche search engine. In: CIKM \u201900: Proceedings of the ninth international conference on Information and knowledge management, pp. 272\u2013281. ACM Press, New York (2000), http:\/\/citeseer.ist.psu.edu\/kruger00deadliner.html , doi:10.1145\/354756.354829"},{"key":"7_CR49","doi-asserted-by":"publisher","first-page":"568","DOI":"10.1145\/775152.775233","volume-title":"WWW \u201903: Proceedings of the 12th international conference on World Wide Web","author":"R. Kumar","year":"2003","unstructured":"Kumar, R., Novak, J., Raghavan, P., Tomkins, A.: On the bursty evolution of blogspace. In: WWW \u201903: Proceedings of the 12th international conference on World Wide Web, pp. 568\u2013576. ACM Press, New York (2003), http:\/\/www2003.org\/cdrom\/papers\/refereed\/p477\/p477-kumar\/p477-kumar.htm , doi:10.1145\/775152.775233"},{"issue":"2","key":"7_CR50","doi-asserted-by":"publisher","first-page":"177","DOI":"10.1016\/j.datak.2003.10.003","volume":"49","author":"J.P. Lage","year":"2004","unstructured":"Lage, J.P., da Silva, A.S., Golgher, P.B., Laender, A.H.F.: Automatic generation of agents for collecting hidden web pages for data extraction. Data and Knowledge Engineering\u00a049(2), 177\u2013196 (2004)","journal-title":"Data and Knowledge Engineering"},{"key":"7_CR51","doi-asserted-by":"crossref","first-page":"119","DOI":"10.1007\/978-3-7091-2490-1_12","volume-title":"UM \u201999: Proceedings of the seventh international conference on User modeling","author":"T. Lau","year":"1999","unstructured":"Lau, T., Horvitz, E.: Patterns of search: analyzing and modeling Web query refinement. In: UM \u201999: Proceedings of the seventh international conference on User modeling, Secaucus, NJ, USA, pp. 119\u2013128. Springer, New York (1999)"},{"key":"7_CR52","doi-asserted-by":"publisher","first-page":"98","DOI":"10.1126\/science.280.5360.98","volume":"280","author":"S. Lawrence","year":"1998","unstructured":"Lawrence, S., Giles, L.C.: Searching the World Wide Web. Science\u00a0280, 98\u2013100 (1998)","journal-title":"Science"},{"key":"7_CR53","doi-asserted-by":"publisher","first-page":"107","DOI":"10.1038\/21987","volume":"400","author":"S. Lawrence","year":"1999","unstructured":"Lawrence, S., Giles, L.C.: Accessibility of information on the web. Nature\u00a0400, 107\u2013109 (1999)","journal-title":"Nature"},{"issue":"2","key":"7_CR54","doi-asserted-by":"publisher","first-page":"60","DOI":"10.1002\/swf.30","volume":"2","author":"M. Levene","year":"2001","unstructured":"Levene, M., Poulovassilis, A.: Web dynamics. Software Focus\u00a02(2), 60\u201367 (2001)","journal-title":"Software Focus"},{"issue":"2","key":"7_CR55","doi-asserted-by":"publisher","first-page":"159","DOI":"10.1145\/568954.568958","volume":"1","author":"W.-H. Lu","year":"2002","unstructured":"Lu, W.-H., Chien, L.-F., Lee, H.-J.: Translation of web queries using anchor text mining. ACM Transactions on Asian Language Information Processing (TALIP)\u00a01(2), 159\u2013172 (2002), doi:10.1145\/568954.568958","journal-title":"ACM Transactions on Asian Language Information Processing (TALIP)"},{"key":"7_CR56","doi-asserted-by":"crossref","unstructured":"Marchiori, M.: The Quest for Correct Information on the Web: Hyper Search Engines. In: Proceedings of the 6th World Wide Web Conference (WWW6), Santa Clara, CA, USA, pp. 1225\u20131235 (1997), http:\/\/www.w3.org\/People\/Massimo\/papers\/WWW6\/","DOI":"10.1016\/S0169-7552(97)00036-6"},{"issue":"14","key":"7_CR57","doi-asserted-by":"publisher","first-page":"1261","DOI":"10.1002\/asi.20081","volume":"55","author":"F. Menczer","year":"2004","unstructured":"Menczer, F.: Lexical and semantic clustering by Web links. Journal of the American Society for Information Science and Technology\u00a055(14), 1261\u20131269 (2004)","journal-title":"Journal of the American Society for Information Science and Technology"},{"issue":"11\u201316","key":"7_CR58","first-page":"1653","volume":"31","author":"F. Menczer","year":"2000","unstructured":"Menczer, F., Belew, R.K.: Adaptive retrieval agents: Internalizing local context and scaling up to the Web. Machine Learning\u00a031(11\u201316), 1653\u20131665 (2000)","journal-title":"Machine Learning"},{"issue":"4","key":"7_CR59","doi-asserted-by":"publisher","first-page":"378","DOI":"10.1145\/1031114.1031117","volume":"4","author":"F. Menczer","year":"2004","unstructured":"Menczer, F., Pant, G., Srinivasan, P.: Topical web crawlers: Evaluating adaptive algorithms. ACM Transactions on Internet Technology\u00a04(4), 378\u2013419 (2004)","journal-title":"ACM Transactions on Internet Technology"},{"key":"7_CR60","doi-asserted-by":"crossref","unstructured":"Metropolis, N., Rosenbluth, A.W., Rosenbluth, M.N., Teller, A., Teller, E.: Equations of State Calculations by Fast Computing Machines. Journal of Chemical Physics\u00a021(6) (1953)","DOI":"10.1063\/1.1699114"},{"key":"7_CR61","series-title":"Lecture Notes in Computer Science","doi-asserted-by":"crossref","first-page":"195","DOI":"10.1007\/978-3-540-72079-9_6","volume-title":"The Adaptive Web: Methods and Strategies of Web Personalization","author":"A. Micarelli","year":"2007","unstructured":"Micarelli, A., Gasparetti, F., Sciarrone, F., Gauch, S.: Personalized Search on the World Wide Web. In: Brusilovsky, P., Kobsa, A., Nejdl, W. (eds.) The Adaptive Web: Methods and Strategies of Web Personalization. LNCS, vol.\u00a04321, pp. 195\u2013230. Springer, Heidelberg (2007)"},{"key":"7_CR62","series-title":"Lecture Notes in Computer Science","doi-asserted-by":"crossref","first-page":"155","DOI":"10.1007\/978-3-540-72079-9_5","volume-title":"The Adaptive Web: Methods and Strategies of Web Personalization","author":"A. Micarelli","year":"2007","unstructured":"Micarelli, A., Sciarrone, F., Marinilli, M.: Web Document modeling. In: Brusilovsky, P., Kobsa, A., Nejdl, W. (eds.) The Adaptive Web: Methods and Strategies of Web Personalization. LNCS, vol.\u00a04321, pp. 155\u2013194. Springer, Heidelberg (2007)"},{"key":"7_CR63","doi-asserted-by":"publisher","first-page":"13","DOI":"10.1145\/294469.294474","volume-title":"Proceedings of the 10th ACM Conference on Hypertext and Hypermedia: Returning to Our Diverse Roots (HYPERTEXT99)","author":"Y. Mizuuchi","year":"1999","unstructured":"Mizuuchi, Y., Tajima, K.: Finding Context Paths for Web Pages. In: Proceedings of the 10th ACM Conference on Hypertext and Hypermedia: Returning to Our Diverse Roots (HYPERTEXT99), Darmstadt, Germany, pp. 13\u201322. ACM Press, New York (1999)"},{"key":"7_CR64","doi-asserted-by":"crossref","first-page":"25","DOI":"10.1007\/978-1-4615-0005-6_2","volume-title":"Handbook of massive data sets","author":"M. Najork","year":"2002","unstructured":"Najork, M., Heydon, A.: High-performance web crawling. In: Abello, J., Pardalos, P.M., Resende, M.G. (eds.) Handbook of massive data sets, pp. 25\u201345. Kluwer Academic Publishers, Norwell (2002)"},{"key":"7_CR65","doi-asserted-by":"crossref","unstructured":"Najork, M., Wiener, J.L.: Breadth-first search crawling yields high-quality pages. In: Proceedings of the 10th World Wide Web Conference (WWW10), Hong Kong, pp. 114\u2013118 (2001), http:\/\/www10.org\/cdrom\/papers\/208\/","DOI":"10.1145\/371920.371965"},{"key":"7_CR66","doi-asserted-by":"publisher","first-page":"1","DOI":"10.1145\/988672.988674","volume-title":"Proceedings of the 13th international conference on World Wide Web","author":"A. Ntoulas","year":"2004","unstructured":"Ntoulas, A., Cho, J., Olston, C.: What\u2019s new on the web?: the evolution of the web from a search engine perspective. In: Feldman, S.I., Uretsky, M., Najork, M., Wills, C.E. (eds.) Proceedings of the 13th international conference on World Wide Web. WWW 2004, New York, NY, USA, May 17-20, pp. 1\u201312. ACM Press, New York (2004), http:\/\/www2004.org\/proceedings\/docs\/1p1.pdf"},{"key":"7_CR67","doi-asserted-by":"publisher","first-page":"100","DOI":"10.1145\/1065385.1065407","volume-title":"Proceedings of ACM\/IEEE Joint Conference on Digital Libraries","author":"A. Ntoulas","year":"2005","unstructured":"Ntoulas, A., Zerfos, P., Cho, J.: Downloading textual hidden web content through keyword queries. In: Marlino, M., Sumner, T., Shipman, F. (eds.) Proceedings of ACM\/IEEE Joint Conference on Digital Libraries. JCDL 2005, Denver, CA, USA, June 7-11, pp. 100\u2013109. ACM, New York (2005)"},{"key":"7_CR68","unstructured":"Page, L., Brin, S., Motwani, R., Winograd, T.: The pagerank citation ranking: Bringing order to the web. Technical report, Stanford Digital Library Technologies Project (1998) http:\/\/dbpubs.stanford.edu\/pub\/1999-66"},{"key":"7_CR69","unstructured":"Pinkerton, B.: Finding What People Want: Experiences with the WebCrawler. In: Proceedings of the 2nd World Wide Web Conference (WWW2), Chicago, USA, pp. 821\u2013829 (1994)"},{"key":"7_CR70","doi-asserted-by":"publisher","first-page":"643","DOI":"10.1037\/0033-295X.106.4.643","volume":"106","author":"P. Pirolli","year":"1999","unstructured":"Pirolli, P., Card, S.K.: Information foraging. Psychological Review\u00a0106, 643\u2013675 (1999)","journal-title":"Psychological Review"},{"key":"7_CR71","first-page":"129","volume-title":"VLDB \u201901: Proceedings of the 27th International Conference on Very Large Data Bases","author":"S. Raghavan","year":"2001","unstructured":"Raghavan, S., Garcia-Molina, H.: Crawling the Hidden Web. In: VLDB \u201901: Proceedings of the 27th International Conference on Very Large Data Bases, pp. 129\u2013138. Morgan Kaufmann, San Francisco (2001)"},{"key":"7_CR72","first-page":"335","volume-title":"ICML \u201999: Proceedings of the Sixteenth International Conference on Machine Learning","author":"J. Rennie","year":"1999","unstructured":"Rennie, J., McCallum, A.: Using reinforcement learning to spider the web efficiently. In: ICML \u201999: Proceedings of the Sixteenth International Conference on Machine Learning, pp. 335\u2013343. Morgan Kaufmann Publishers Inc, San Francisco (1999), http:\/\/citeseer.ist.psu.edu\/7537.html"},{"key":"7_CR73","doi-asserted-by":"crossref","first-page":"318","DOI":"10.7551\/mitpress\/5236.001.0001","volume-title":"Parallel distributed processing: explorations in the microstructure of cognition, vol. 1: foundations","author":"D.E. Rumelhart","year":"1986","unstructured":"Rumelhart, D.E., Hinton, G.E., Williams, R.J.: Learning internal representations by error propagation. In: Rumelhart, D.E., McClelland, J.L. (eds.) Parallel distributed processing: explorations in the microstructure of cognition, vol. 1: foundations, pp. 318\u2013362. MIT Press, Cambridge (1986)"},{"issue":"2","key":"7_CR74","doi-asserted-by":"publisher","first-page":"97","DOI":"10.1016\/j.jnca.2004.01.001","volume":"28","author":"A. Rungsawang","year":"2005","unstructured":"Rungsawang, A., Angkawattanawit, N.: Learnable topic-specific web crawler. Journal of Network and Computer Applications\u00a028(2), 97\u2013114 (2005), doi:10.1016\/j.jnca.2004.01.001","journal-title":"Journal of Network and Computer Applications"},{"key":"7_CR75","volume-title":"Introduction to Modern Information Retrieval","author":"G. Salton","year":"1983","unstructured":"Salton, G., McGill, M.J.: Introduction to Modern Information Retrieval. McGraw-Hill, New York (1983)"},{"key":"7_CR76","doi-asserted-by":"publisher","first-page":"357","DOI":"10.1109\/ICDE.2002.994750","volume-title":"Proceedings of the 18th International Conference on Data Engineering (ICDE\u201902)","author":"V. Shkapenyuk","year":"2002","unstructured":"Shkapenyuk, V., Suel, T.: Design and implementation of a high-performance distributed web crawler. In: Proceedings of the 18th International Conference on Data Engineering (ICDE\u201902), Washington, DC, USA, p. 357. IEEE Computer Society Press, Los Alamitos (2002)"},{"key":"7_CR77","unstructured":"Spink, A., Jansen, B.J.: A study of Web search trends. Webology\u00a01(2) (2004), http:\/\/www.webology.ir\/2004\/v1n2\/a4.html"},{"issue":"3","key":"7_CR78","doi-asserted-by":"publisher","first-page":"226","DOI":"10.1002\/1097-4571(2000)9999:9999<::AID-ASI1591>3.0.CO;2-R","volume":"52","author":"A. Spink","year":"2001","unstructured":"Spink, A., Wolfram, D., Jansen, M.B.J., Saracevic, T.: Searching the Web: the public and their queries. Journal of the American Society for Information Science\u00a052(3), 226\u2013234 (2001)","journal-title":"Journal of the American Society for Information Science"},{"issue":"3","key":"7_CR79","doi-asserted-by":"publisher","first-page":"417","DOI":"10.1007\/s10791-005-6993-5","volume":"8","author":"P. Srinivasan","year":"2005","unstructured":"Srinivasan, P., Menczer, F., Pant, G.: A General Evaluation Framework for Topical Crawlers. Information Retrieval\u00a08(3), 417\u2013447 (2005)","journal-title":"Information Retrieval"},{"key":"7_CR80","unstructured":"Steele, R.: Techniques for Specialized Search Engines. In: Proc. Internet Computing 2001, Las Vegas, June 25\u201328 (2001), http:\/\/citeseer.ist.psu.edu\/steele01techniques.html"},{"key":"7_CR81","volume-title":"Introduction to Reinforcement Learning","author":"R.S. Sutton","year":"1998","unstructured":"Sutton, R.S., Barto, A.G.: Introduction to Reinforcement Learning. MIT Press, Cambridge (1998)"},{"issue":"2","key":"7_CR82","doi-asserted-by":"publisher","first-page":"269","DOI":"10.1016\/S0167-9236(99)00091-3","volume":"28","author":"C.C. Yang","year":"2000","unstructured":"Yang, C.C., Yen, J., Chen, H.: Intelligent Internet searching agent based on hybrid simulated annealing. Decision Support Systems\u00a028(2), 269\u2013277 (2000)","journal-title":"Decision Support Systems"},{"key":"7_CR83","doi-asserted-by":"crossref","unstructured":"Yuwono, B., Lam, S.L.Y., Ying, J.H., Lee, D.L.: A World Wide Web Resource Discovery System. In: Proceedings of the 4th World Wide Web Conference (WWW4), Boston, Massachusetts, USA, pp. 145\u2013158 (1995), http:\/\/www.w3.org\/Conferences\/WWW4\/Papers\/66\/","DOI":"10.1145\/3592626.3592637"}],"container-title":["Lecture Notes in Computer Science","The Adaptive Web"],"original-title":[],"language":"en","link":[{"URL":"http:\/\/link.springer.com\/content\/pdf\/10.1007\/978-3-540-72079-9_7.pdf","content-type":"unspecified","content-version":"vor","intended-application":"similarity-checking"}],"deposited":{"date-parts":[[2025,1,16]],"date-time":"2025-01-16T07:42:11Z","timestamp":1737013331000},"score":1,"resource":{"primary":{"URL":"http:\/\/link.springer.com\/10.1007\/978-3-540-72079-9_7"}},"subtitle":[],"short-title":[],"issued":{"date-parts":[[null]]},"ISBN":["9783540720782"],"references-count":83,"URL":"https:\/\/doi.org\/10.1007\/978-3-540-72079-9_7","relation":{},"subject":[]}}