{"status":"ok","message-type":"work","message-version":"1.0.0","message":{"indexed":{"date-parts":[[2024,9,9]],"date-time":"2024-09-09T16:57:11Z","timestamp":1725901031078},"publisher-location":"Berlin, Heidelberg","reference-count":19,"publisher":"Springer Berlin Heidelberg","isbn-type":[{"type":"print","value":"9783642317521"},{"type":"electronic","value":"9783642317538"}],"content-domain":{"domain":[],"crossmark-restriction":false},"short-container-title":[],"published-print":{"date-parts":[[2012]]},"DOI":"10.1007\/978-3-642-31753-8_27","type":"book-chapter","created":{"date-parts":[[2012,7,21]],"date-time":"2012-07-21T02:21:08Z","timestamp":1342837268000},"page":"332-346","source":"Crossref","is-referenced-by-count":8,"title":["Turn the Page: Automated Traversal of Paginated Websites"],"prefix":"10.1007","author":[{"given":"Tim","family":"Furche","sequence":"first","affiliation":[],"role":[{"role":"author","vocabulary":"crossref"}]},{"given":"Giovanni","family":"Grasso","sequence":"additional","affiliation":[],"role":[{"role":"author","vocabulary":"crossref"}]},{"given":"Andrey","family":"Kravchenko","sequence":"additional","affiliation":[],"role":[{"role":"author","vocabulary":"crossref"}]},{"given":"Christian","family":"Schallhart","sequence":"additional","affiliation":[],"role":[{"role":"author","vocabulary":"crossref"}]}],"member":"297","reference":[{"issue":"6","key":"27_CR1","doi-asserted-by":"publisher","first-page":"886","DOI":"10.1016\/j.is.2006.09.004","volume":"32","author":"G. Almpanidis","year":"2007","unstructured":"Almpanidis, G., Kotropoulos, C., Pitas, I.: Combining text and link analysis for focused crawling - an application for vertical search engines. Inf. Syst.\u00a032(6), 886\u2013908 (2007)","journal-title":"Inf. Syst."},{"issue":"2","key":"27_CR2","doi-asserted-by":"publisher","first-page":"183","DOI":"10.1016\/0169-7552(94)90132-5","volume":"27","author":"P.D. Bra","year":"1994","unstructured":"Bra, P.D., Post, R.D.J.: Information retrieval in the world-wide web: Making client-based searching feasible. Computer Networks and ISDN Systems\u00a027(2), 183\u2013192 (1994)","journal-title":"Computer Networks and ISDN Systems"},{"doi-asserted-by":"crossref","unstructured":"Chakrabarti, S., Berg, M.V.D., Dom, B.: Focused crawling: a new approach to topic-specific web resource discovery. In: Computer Networks, pp. 1623\u20131640 (1999)","key":"27_CR3","DOI":"10.1016\/S1389-1286(99)00052-3"},{"issue":"5","key":"27_CR4","doi-asserted-by":"publisher","first-page":"731","DOI":"10.1145\/1017460.1017462","volume":"51","author":"V. Crescenzi","year":"2004","unstructured":"Crescenzi, V., Mecca, G.: Automatic information extraction from large websites. J. ACM\u00a051(5), 731\u2013779 (2004)","journal-title":"J. ACM"},{"unstructured":"Cunningham, H., Maynard, D., Bontcheva, K., Tablan, V., Aswani, N., Roberts, I., Gorrell, G., Funk, A., Roberts, A., Damljanovic, D., Heitz, T., Greenwood, M.A., Saggion, H., Petrak, J., Li, Y., Peters, W.: Text Processing with GATE, Version 6 (2011)","key":"27_CR5"},{"unstructured":"Diligenti, M., Coetzee, F.M., Lawrence, S., Giles, C.L., Gori, M.: Focused crawling using context graphs. In: VLDB, pp. 527\u2013534 (2000)","key":"27_CR6"},{"key":"27_CR7","doi-asserted-by":"publisher","first-page":"127","DOI":"10.1007\/s10115-009-0275-2","volume":"26","author":"B. Fazzinga","year":"2011","unstructured":"Fazzinga, B., Flesca, S., Tagarelli, A.: Schema-based web wrapping. Knowledge and Inf. Sys.\u00a026, 127\u2013173 (2011)","journal-title":"Knowledge and Inf. Sys."},{"issue":"1-7","key":"27_CR8","doi-asserted-by":"publisher","first-page":"317","DOI":"10.1016\/S0169-7552(98)00038-5","volume":"30","author":"M. Hersovici","year":"1998","unstructured":"Hersovici, M., Jacovi, M., Maarek, Y.S., Pelleg, D., Shtalhaim, M., Ur, S.: The shark-search algorithm. an application: tailored web site mapping. Computer Networks and ISDN Systems\u00a030(1-7), 317\u2013326 (1998)","journal-title":"Computer Networks and ISDN Systems"},{"doi-asserted-by":"crossref","unstructured":"Kang, J., Choi, J.: Block classification of a web page by using a combination of multiple classifiers. In: NCM (2008)","key":"27_CR9","DOI":"10.1109\/NCM.2008.170"},{"doi-asserted-by":"crossref","unstructured":"Lee, C.H., Ken, M.Y., Lai, S.: Stylistic and lexical co-training for web block classification. In: WIDM (2004)","key":"27_CR10","DOI":"10.1145\/1031453.1031478"},{"doi-asserted-by":"crossref","unstructured":"Liu, H., Janssen, J., Milios, E.: Using HMM to learn user browsing patterns for focused web crawling. DKE\u00a059(2) (2006)","key":"27_CR11","DOI":"10.1016\/j.datak.2006.01.012"},{"issue":"4","key":"27_CR12","doi-asserted-by":"publisher","first-page":"430","DOI":"10.1145\/1095872.1095875","volume":"23","author":"G. Pant","year":"2005","unstructured":"Pant, G., Srinivasan, P.: Learning to crawl: Comparing classification schemes. TOIS\u00a023(4), 430\u2013462 (2005)","journal-title":"TOIS"},{"issue":"1","key":"27_CR13","first-page":"107","volume":"18","author":"G. Pant","year":"2006","unstructured":"Pant, G., Srinivasan, P.: Link contexts in classifier-guided topical crawlers. TKDE\u00a018(1), 107\u2013122 (2006)","journal-title":"TKDE"},{"doi-asserted-by":"crossref","unstructured":"Song, R., Liu, H., Wen, J.-R., Ma, W.-Y.: Learning block importance model for web pages. In: WWW (2004)","key":"27_CR14","DOI":"10.1145\/988672.988700"},{"key":"27_CR15","doi-asserted-by":"publisher","first-page":"417","DOI":"10.1007\/s10791-005-6993-5","volume":"8","author":"P. Srinivasan","year":"2005","unstructured":"Srinivasan, P., Menczer, F., Pant, G.: A general evaluation framework for topical crawlers. Inf. Retrieval\u00a08, 417\u2013447 (2005)","journal-title":"Inf. Retrieval"},{"doi-asserted-by":"crossref","unstructured":"Wang, J., Chen, C., Wang, C., Pei, J., Bu, J., Guan, Z., Zhang, W.V.: Can we learn a template-independent wrapper for news article extraction from a single training site? In: KDD (2009)","key":"27_CR16","DOI":"10.1145\/1557019.1557163"},{"doi-asserted-by":"crossref","unstructured":"Yang, X., Shi, Y.: Learning web page block functions using roles of images. In: ICPCA (2008)","key":"27_CR17","DOI":"10.1109\/ICPCA.2008.4783565"},{"doi-asserted-by":"crossref","unstructured":"Zhai, Y., Liu, B.: Web data extraction based on partial tree alignment. In: WWW (2005)","key":"27_CR18","DOI":"10.1145\/1060745.1060761"},{"doi-asserted-by":"crossref","unstructured":"Zheng, S., Song, R., Wen, J.-R., Giles, C.L.: Efficient record-level wrapper induction. In: CIKM (2009)","key":"27_CR19","DOI":"10.1145\/1645953.1645962"}],"container-title":["Lecture Notes in Computer Science","Web Engineering"],"original-title":[],"link":[{"URL":"http:\/\/link.springer.com\/content\/pdf\/10.1007\/978-3-642-31753-8_27.pdf","content-type":"unspecified","content-version":"vor","intended-application":"similarity-checking"}],"deposited":{"date-parts":[[2021,5,4]],"date-time":"2021-05-04T07:47:08Z","timestamp":1620114428000},"score":1,"resource":{"primary":{"URL":"http:\/\/link.springer.com\/10.1007\/978-3-642-31753-8_27"}},"subtitle":[],"short-title":[],"issued":{"date-parts":[[2012]]},"ISBN":["9783642317521","9783642317538"],"references-count":19,"URL":"https:\/\/doi.org\/10.1007\/978-3-642-31753-8_27","relation":{},"ISSN":["0302-9743","1611-3349"],"issn-type":[{"type":"print","value":"0302-9743"},{"type":"electronic","value":"1611-3349"}],"subject":[],"published":{"date-parts":[[2012]]}}}