{"status":"ok","message-type":"work","message-version":"1.0.0","message":{"indexed":{"date-parts":[[2024,9,10]],"date-time":"2024-09-10T18:08:59Z","timestamp":1725991739998},"publisher-location":"Berlin, Heidelberg","reference-count":36,"publisher":"Springer Berlin Heidelberg","isbn-type":[{"type":"print","value":"9783662580387"},{"type":"electronic","value":"9783662580394"}],"license":[{"start":{"date-parts":[[2018,1,1]],"date-time":"2018-01-01T00:00:00Z","timestamp":1514764800000},"content-version":"unspecified","delay-in-days":0,"URL":"http:\/\/www.springer.com\/tdm"}],"content-domain":{"domain":["link.springer.com"],"crossmark-restriction":false},"short-container-title":[],"published-print":{"date-parts":[[2018]]},"DOI":"10.1007\/978-3-662-58039-4_4","type":"book-chapter","created":{"date-parts":[[2018,9,16]],"date-time":"2018-09-16T06:39:40Z","timestamp":1537079980000},"page":"61-78","update-policy":"http:\/\/dx.doi.org\/10.1007\/springer_crossmark_policy","source":"Crossref","is-referenced-by-count":0,"title":["$${{\\textsc {ber}}}_{y}{\\textsc {l}}$$BERyL: A System for Web Block Classification"],"prefix":"10.1007","author":[{"given":"Andrey","family":"Kravchenko","sequence":"first","affiliation":[],"role":[{"role":"author","vocabulary":"crossref"}]}],"member":"297","published-online":{"date-parts":[[2018,9,16]]},"reference":[{"key":"4_CR1","unstructured":"Abiteboul, S., Hull, R., Vianu, V.: Foundations of Databases. Addison-Wesley Longman Publishing Co. Inc., Boston (1995)"},{"key":"4_CR2","unstructured":"Baumgartner, R., Flesca, S., Gottlob, G.: Visual web information extraction with Lixto. In: VLDB (2001)"},{"key":"4_CR3","doi-asserted-by":"crossref","unstructured":"Baluja, S.: Browsing on small screens: recasting web-page segmentation into an efficient machine learning framework. In: WWW 2006 (2006)","DOI":"10.1145\/1135777.1135788"},{"key":"4_CR4","doi-asserted-by":"crossref","unstructured":"Burget, R., Rudolfova, I.: Web page element classification based on visual features. In: 2009 First Asia Conference on Intelligent Information and Database Systems (2009)","DOI":"10.1109\/ACIIDS.2009.71"},{"key":"4_CR5","doi-asserted-by":"crossref","unstructured":"Cai, D., Yu, S., Wen, J., Ma, W.: Block-based web search. In: SIGIR 2004, 25\u201329 July 2004 (2004)","DOI":"10.1145\/1008992.1009070"},{"key":"4_CR6","doi-asserted-by":"crossref","unstructured":"Cai, D., He, X., Wen, J., Ma, W.: Block-level link analysis. In: SIGIR 2004, 25\u201329 July 2004 (2004)","DOI":"10.1145\/1008992.1009068"},{"key":"4_CR7","doi-asserted-by":"crossref","unstructured":"Cao, Y., Niu, Z., Dai, L., Zhao, Y.: Extraction of informative blocks from web pages. In: ALPIT 2008 (2008)","DOI":"10.1109\/ALPIT.2008.106"},{"key":"4_CR8","unstructured":"Chen, J., Zhou, B., Shi, J., Zhang, H., Fengwu, Q.: Function-based object model towards website adaptation. In: WWW 2010, 1\u20135 May 2010 (2010)"},{"key":"4_CR9","series-title":"Lecture Notes in Computer Science","doi-asserted-by":"publisher","DOI":"10.1007\/978-3-642-24206-9","volume-title":"Datalog Reloaded","year":"2011","unstructured":"de Moor, O., Gottlob, G., Furche, T., Sellers, A. (eds.): Datalog 2.0 2010. LNCS, vol. 6702. Springer, Heidelberg (2011). https:\/\/doi.org\/10.1007\/978-3-642-24206-9"},{"key":"4_CR10","series-title":"Lecture Notes in Computer Science","doi-asserted-by":"publisher","first-page":"332","DOI":"10.1007\/978-3-642-31753-8_27","volume-title":"Web Engineering","author":"T Furche","year":"2012","unstructured":"Furche, T., Grasso, G., Kravchenko, A., Schallhart, C.: Turn the page: automated traversal of paginated websites. In: Brambilla, M., Tokuda, T., Tolksdorf, R. (eds.) ICWE 2012. LNCS, vol. 7387, pp. 332\u2013346. Springer, Heidelberg (2012). https:\/\/doi.org\/10.1007\/978-3-642-31753-8_27"},{"key":"4_CR11","doi-asserted-by":"crossref","unstructured":"Furche, T., et al.: DIADEM: domain-centric, intelligent, automated data extraction methodology. In: WWW 2012 (2012)","DOI":"10.1145\/2187980.2188025"},{"issue":"4","key":"4_CR12","doi-asserted-by":"publisher","first-page":"349","DOI":"10.1007\/s10032-010-0136-2","volume":"14","author":"Aman Goel","year":"2010","unstructured":"Goel, A., Michelson, M., Knoblock, C.A.: Harvesting maps on the web. Int. J. Doc. Anal. Recognit. 14(4), 349 (2011)","journal-title":"International Journal on Document Analysis and Recognition (IJDAR)"},{"key":"4_CR13","series-title":"Lecture Notes in Computer Science","doi-asserted-by":"publisher","first-page":"54","DOI":"10.1007\/978-3-642-33158-9_2","volume-title":"Reasoning Web. Semantic Technologies for Advanced Query Answering","author":"G Gottlob","year":"2012","unstructured":"Gottlob, G., Orsi, G., Pieris, A., \u0160imkus, M.: Datalog and its extensions for semantic web databases. In: Eiter, T., Krennwallner, T. (eds.) Reasoning Web 2012. LNCS, vol. 7487, pp. 54\u201377. Springer, Heidelberg (2012). https:\/\/doi.org\/10.1007\/978-3-642-33158-9_2"},{"key":"4_CR14","doi-asserted-by":"crossref","unstructured":"Gupta, S., Kaiser, G., Neistadt, D., Grimm, P.: DOM-based content extraction of HTML documents. In: WWW 2003, 20\u201324 May 2003 (2003)","DOI":"10.1145\/775181.775182"},{"key":"4_CR15","doi-asserted-by":"crossref","unstructured":"Kang, J., Choi, J.: Block classification of a web page by using a combination of multiple classifiers. In: Fourth International Conference on Networked Computing and Advanced Information Management, 2\u20134 September 2008 (2008)","DOI":"10.1109\/NCM.2008.170"},{"key":"4_CR16","unstructured":"Kang, J., Choi, J.: Recognising informative web page blocks using visual segmentation for efficient information extraction. J. Univ. Comput. Sci. 14(11), 1893 (2008)"},{"key":"4_CR17","doi-asserted-by":"crossref","unstructured":"Keller, M., Hartenstein, H.: GRABEX: a graph-based method for web site block classification and its application on mining breadcrumb trails. In: 2013 IEEE\/WIC\/ACM International Conferences on Web Intelligence (WI) and Intelligent Agent Technology (IAT) (2013)","DOI":"10.1109\/WI-IAT.2013.42"},{"key":"4_CR18","doi-asserted-by":"crossref","unstructured":"Kordomatis, I., Herzog, C., Fayzrakhmanov, R.R., Kr\u00fcpl-Sypien, B., Holzinger, W., Baumgartner, R.: Web object identification for web automation and meta-search. In: WIMS 2013 (2012)","DOI":"10.1145\/2479787.2479798"},{"key":"4_CR19","doi-asserted-by":"crossref","unstructured":"Kr\u00fcpl-Sypien, B., Fayzrakhmanov, R.R., Holzinger, W., Panzenb\u00f6ck, M., Baumgartner, R.: A versatile model for web page representation, information extraction and content re-packaging. In: DocEng 2011, 19\u201322 September 2011 (2011)","DOI":"10.1145\/2034691.2034721"},{"key":"4_CR20","doi-asserted-by":"crossref","unstructured":"Lee, C.H., Kan, M., Lai, S.: Stylistic and lexical co-training for web block classification. In: WIDM 2004, 12\u201313 November 2004 (2004)","DOI":"10.1145\/1031453.1031478"},{"key":"4_CR21","unstructured":"Li, C., Dong, J., Chen, J.: Extraction of informative blocks from web pages based on VIPS. J. Comput. Inf. Syst. 6(1), 271 (2010)"},{"issue":"3","key":"4_CR22","doi-asserted-by":"publisher","first-page":"447","DOI":"10.1109\/TKDE.2009.109","volume":"22","author":"Wei Liu","year":"2010","unstructured":"Liu, W., Meng, X.: VIDE: a vision-based approach for deep web data extraction. IEEE Trans. Knowl. Data Engineering 22(3), 447 (2010)","journal-title":"IEEE Transactions on Knowledge and Data Engineering"},{"key":"4_CR23","doi-asserted-by":"crossref","unstructured":"Luo, P., Lin, F., Xiong, Y., Zhao, Y., Shi, Z.: Towards combining web classification and web information extraction: a case study. In: KDD 2009, 28 June\u20131 July (2009)","DOI":"10.1145\/1557019.1557152"},{"key":"4_CR24","doi-asserted-by":"crossref","unstructured":"Maekawa, T., Hara, T., Nishio, S.: Image classification for mobile web browsing. In: WWW 2006, 23\u201326 May (2006)","DOI":"10.1145\/1135777.1135789"},{"key":"4_CR25","series-title":"Lecture Notes in Computer Science","doi-asserted-by":"publisher","first-page":"388","DOI":"10.1007\/978-3-540-28637-0_43","volume-title":"Mobile Human-Computer Interaction - MobileHCI 2004","author":"R Romero","year":"2004","unstructured":"Romero, R., Berger, A.: Automatic partitioning of web pages using clustering. In: Brewster, S., Dunlop, M. (eds.) Mobile HCI 2004. LNCS, vol. 3160, pp. 388\u2013393. Springer, Heidelberg (2004). https:\/\/doi.org\/10.1007\/978-3-540-28637-0_43"},{"key":"4_CR26","doi-asserted-by":"crossref","unstructured":"Song, R., Liu, H., Wen, J., Ma, W.: Learning block importance models for web pages. In: WWW 2004, 17\u201322 May (2004)","DOI":"10.1145\/988672.988700"},{"key":"4_CR27","doi-asserted-by":"crossref","unstructured":"Vadrevu, S., Velipasaoglu, E.: Identifying primary content from web page and its application to web search ranking. In: WWW 2011 (2011)","DOI":"10.1145\/1963192.1963261"},{"key":"4_CR28","doi-asserted-by":"crossref","unstructured":"Wang, J., et al.: Can we learn a template-independent wrapper for news article extraction from a single training site? In: KDD 2009, 28 June\u20131 July (2009)","DOI":"10.1145\/1557019.1557163"},{"key":"4_CR29","doi-asserted-by":"crossref","unstructured":"Wu, C., Zeng, G., Xu, G.: A web page segmentation algorithm for extracting product information. In: Proceedings of the 2006 IEEE International Conference on Information Acquisition, 20\u201323 August 2006 (2006)","DOI":"10.1109\/ICIA.2006.305954"},{"key":"4_CR30","doi-asserted-by":"crossref","unstructured":"Xiang, P., Yang, X., Shi, Y.: Effective page segmentation combining pattern analysis and visual separators for browsing on small screens. In: Proceedings of the 2006 IEEE\/WIC\/ACM International Conference on Web Intelligence (2006)","DOI":"10.1109\/WI.2006.67"},{"key":"4_CR31","doi-asserted-by":"crossref","unstructured":"Xiang, P., Yang, X., Shi, Y.: Web page segmentation based on gestalt theory. In: 2007 IEEE International Conference on Multimedia and Expo (2007)","DOI":"10.1109\/ICME.2007.4285135"},{"key":"4_CR32","doi-asserted-by":"crossref","unstructured":"Yang, X., Shi, Y.: Learning web block functions using roles of images. In: Third International Conference on Pervasive Computing and Applications, 6\u20138 October 2008 (2008)","DOI":"10.1109\/ICPCA.2008.4783565"},{"key":"4_CR33","doi-asserted-by":"crossref","unstructured":"Yi, L., Liu, B., Li, X.: Eliminating noisy information in web pages for data mining. In: SIGKDD 2003, 24\u201327 August 2003 (2003)","DOI":"10.1145\/956755.956785"},{"key":"4_CR34","doi-asserted-by":"crossref","unstructured":"Yu, S., Cai, D., Wen, J., Ma, W.: Improving pseudo-relevance feedback in web information retrieval using web page segmentation. In: WWW 2003, 20\u201324 May 2003 (2003)","DOI":"10.1145\/775152.775155"},{"key":"4_CR35","doi-asserted-by":"crossref","unstructured":"Zheng, S., Song, R., Wen, J., Giles, C.L.: Efficient record-level wrapper induction. In: CIKM 2009, 2\u20136 November 2009 (2009)","DOI":"10.1145\/1645953.1645962"},{"key":"4_CR36","doi-asserted-by":"crossref","unstructured":"Zhu, J., Nie, Z., Wen, J., Zhang, B., Ma, W.: Simultaneous record detection and attribute labeling in web data extraction. In: KDD 2006, 20\u201323 August 2006 (2006)","DOI":"10.1145\/1150402.1150457"}],"container-title":["Lecture Notes in Computer Science","Transactions on Computational Science XXXIII"],"original-title":[],"link":[{"URL":"http:\/\/link.springer.com\/content\/pdf\/10.1007\/978-3-662-58039-4_4","content-type":"unspecified","content-version":"vor","intended-application":"similarity-checking"}],"deposited":{"date-parts":[[2022,9,1]],"date-time":"2022-09-01T14:03:00Z","timestamp":1662040980000},"score":1,"resource":{"primary":{"URL":"http:\/\/link.springer.com\/10.1007\/978-3-662-58039-4_4"}},"subtitle":[],"short-title":[],"issued":{"date-parts":[[2018]]},"ISBN":["9783662580387","9783662580394"],"references-count":36,"URL":"https:\/\/doi.org\/10.1007\/978-3-662-58039-4_4","relation":{},"ISSN":["0302-9743","1611-3349"],"issn-type":[{"type":"print","value":"0302-9743"},{"type":"electronic","value":"1611-3349"}],"subject":[],"published":{"date-parts":[[2018]]}}}