{"status":"ok","message-type":"work","message-version":"1.0.0","message":{"indexed":{"date-parts":[[2025,10,8]],"date-time":"2025-10-08T22:21:28Z","timestamp":1759962088052},"publisher-location":"Berlin, Heidelberg","reference-count":13,"publisher":"Springer Berlin Heidelberg","isbn-type":[{"type":"print","value":"9783540720348"},{"type":"electronic","value":"9783540720355"}],"content-domain":{"domain":[],"crossmark-restriction":false},"short-container-title":[],"DOI":"10.1007\/978-3-540-72035-5_30","type":"book-chapter","created":{"date-parts":[[2007,6,5]],"date-time":"2007-06-05T16:02:15Z","timestamp":1181059335000},"page":"391-397","source":"Crossref","is-referenced-by-count":10,"title":["Automatic Document Structure Detection for Data Integration"],"prefix":"10.1007","author":[{"given":"Radek","family":"Burget","sequence":"first","affiliation":[]}],"member":"297","reference":[{"key":"30_CR1","doi-asserted-by":"crossref","unstructured":"Chen, J., et al.: Function-based object model towards website adaptation. In: Proceedings of the 10th International Wold Wide Web Conference (2001)","DOI":"10.1145\/371920.372161"},{"key":"30_CR2","doi-asserted-by":"crossref","unstructured":"Gupta, S., et al.: Dom-based content extraction of html documents. In: WWW2003 proceedings of the 12 Web Conference, pp. 207\u2013214 (2003)","DOI":"10.1145\/775152.775182"},{"key":"30_CR3","doi-asserted-by":"crossref","unstructured":"Kovacevic, M., et al.: Recognition of common areas in a web page using visual information: a possible application in a page classification. In: Proceedings of 2002 IEEE International Conference on Data (2002)","DOI":"10.1109\/ICDM.2002.1183910"},{"key":"30_CR4","volume-title":"International Conference on Document Analysis and Recognition","author":"S. Mukherjee","year":"2003","unstructured":"Mukherjee, S., et al.: Automatic discovery of semantic structures in html documents. In: International Conference on Document Analysis and Recognition, IEEE Computer Society Press, Los Alamitos (2003)"},{"key":"30_CR5","unstructured":"Cai, D., et al.: VIPS: a Vision-based Page Segmentation Algorithm. Microsoft Research (2003)"},{"key":"30_CR6","doi-asserted-by":"crossref","unstructured":"Gu, X.D., et al.: Visual based content understanding towards web adaptation. In: Proc. Adaptive Hypermedia and Adaptive Web-Based Systems, pp. 164\u2013173 (2002)","DOI":"10.1007\/3-540-47952-X_18"},{"key":"30_CR7","unstructured":"Hassan, T., Baumgartner, R.: Intelligent wrapping from pdf documents with lixto. In: RAWS 2005, FEI VB, pp. 17\u201324 (2005)"},{"key":"30_CR8","volume-title":"18th International Conference on Data Engineering","author":"C.Y. Chung","year":"2002","unstructured":"Chung, C.Y., Gertz, M., Sundaresan, N.: Reverse engineering for web data: From visual to semantic structures. In: 18th International Conference on Data Engineering, IEEE Computer Society Press, Los Alamitos (2002)"},{"key":"30_CR9","doi-asserted-by":"publisher","first-page":"859","DOI":"10.1109\/ICDAR.2001.953909","volume-title":"ICDAR \u201901: Proceedings of the Sixth International Conference on Document Analysis and Recognition, Seattle","author":"Y. Yang","year":"2001","unstructured":"Yang, Y., Zhang, H.: HTML page analysis based on visual cues. In: ICDAR \u201901: Proceedings of the Sixth International Conference on Document Analysis and Recognition, Seattle, Seattle, USA, p. 859. IEEE Computer Society, Los Alamitos (2001)"},{"key":"30_CR10","volume-title":"Proceedings of the 21st National Conference on Artificial Intelligence (AAAI\u00a02006)","author":"W. Gatterbauer","year":"2006","unstructured":"Gatterbauer, W., Bohunsky, P.: Table extraction using spatial reasoning on the CSS2 visual box model. In: Proceedings of the 21st National Conference on Artificial Intelligence (AAAI\u00a02006), July 2006, MIT Press, Cambridge (2006)"},{"key":"30_CR11","doi-asserted-by":"publisher","first-page":"933","DOI":"10.1145\/1135777.1135951","volume-title":"WWW \u201906: Proceedings of the 15th international conference on World Wide Web","author":"B. Kruepl","year":"2006","unstructured":"Kruepl, B., Herzog, M.: Visually guided bottom-up table detection and segmentation in web documents. In: WWW \u201906: Proceedings of the 15th international conference on World Wide Web, pp. 933\u2013934. ACM Press, New York (2006)"},{"key":"30_CR12","doi-asserted-by":"publisher","first-page":"186","DOI":"10.1109\/DEXA.2004.1333471","volume-title":"15th International Workshop on Database and Expert Systems Applications","author":"R. Burget","year":"2004","unstructured":"Burget, R.: Hierarchies in html documents: Linking text to concepts. In: 15th International Workshop on Database and Expert Systems Applications, pp. 186\u2013190. IEEE Computer Society, Los Alamitos (2004)"},{"key":"30_CR13","doi-asserted-by":"publisher","first-page":"203","DOI":"10.1145\/988672.988700","volume-title":"WWW \u201904: Proceedings of the 13th international conference on World Wide Web","author":"R. Song","year":"2004","unstructured":"Song, R., et al.: Learning block importance models for web pages. In: WWW \u201904: Proceedings of the 13th international conference on World Wide Web, pp. 203\u2013211. ACM Press, New York (2004)"}],"container-title":["Lecture Notes in Computer Science","Business Information Systems"],"original-title":[],"language":"en","link":[{"URL":"http:\/\/link.springer.com\/content\/pdf\/10.1007\/978-3-540-72035-5_30.pdf","content-type":"unspecified","content-version":"vor","intended-application":"similarity-checking"}],"deposited":{"date-parts":[[2020,11,19]],"date-time":"2020-11-19T05:28:25Z","timestamp":1605763705000},"score":1,"resource":{"primary":{"URL":"http:\/\/link.springer.com\/10.1007\/978-3-540-72035-5_30"}},"subtitle":[],"short-title":[],"issued":{"date-parts":[[null]]},"ISBN":["9783540720348","9783540720355"],"references-count":13,"URL":"https:\/\/doi.org\/10.1007\/978-3-540-72035-5_30","relation":{},"subject":[]}}