{"status":"ok","message-type":"work","message-version":"1.0.0","message":{"indexed":{"date-parts":[[2025,3,27]],"date-time":"2025-03-27T17:23:04Z","timestamp":1743096184801,"version":"3.40.3"},"publisher-location":"Cham","reference-count":10,"publisher":"Springer International Publishing","isbn-type":[{"type":"print","value":"9783319255170"},{"type":"electronic","value":"9783319255187"}],"license":[{"start":{"date-parts":[[2015,1,1]],"date-time":"2015-01-01T00:00:00Z","timestamp":1420070400000},"content-version":"unspecified","delay-in-days":0,"URL":"http:\/\/www.springer.com\/tdm"}],"content-domain":{"domain":["link.springer.com"],"crossmark-restriction":false},"short-container-title":[],"published-print":{"date-parts":[[2015]]},"DOI":"10.1007\/978-3-319-25518-7_7","type":"book-chapter","created":{"date-parts":[[2015,9,30]],"date-time":"2015-09-30T00:20:51Z","timestamp":1443572451000},"page":"81-92","update-policy":"https:\/\/doi.org\/10.1007\/springer_crossmark_policy","source":"Crossref","is-referenced-by-count":9,"title":["Information Extraction from Web Sources Based on Multi-aspect Content Analysis"],"prefix":"10.1007","author":[{"given":"Martin","family":"Milicka","sequence":"first","affiliation":[]},{"given":"Radek","family":"Burget","sequence":"additional","affiliation":[]}],"member":"297","published-online":{"date-parts":[[2016,1,7]]},"reference":[{"key":"7_CR1","unstructured":"Bos, B., Lie, H.W., Lilley, C., Jacobs, I.: Cascading style sheets, level 2, CSS2 specification. The World Wide Web Consortium (1998)"},{"key":"7_CR2","doi-asserted-by":"crossref","unstructured":"Burget, R.: Layout based information extraction from HTML documents. In: ICDAR 2007, pp. 624\u2013629. IEEE Computer Society (2007)","DOI":"10.1109\/ICDAR.2007.4376990"},{"key":"7_CR3","doi-asserted-by":"crossref","unstructured":"Burget, R., Rudolfov\u00e1, I.: Web page element classification based on visual features. In: 1st Asian Conference on Intelligent Information and Database Systems ACIIDS 2009, pp. 67\u201372. IEEE Computer Society (2009)","DOI":"10.1109\/ACIIDS.2009.71"},{"key":"7_CR4","unstructured":"Cai, D., Yu, S., Wen, J.R., Ma, W.Y.: VIPS: a Vision-based page segmentation algorithm. Microsoft Research (2003)"},{"key":"7_CR5","doi-asserted-by":"crossref","unstructured":"Finkel, J.R., Grenager, T., Manning, C.: Incorporating non-local information into information extraction systems by gibbs sampling. In: Proceedings of the 43rd Annual Meeting on Association for Computational Linguistics, ACL 2005, pp. 363\u2013370 (2005)","DOI":"10.3115\/1219840.1219885"},{"issue":"2","key":"7_CR6","doi-asserted-by":"publisher","first-page":"169","DOI":"10.1016\/j.datak.2009.10.002","volume":"69","author":"JL Hong","year":"2010","unstructured":"Hong, J.L., Siew, E.G., Egerton, S.: Information extraction for search engines using fast heuristic techniques. Data Knowl. Eng. 69(2), 169\u2013196 (2010). \n                    http:\/\/dx.doi.org\/10.1016\/j.datak.2009.10.002","journal-title":"Data Knowl. Eng."},{"key":"7_CR7","series-title":"Lecture Notes in Computer Science (Lecture Notes in Artificial Intelligence)","doi-asserted-by":"publisher","first-page":"216","DOI":"10.1007\/3-540-44794-6_18","volume-title":"Principles of Data Mining and Knowledge Discovery","author":"TW Hong","year":"2001","unstructured":"Hong, T.W., Clark, K.L.: Using grammatical inference to automate information extraction from the web. In: Siebes, A., De Raedt, L. (eds.) PKDD 2001. LNCS (LNAI), vol. 2168, pp. 216\u2013227. Springer, Heidelberg (2001)"},{"key":"7_CR8","series-title":"Communications in Computer and Information Science","doi-asserted-by":"crossref","first-page":"89","DOI":"10.1007\/978-3-319-12024-9_11","volume-title":"Semantic Web Evaluation Challenge","author":"M Kolchin","year":"2014","unstructured":"Kolchin, M., Kozlov, F.: A template-based information extraction from web sites with unstable markup. In: Presutti, V., et al. (eds.) SemWebEval 2014. CCIS, vol. 475, pp. 89\u201394. Springer, Heidelberg (2014). \n                    http:\/\/dx.doi.org\/10.1007\/978-3-319-12024-9_11"},{"key":"7_CR9","unstructured":"Milicka, M., Burget, R.: Multi-aspect document content analysis using ontological modelling. In: Proceedings of 9th Workshop on Intelligent and Knowledge Oriented Technologies (WIKT 2014), pp. 9\u201312. Vydavate\u013astvo STU (2014)"},{"key":"7_CR10","series-title":"Lecture Notes in Computer Science","doi-asserted-by":"publisher","first-page":"404","DOI":"10.1007\/978-3-642-37401-2_41","volume-title":"Web Technologies and Applications","author":"Y You","year":"2013","unstructured":"You, Y., Xu, G., Cao, J., Zhang, Y., Huang, G.: Leveraging visual features and hierarchical dependencies for conference information extraction. In: Ishikawa, Y., Li, J., Wang, W., Zhang, R., Zhang, W. (eds.) APWeb 2013. LNCS, vol. 7808, pp. 404\u2013416. Springer, Heidelberg (2013). \n                    http:\/\/dx.doi.org\/10.1007\/978-3-642-37401-2_41"}],"container-title":["Communications in Computer and Information Science","Semantic Web Evaluation Challenges"],"original-title":[],"language":"en","link":[{"URL":"http:\/\/link.springer.com\/content\/pdf\/10.1007\/978-3-319-25518-7_7","content-type":"unspecified","content-version":"vor","intended-application":"similarity-checking"}],"deposited":{"date-parts":[[2019,5,30]],"date-time":"2019-05-30T22:51:52Z","timestamp":1559256712000},"score":1,"resource":{"primary":{"URL":"http:\/\/link.springer.com\/10.1007\/978-3-319-25518-7_7"}},"subtitle":[],"short-title":[],"issued":{"date-parts":[[2015]]},"ISBN":["9783319255170","9783319255187"],"references-count":10,"URL":"https:\/\/doi.org\/10.1007\/978-3-319-25518-7_7","relation":{},"ISSN":["1865-0929","1865-0937"],"issn-type":[{"type":"print","value":"1865-0929"},{"type":"electronic","value":"1865-0937"}],"subject":[],"published":{"date-parts":[[2015]]},"assertion":[{"value":"7 January 2016","order":1,"name":"first_online","label":"First Online","group":{"name":"ChapterHistory","label":"Chapter History"}}]}}