{"status":"ok","message-type":"work","message-version":"1.0.0","message":{"indexed":{"date-parts":[[2024,10,23]],"date-time":"2024-10-23T09:39:40Z","timestamp":1729676380390,"version":"3.28.0"},"reference-count":21,"publisher":"IEEE","content-domain":{"domain":[],"crossmark-restriction":false},"short-container-title":[],"published-print":{"date-parts":[[2004]]},"DOI":"10.1109\/dexa.2004.1333471","type":"proceedings-article","created":{"date-parts":[[2004,11,8]],"date-time":"2004-11-08T16:27:50Z","timestamp":1099931270000},"page":"186-190","source":"Crossref","is-referenced-by-count":7,"title":["Hierarchies in HTML documents: linking text to concepts"],"prefix":"10.1109","author":[{"given":"R.","family":"Burget","sequence":"first","affiliation":[]}],"member":"263","reference":[{"key":"19","article-title":"Learning to extract text-based information from the World Wide Web","author":"soderland","year":"1997","journal-title":"Proc Third Int l Conf Knowledge Discovery and Data Mining (KDD 97)"},{"key":"17","doi-asserted-by":"publisher","DOI":"10.1109\/ICDAR.2003.1227667"},{"key":"18","doi-asserted-by":"publisher","DOI":"10.1109\/SSDM.2002.1029709"},{"key":"15","article-title":"Wrapper induction for information extraction","author":"kushmerick","year":"1997","journal-title":"International Joint Conference on Artificial Intelligence"},{"key":"16","article-title":"A bottom-up approach for integration of XML sources","author":"dos santos mello","year":"2001","journal-title":"Proc Int l Workshop on Information Integration on the Web"},{"journal-title":"Combining Visual Layout and Lexical Cohesion Features for Text Segmentation","year":"2001","author":"kan","key":"13"},{"key":"14","doi-asserted-by":"crossref","DOI":"10.1007\/3-540-45681-3_25","article-title":"Information extraction in structured documents using tree automata induction","author":"kosala","year":"2002","journal-title":"Principles of Data Mining and Knowledge Discovery Proceedings of the 6th International Conference (PKDD-2002)"},{"key":"11","doi-asserted-by":"crossref","first-page":"164","DOI":"10.1007\/3-540-47952-X_18","article-title":"Visual based content understanding towards Web adaptation","author":"gu","year":"2002","journal-title":"Adaptive Hypermedia and Adaptive Web-Based Systems"},{"key":"12","doi-asserted-by":"crossref","DOI":"10.1007\/3-540-44794-6_18","article-title":"Using grammatical inference to automate information exraction from the Web","author":"hong","year":"2001","journal-title":"Principles of Data Mining and Knowledge Discovery"},{"key":"21","doi-asserted-by":"crossref","DOI":"10.1109\/ICDAR.2001.953909","article-title":"HTML page analysis based on visual cues","author":"yang","year":"2001","journal-title":"Proc Int Conf Document Analysis"},{"key":"3","article-title":"Extracting logical schema from the Web","author":"carchiolo","year":"2000","journal-title":"PRICAI Workshop on Text and Web Mining"},{"key":"20","article-title":"Toward a taxonomy of logical document structures","author":"summers","year":"1995","journal-title":"Electronic Publishing and the Information Superhighway Proceedings of the Dartmouth Institute for Advanced Graduate Studies (DAGS '95)"},{"key":"2","doi-asserted-by":"publisher","DOI":"10.1109\/ICDSC.2001.918966"},{"key":"1","doi-asserted-by":"publisher","DOI":"10.1145\/271074.271078"},{"key":"10","article-title":"Information extraction from HTML: Application of a general learning approach","author":"freitag","year":"1998","journal-title":"Proceedings of the Fifteenth Conference on Artificial Intelligence AAAI-98"},{"key":"7","article-title":"A conceptual-modeling approach to extracting data from the web","author":"embley","year":"1998","journal-title":"Proceedings of the 17th International Conference on Conceptual Modeling (ER'98)"},{"journal-title":"Using HTML Formatting to Aid in Natural Language Processing on the World Wide Web","year":"1998","author":"dipasquo","key":"6"},{"key":"5","article-title":"ROADRUNNER: Towards automatic data extraction from large web sites","volume":"rt dia 64 2001","author":"crescenzi","year":"2001","journal-title":"Technical Report N RT-DIA-64-2001"},{"key":"4","doi-asserted-by":"publisher","DOI":"10.1109\/ICDE.2002.994697"},{"key":"9","article-title":"Using grammatical inference to improve precision in information extraction","author":"freitag","year":"1997","journal-title":"Int Workshop Automata Induction Grammatical Inference Language Acquisition ICML 97"},{"key":"8","doi-asserted-by":"publisher","DOI":"10.1145\/304182.304223"}],"event":{"name":"Proceedings. 15th International Workshop on Database and Expert Systems Applications, 2004.","start":{"date-parts":[[2004,9,3]]},"location":"Zaragoza, Spain","end":{"date-parts":[[2004,9,3]]}},"container-title":["Proceedings. 15th International Workshop on Database and Expert Systems Applications, 2004."],"original-title":[],"link":[{"URL":"http:\/\/xplorestaging.ieee.org\/ielx5\/9266\/29439\/01333471.pdf?arnumber=1333471","content-type":"unspecified","content-version":"vor","intended-application":"similarity-checking"}],"deposited":{"date-parts":[[2017,6,16]],"date-time":"2017-06-16T11:38:02Z","timestamp":1497613082000},"score":1,"resource":{"primary":{"URL":"http:\/\/ieeexplore.ieee.org\/document\/1333471\/"}},"subtitle":[],"short-title":[],"issued":{"date-parts":[[2004]]},"references-count":21,"URL":"https:\/\/doi.org\/10.1109\/dexa.2004.1333471","relation":{},"subject":[],"published":{"date-parts":[[2004]]}}}