{"status":"ok","message-type":"work","message-version":"1.0.0","message":{"indexed":{"date-parts":[[2026,4,26]],"date-time":"2026-04-26T02:13:35Z","timestamp":1777169615288,"version":"3.51.4"},"reference-count":33,"publisher":"Elsevier BV","issue":"3","license":[{"start":{"date-parts":[[1999,11,1]],"date-time":"1999-11-01T00:00:00Z","timestamp":941414400000},"content-version":"tdm","delay-in-days":0,"URL":"https:\/\/www.elsevier.com\/tdm\/userlicense\/1.0\/"}],"content-domain":{"domain":[],"crossmark-restriction":false},"short-container-title":["Data &amp; Knowledge Engineering"],"published-print":{"date-parts":[[1999,11]]},"DOI":"10.1016\/s0169-023x(99)00027-0","type":"journal-article","created":{"date-parts":[[2003,3,25]],"date-time":"2003-03-25T22:25:53Z","timestamp":1048631153000},"page":"227-251","source":"Crossref","is-referenced-by-count":198,"title":["Conceptual-model-based data extraction from multiple-record Web pages"],"prefix":"10.1016","volume":"31","author":[{"given":"D.W.","family":"Embley","sequence":"first","affiliation":[]},{"given":"D.M.","family":"Campbell","sequence":"additional","affiliation":[]},{"given":"Y.S.","family":"Jiang","sequence":"additional","affiliation":[]},{"given":"S.W.","family":"Liddle","sequence":"additional","affiliation":[]},{"given":"D.W.","family":"Lonsdale","sequence":"additional","affiliation":[]},{"given":"Y.-K.","family":"Ng","sequence":"additional","affiliation":[]},{"given":"R.D.","family":"Smith","sequence":"additional","affiliation":[]}],"member":"78","reference":[{"key":"10.1016\/S0169-023X(99)00027-0_BIB1","doi-asserted-by":"crossref","first-page":"5","DOI":"10.1007\/s007990050001","article-title":"Querying documents in object databases","volume":"1","author":"Abiteboul","year":"1997","journal-title":"International Journal on Digital Libraries"},{"key":"10.1016\/S0169-023X(99)00027-0_BIB2","doi-asserted-by":"crossref","first-page":"66","DOI":"10.1007\/s007990050005","article-title":"The Lorel query language for semistructured data","volume":"1","author":"Abiteboul","year":"1997","journal-title":"International Journal on Digital Libraries"},{"key":"10.1016\/S0169-023X(99)00027-0_BIB3","doi-asserted-by":"crossref","unstructured":"B. Adelberg, NoDoSE \u2013 a tool for semi-automatically extracting structured and semistructured data from text documents, in: Proceedings of the 1998 ACM SIGMOD International Conference on Management of Data, 1998, pp. 283\u2013294","DOI":"10.1145\/276304.276330"},{"key":"10.1016\/S0169-023X(99)00027-0_BIB4","doi-asserted-by":"crossref","unstructured":"P. Apers, Identifying internet-related database research, in: Proceedings of the Second International East\u2013West Database Workshop, 1994, pp. 183\u2013193","DOI":"10.1007\/978-1-4471-3577-7_13"},{"key":"10.1016\/S0169-023X(99)00027-0_BIB5","doi-asserted-by":"crossref","unstructured":"G. Arocena, A. Mendelzon, WebOQL: restructuring documents, databases and webs, in: Procedings of the 14th International Conference on Data Engineering, 1998","DOI":"10.1109\/ICDE.1998.655754"},{"key":"10.1016\/S0169-023X(99)00027-0_BIB6","doi-asserted-by":"crossref","first-page":"8","DOI":"10.1145\/271074.271078","article-title":"Wrapper generation for semi-structured internet sources","volume":"26","author":"Ashish","year":"1997","journal-title":"SIGMOD Record"},{"key":"10.1016\/S0169-023X(99)00027-0_BIB7","unstructured":"P. Atzeni, G. Mecca, P. Merialdo, To weave the Web, in: Proceedings of the 23rd International Conference on Very Large Data Bases, 1997, pp. 206\u2013215"},{"key":"10.1016\/S0169-023X(99)00027-0_BIB8","doi-asserted-by":"crossref","unstructured":"P. Atzeni, G. Mecca, Cut and paste, in: Proceedings of the PODS'97, 1997, pp. 144\u2013153","DOI":"10.1145\/263661.263678"},{"key":"10.1016\/S0169-023X(99)00027-0_BIB9","doi-asserted-by":"crossref","unstructured":"P. Buneman, S. Davidson, G. Hillebrand, D. Suciu, A query language and optimization techniques for unstructured data, in: Proceedings of the 1996 ACM SIGMOD International Conference on Management of Data, 1996, pp. 505\u2013516","DOI":"10.1145\/233269.233368"},{"key":"10.1016\/S0169-023X(99)00027-0_BIB10","unstructured":"S. Chawathe, H. Garcia-Molina, J. Hammer, K. Ireland, Y. Papakonstantinou, J. Ullman, J. Widom, The TSIMMIS project: integration of heterogeneous information sources, IPSJ Conference, 1994, pp. 7\u201318"},{"key":"10.1016\/S0169-023X(99)00027-0_BIB11","doi-asserted-by":"crossref","first-page":"80","DOI":"10.1145\/234173.234209","article-title":"Information extraction","volume":"39","author":"Cowie","year":"1996","journal-title":"Communications of the ACM"},{"key":"10.1016\/S0169-023X(99)00027-0_BIB12","doi-asserted-by":"crossref","first-page":"20","DOI":"10.1007\/s007990050002","article-title":"Structured maps: modeling explicit semantics over a universe of information","volume":"1","author":"Delcambre","year":"1997","journal-title":"International Journal on Digital Libraries"},{"key":"10.1016\/S0169-023X(99)00027-0_BIB13","doi-asserted-by":"crossref","unstructured":"R. Doorenbos, O. Etzioni, D. Weld, A scalable comparison-shopping agent for the World-Wide Web, in: Proceedings of the First International Conference on Autonomous Agents, 1997, pp. 39\u201348","DOI":"10.1145\/267658.267666"},{"key":"10.1016\/S0169-023X(99)00027-0_BIB14","doi-asserted-by":"crossref","unstructured":"D. Embley, Programming with data frames for everyday data items, in: Proceedings of the 1980 National Computer Conference, 1980, pp. 301\u2013305","DOI":"10.1145\/1500518.1500564"},{"key":"10.1016\/S0169-023X(99)00027-0_BIB15","series-title":"Object-oriented Systems Analysis: A Model-Driven Approach","author":"Embley","year":"1992"},{"key":"10.1016\/S0169-023X(99)00027-0_BIB16","doi-asserted-by":"crossref","unstructured":"D. Embley, D. Campbell, R. Smith, S. Liddle, Ontology-based extraction and structuring of information from data-rich unstructured documents, in: Proceedings of the Conference on Information and Knowledge Management (CIKM'98), 1998, pp. 52\u201359","DOI":"10.1145\/288627.288641"},{"key":"10.1016\/S0169-023X(99)00027-0_BIB17","doi-asserted-by":"crossref","unstructured":"D. Embley, D. Campbell, R. Smith, S. Liddle, A Conceptual-modeling approach to extracting data from the Web, in: Proceedings of the 17th International Conference on Conceptual Modeling (ER'98), 1998, pp. 78\u201391","DOI":"10.1007\/978-3-540-49524-6_7"},{"key":"10.1016\/S0169-023X(99)00027-0_BIB18","doi-asserted-by":"crossref","unstructured":"D. Embley, S. Jiang, Y.-K. Ng, Record-boundary discovery in Web documents, in: Proceedings of the 1999 ACM SIGMOD International Conference on Management of Data, 1999, pp. 467\u2013478","DOI":"10.1145\/304182.304223"},{"key":"10.1016\/S0169-023X(99)00027-0_BIB19","doi-asserted-by":"crossref","unstructured":"D. Evans, C. Zhai, Noun-phrase analysis in unrestricted text for information retrieval, in: Proceedings of the 34th Annual Meeting of the Association for Computational Linguistics, 1996, pp. 17\u201324","DOI":"10.3115\/981863.981866"},{"key":"10.1016\/S0169-023X(99)00027-0_BIB20","doi-asserted-by":"crossref","unstructured":"S. Flank, A layered approach to NLP-based information retrieval, in: Proceedings of the COLING'98, 1998, pp. 397\u2013403","DOI":"10.3115\/980451.980913"},{"key":"10.1016\/S0169-023X(99)00027-0_BIB21","series-title":"Information Retrieval: Data Structures & Algorithms","author":"Frakes","year":"1992"},{"key":"10.1016\/S0169-023X(99)00027-0_BIB22","doi-asserted-by":"crossref","first-page":"57","DOI":"10.1145\/271074.271093","article-title":"Virtual database technology","volume":"26","author":"Gupta","year":"1997","journal-title":"SIGMOD Record"},{"key":"10.1016\/S0169-023X(99)00027-0_BIB23","unstructured":"J. Hammer, H. Garcia-Molina, J. Cho, R. Aranha, A. Crespo, Extracting semistructured information from the Web, in: Proceedings of the Workshop on Management of Semistructured Data, 1997"},{"key":"10.1016\/S0169-023X(99)00027-0_BIB24","doi-asserted-by":"crossref","first-page":"305","DOI":"10.1017\/S1351324997001563","article-title":"Regular expressions for language engineering","volume":"2\/4","author":"Karttunen","year":"1996","journal-title":"Natural Language Engineering special issue: ECAI'96 workshop on extended finite state models of language"},{"key":"10.1016\/S0169-023X(99)00027-0_BIB25","unstructured":"D. Konopnicki, O. Shmueli, W3QS: a query system for the world-wide Web, in: Proceedings of the 21st International Conference on Very Large Data Bases, 1995, pp. 54\u201365"},{"key":"10.1016\/S0169-023X(99)00027-0_BIB26","unstructured":"N. Kushmerick, D. Weld, R. Doorenbos, Wrapper induction for information extraction, in: Proceedings of the 1997 International Joint Conference on Artificial Intelligence, 1997, pp. 729\u2013735"},{"key":"10.1016\/S0169-023X(99)00027-0_BIB27","doi-asserted-by":"crossref","unstructured":"L. Lakshmanan, F. Sadri, I. Subramanian, A declarative language for querying and restructuring the Web, in: Proceedings of the Sixth international workshop on research issues in data engineering (RIDE'96), 1996","DOI":"10.1109\/RIDE.1996.492238"},{"key":"10.1016\/S0169-023X(99)00027-0_BIB28","doi-asserted-by":"crossref","unstructured":"S. Liddle, D. Embley, S. Woodfield, Unifying modeling and programming through an active, object-oriented, model-equivalent programming language, in: Proceedings of the 14th International Conference on Object-Oriented and Entity-Relationship Modeling, 1995, pp. 55\u201364","DOI":"10.1007\/BFb0020520"},{"key":"10.1016\/S0169-023X(99)00027-0_BIB29","unstructured":"G.F. Luger, W.A. Stubblefield, Artificial Intelligence: Structures and Strategies for Complex Problem Solving, 3rd ed., Addison-Wesley, Longman, Reading, MA, 1998"},{"key":"10.1016\/S0169-023X(99)00027-0_BIB30","doi-asserted-by":"crossref","unstructured":"A. Mendelzon, G. Mihaila, T. Milo, Querying the World Wide Web, in: Proceedings of the First International Conference on Parallel and Distributed Information Systems (PDIS'96), 1996","DOI":"10.1109\/PDIS.1996.568671"},{"key":"10.1016\/S0169-023X(99)00027-0_BIB31","doi-asserted-by":"crossref","first-page":"54","DOI":"10.1007\/s007990050004","article-title":"querying the world wide web","volume":"1","author":"Mendelzon","year":"1997","journal-title":"International Journal on Digital Libraries"},{"key":"10.1016\/S0169-023X(99)00027-0_BIB32","unstructured":"D. Smith, M. Lopez, Information extraction for semi-structured documents, in: Proceedings of the Workshop on Management of Semistructured Data, 1997"},{"key":"10.1016\/S0169-023X(99)00027-0_BIB33","unstructured":"S. Soderland, Learning to extract text-based information from the World Wide Web, in: Proceedings of the Third International Conference on Knowledge Discovery and Data Mining, 1997, pp. 251\u2013254"}],"container-title":["Data &amp; Knowledge Engineering"],"original-title":[],"language":"en","link":[{"URL":"https:\/\/api.elsevier.com\/content\/article\/PII:S0169023X99000270?httpAccept=text\/xml","content-type":"text\/xml","content-version":"vor","intended-application":"text-mining"},{"URL":"https:\/\/api.elsevier.com\/content\/article\/PII:S0169023X99000270?httpAccept=text\/plain","content-type":"text\/plain","content-version":"vor","intended-application":"text-mining"}],"deposited":{"date-parts":[[2020,1,15]],"date-time":"2020-01-15T01:29:49Z","timestamp":1579051789000},"score":1,"resource":{"primary":{"URL":"https:\/\/linkinghub.elsevier.com\/retrieve\/pii\/S0169023X99000270"}},"subtitle":[],"short-title":[],"issued":{"date-parts":[[1999,11]]},"references-count":33,"journal-issue":{"issue":"3","published-print":{"date-parts":[[1999,11]]}},"alternative-id":["S0169023X99000270"],"URL":"https:\/\/doi.org\/10.1016\/s0169-023x(99)00027-0","relation":{},"ISSN":["0169-023X"],"issn-type":[{"value":"0169-023X","type":"print"}],"subject":[],"published":{"date-parts":[[1999,11]]}}}