{"status":"ok","message-type":"work","message-version":"1.0.0","message":{"indexed":{"date-parts":[[2024,9,5]],"date-time":"2024-09-05T00:35:57Z","timestamp":1725496557235},"publisher-location":"Berlin, Heidelberg","reference-count":14,"publisher":"Springer Berlin Heidelberg","isbn-type":[{"type":"print","value":"9783540770916"}],"content-domain":{"domain":[],"crossmark-restriction":false},"short-container-title":[],"DOI":"10.1007\/978-3-540-77092-3_41","type":"book-chapter","created":{"date-parts":[[2007,11,24]],"date-time":"2007-11-24T02:59:32Z","timestamp":1195873172000},"page":"466-478","source":"Crossref","is-referenced-by-count":3,"title":["Finding and Extracting Data Records from Web Pages"],"prefix":"10.1007","author":[{"given":"Manuel","family":"\u00c1lvarez","sequence":"first","affiliation":[]},{"given":"Alberto","family":"Pan","sequence":"additional","affiliation":[]},{"given":"Juan","family":"Raposo","sequence":"additional","affiliation":[]},{"given":"Fernando","family":"Bellas","sequence":"additional","affiliation":[]},{"given":"Fidel","family":"Cacheda","sequence":"additional","affiliation":[]}],"member":"297","reference":[{"key":"41_CR1","doi-asserted-by":"crossref","unstructured":"Arasu, A., Garcia-Molina, H.: Extracting Structured Data from Web Pages. In: Proc. of the ACM SIGMOD Int. Conf. on Management of Data (2003)","DOI":"10.1145\/872757.872799"},{"key":"41_CR2","unstructured":"Baumgartner, R., Flesca, S., Gottlob, G.: Visual Web Information Extraction with Lixto. In: Proc. of Very Large DataBases (VLDB) (2001)"},{"key":"41_CR3","volume-title":"Mining the Web: Discovering Knowledge from Hypertext Data","author":"S. Chakrabarti","year":"2003","unstructured":"Chakrabarti, S.: Mining the Web: Discovering Knowledge from Hypertext Data. Morgan Kaufmann Publishers, San Francisco (2003)"},{"key":"41_CR4","doi-asserted-by":"crossref","unstructured":"Chang, C., Lui, S.: IEPAD: Information extraction based on pattern discovery. In: Proc. of 2001 Int. World Wide Web Conf., pp. 681\u2013688 (2001)","DOI":"10.1145\/371920.372182"},{"key":"41_CR5","doi-asserted-by":"crossref","unstructured":"Crescenzi, V., Mecca, G., Merialdo, P.: ROADRUNNER: Towards automatic data extraction from large web sites. In: Proc. of the 2001 Int. VLDB Conf., pp. 109\u2013118 (2001)","DOI":"10.1145\/564691.564778"},{"key":"41_CR6","volume-title":"New Indices for Text: Pat trees and Pat Arrays. Information Retrieval: Data Structures and Algorithms","author":"G.H. Gonnet","year":"1992","unstructured":"Gonnet, G.H., Baeza-Yates, R.A., Snider, T.: New Indices for Text: Pat trees and Pat Arrays. Information Retrieval: Data Structures and Algorithms. Prentice Hall, Englewood Cliffs (1992)"},{"issue":"2","key":"41_CR7","doi-asserted-by":"publisher","first-page":"84","DOI":"10.1145\/565117.565137","volume":"31","author":"A.H.F. Laender","year":"2002","unstructured":"Laender, A.H.F., Ribeiro-Neto, B.A., Soares da Silva, A., Teixeira, J.S.: A Brief Survey of Web Data Extraction Tools. ACM SIGMOD Record\u00a031(2), 84\u201393 (2002)","journal-title":"ACM SIGMOD Record"},{"key":"41_CR8","first-page":"707","volume":"10","author":"V.I. Levenshtein","year":"1966","unstructured":"Levenshtein, V.I.: Binary codes capable of correcting deletions, insertions, and reversals. Soviet Physics Doklady\u00a010, 707\u2013710 (1966)","journal-title":"Soviet Physics Doklady"},{"key":"41_CR9","doi-asserted-by":"crossref","unstructured":"Muslea, I., Minton, S., Knoblock, C.: Hierarchical Wrapper Induction for Semistructured Information Sources. Autonomous Agents and Multi-Agent Systems, 93\u2013114 (2001)","DOI":"10.1023\/A:1010022931168"},{"key":"41_CR10","doi-asserted-by":"crossref","unstructured":"Notredame, C.: Recent Progresses in Multiple Sequence Alignment: A Survey. Technical report, Information Genetique et (2002)","DOI":"10.1517\/14622416.3.1.131"},{"key":"41_CR11","doi-asserted-by":"crossref","unstructured":"Pan, A., et al.: Semi-Automatic Wrapper Generation for Commercial Web Sources. In: Proc. of IFIP WG8.1 Conf. on Engineering Inf. Systems in the Internet Context (EISIC) (2002)","DOI":"10.1007\/978-0-387-35614-3_16"},{"issue":"2","key":"41_CR12","doi-asserted-by":"publisher","first-page":"331","DOI":"10.1016\/j.datak.2006.06.006","volume":"61","author":"J. Raposo","year":"2007","unstructured":"Raposo, J., Pan, A., \u00c1lvarez, M., Hidalgo, J.: Automatically Maintaining Wrappers for Web Sources. Data & Knowledge Engineering\u00a061(2), 331\u2013358 (2007)","journal-title":"Data & Knowledge Engineering"},{"key":"41_CR13","series-title":"Lecture Notes in Computer Science","doi-asserted-by":"publisher","first-page":"318","DOI":"10.1007\/11581062_24","volume-title":"Web Information Systems Engineering \u2013 WISE 2005","author":"Y. Zhai","year":"2005","unstructured":"Zhai, Y., Liu, B.: Extracting Web Data Using Instance-Based Learning. In: Ngu, A.H.H., Kitsuregawa, M., Neuhold, E.J., Chung, J.-Y., Sheng, Q.Z. (eds.) WISE 2005. LNCS, vol.\u00a03806, pp. 318\u2013331. Springer, Heidelberg (2005)"},{"issue":"12","key":"41_CR14","doi-asserted-by":"publisher","first-page":"1614","DOI":"10.1109\/TKDE.2006.197","volume":"18","author":"Y. Zhai","year":"2006","unstructured":"Zhai, Y., Liu, B.: Structured Data Extraction from the Web Based on Partial Tree Alignment. IEEE Trans. Knowl. Data Eng.\u00a018(12), 1614\u20131628 (2006)","journal-title":"IEEE Trans. Knowl. Data Eng."}],"container-title":["Lecture Notes in Computer Science","Embedded and Ubiquitous Computing"],"original-title":[],"language":"en","link":[{"URL":"http:\/\/link.springer.com\/content\/pdf\/10.1007\/978-3-540-77092-3_41.pdf","content-type":"unspecified","content-version":"vor","intended-application":"similarity-checking"}],"deposited":{"date-parts":[[2023,5,14]],"date-time":"2023-05-14T18:31:01Z","timestamp":1684089061000},"score":1,"resource":{"primary":{"URL":"http:\/\/link.springer.com\/10.1007\/978-3-540-77092-3_41"}},"subtitle":[],"short-title":[],"issued":{"date-parts":[[null]]},"ISBN":["9783540770916"],"references-count":14,"URL":"https:\/\/doi.org\/10.1007\/978-3-540-77092-3_41","relation":{},"subject":[]}}