{"status":"ok","message-type":"work","message-version":"1.0.0","message":{"indexed":{"date-parts":[[2024,9,4]],"date-time":"2024-09-04T23:56:24Z","timestamp":1725494184662},"publisher-location":"Berlin, Heidelberg","reference-count":14,"publisher":"Springer Berlin Heidelberg","isbn-type":[{"type":"print","value":"9783540769927"}],"content-domain":{"domain":[],"crossmark-restriction":false},"short-container-title":[],"DOI":"10.1007\/978-3-540-76993-4_18","type":"book-chapter","created":{"date-parts":[[2007,11,6]],"date-time":"2007-11-06T11:30:45Z","timestamp":1194348645000},"page":"212-224","source":"Crossref","is-referenced-by-count":5,"title":["Using Clustering and Edit Distance Techniques for Automatic Web Data Extraction"],"prefix":"10.1007","author":[{"given":"Manuel","family":"\u00c1lvarez","sequence":"first","affiliation":[]},{"given":"Alberto","family":"Pan","sequence":"additional","affiliation":[]},{"given":"Juan","family":"Raposo","sequence":"additional","affiliation":[]},{"given":"Fernando","family":"Bellas","sequence":"additional","affiliation":[]},{"given":"Fidel","family":"Cacheda","sequence":"additional","affiliation":[]}],"member":"297","reference":[{"key":"18_CR1","doi-asserted-by":"crossref","unstructured":"Arasu, A., Garcia-Molina, H.: Extracting Structured Data from Web Pages. In: Proc. of the ACM SIGMOD Int. Conf. on Management of Data (2003)","DOI":"10.1145\/872757.872799"},{"key":"18_CR2","unstructured":"Baumgartner, R., Flesca, S., Gottlob, G.: Visual Web Information Extraction with Lixto. In: VLDB. Proc. of Very Large DataBases (2001)"},{"key":"18_CR3","volume-title":"Mining the Web: Discovering Knowledge from Hypertext Data","author":"S. Chakrabarti","year":"2003","unstructured":"Chakrabarti, S.: Mining the Web: Discovering Knowledge from Hypertext Data. Morgan Kaufmann Publishers, San Francisco (2003)"},{"key":"18_CR4","doi-asserted-by":"crossref","unstructured":"Chang, C., Lui, S.: IEPAD: Information extraction based on pattern discovery. In: Proc. of 2001 Int. World Wide Web Conf., pp. 681\u2013688 (2001)","DOI":"10.1145\/371920.372182"},{"key":"18_CR5","doi-asserted-by":"crossref","unstructured":"Crescenzi, V., Mecca, G., Merialdo, P.: ROADRUNNER: Towards automatic data extraction from large web sites. In: Proc. of the 2001 Int. VLDB Conf., pp. 109\u2013118 (2001)","DOI":"10.1145\/564691.564778"},{"key":"18_CR6","volume-title":"Information Retrieval: Data Structures and Algorithms","author":"G.H. Gonnet","year":"1992","unstructured":"Gonnet, G.H., Baeza-Yates, R.A., Snider, T.: New Indices for Text: Pat trees and Pat Arrays. In: Information Retrieval: Data Structures and Algorithms, Prentice Hall, Englewood Cliffs (1992)"},{"issue":"2","key":"18_CR7","doi-asserted-by":"publisher","first-page":"84","DOI":"10.1145\/565117.565137","volume":"31","author":"A.H.F. Laender","year":"2002","unstructured":"Laender, A.H.F., Ribeiro-Neto, B.A., da Silva, A.S., Teixeira, J.S.: A Brief Survey of Web Data Extraction Tools. ACM SIGMOD Record\u00a031(2), 84\u201393 (2002)","journal-title":"ACM SIGMOD Record"},{"key":"18_CR8","first-page":"707","volume":"10","author":"V.I. Levenshtein","year":"1966","unstructured":"Levenshtein, V.I.: Binary codes capable of correcting deletions, insertions, and reversals. Soviet Physics Doklady\u00a010, 707\u2013710 (1966)","journal-title":"Soviet Physics Doklady"},{"key":"18_CR9","doi-asserted-by":"crossref","unstructured":"Muslea, I., Minton, S., Knoblock, C.: Hierarchical Wrapper Induction for Semistructured Information Sources. In: Autonomous Agents and Multi-Agent Systems, pp. 93\u2013114 (2001)","DOI":"10.1023\/A:1010022931168"},{"key":"18_CR10","doi-asserted-by":"crossref","unstructured":"Notredame, C.: Recent Progresses in Multiple Sequence Alignment: A Survey. Technical report, Information Genetique et. (2002)","DOI":"10.1517\/14622416.3.1.131"},{"key":"18_CR11","doi-asserted-by":"crossref","unstructured":"Pan, A., et al.: Semi-Automatic Wrapper Generation for Commercial Web Sources. In: EISIC. Proc. of IFIP WG8.1 Conf. on Engineering Inf. Systems in the Internet Context (2002)","DOI":"10.1007\/978-0-387-35614-3_16"},{"issue":"2","key":"18_CR12","doi-asserted-by":"publisher","first-page":"331","DOI":"10.1016\/j.datak.2006.06.006","volume":"61","author":"J. Raposo","year":"2007","unstructured":"Raposo, J., Pan, A., \u00c1lvarez, M., Hidalgo, J.: Automatically Maintaining Wrappers for Web Sources. Data & Knowledge Engineering\u00a061(2), 331\u2013358 (2007)","journal-title":"Data & Knowledge Engineering"},{"key":"18_CR13","series-title":"Lecture Notes in Computer Science","doi-asserted-by":"publisher","first-page":"318","DOI":"10.1007\/11581062_24","volume-title":"Web Information Systems Engineering \u2013 WISE 2005","author":"Y. Zhai","year":"2005","unstructured":"Zhai, Y., Liu, B.: Extracting Web Data Using Instance-Based Learning. In: Ngu, A.H.H., Kitsuregawa, M., Neuhold, E.J., Chung, J.-Y., Sheng, Q.Z. (eds.) WISE 2005. LNCS, vol.\u00a03806, pp. 318\u2013331. Springer, Heidelberg (2005)"},{"issue":"12","key":"18_CR14","doi-asserted-by":"publisher","first-page":"1614","DOI":"10.1109\/TKDE.2006.197","volume":"18","author":"Y. Zhai","year":"2006","unstructured":"Zhai, Y., Liu, B.: Structured Data Extraction from the Web Based on Partial Tree Alignment. IEEE Trans. Knowl. Data Eng.\u00a018(12), 1614\u20131628 (2006)","journal-title":"IEEE Trans. Knowl. Data Eng."}],"container-title":["Lecture Notes in Computer Science","Web Information Systems Engineering \u2013 WISE 2007"],"original-title":[],"language":"en","link":[{"URL":"http:\/\/link.springer.com\/content\/pdf\/10.1007\/978-3-540-76993-4_18.pdf","content-type":"unspecified","content-version":"vor","intended-application":"similarity-checking"}],"deposited":{"date-parts":[[2023,5,14]],"date-time":"2023-05-14T16:39:21Z","timestamp":1684082361000},"score":1,"resource":{"primary":{"URL":"http:\/\/link.springer.com\/10.1007\/978-3-540-76993-4_18"}},"subtitle":[],"short-title":[],"issued":{"date-parts":[[null]]},"ISBN":["9783540769927"],"references-count":14,"URL":"https:\/\/doi.org\/10.1007\/978-3-540-76993-4_18","relation":{},"subject":[]}}