{"status":"ok","message-type":"work","message-version":"1.0.0","message":{"indexed":{"date-parts":[[2025,6,10]],"date-time":"2025-06-10T17:10:01Z","timestamp":1749575401568,"version":"3.41.0"},"publisher-location":"Berlin, Heidelberg","reference-count":25,"publisher":"Springer Berlin Heidelberg","isbn-type":[{"type":"print","value":"9783540440376"},{"type":"electronic","value":"9783540456810"}],"license":[{"start":{"date-parts":[[2002,1,1]],"date-time":"2002-01-01T00:00:00Z","timestamp":1009843200000},"content-version":"tdm","delay-in-days":0,"URL":"https:\/\/www.springernature.com\/gp\/researchers\/text-and-data-mining"},{"start":{"date-parts":[[2002,1,1]],"date-time":"2002-01-01T00:00:00Z","timestamp":1009843200000},"content-version":"vor","delay-in-days":0,"URL":"https:\/\/www.springernature.com\/gp\/researchers\/text-and-data-mining"}],"content-domain":{"domain":["link.springer.com"],"crossmark-restriction":false},"short-container-title":[],"published-print":{"date-parts":[[2002]]},"DOI":"10.1007\/3-540-45681-3_25","type":"book-chapter","created":{"date-parts":[[2007,10,19]],"date-time":"2007-10-19T11:03:25Z","timestamp":1192791805000},"page":"299-311","update-policy":"https:\/\/doi.org\/10.1007\/springer_crossmark_policy","source":"Crossref","is-referenced-by-count":17,"title":["Information Extraction in Structured Documents Using Tree Automata Induction"],"prefix":"10.1007","author":[{"given":"Raymond","family":"Kosala","sequence":"first","affiliation":[],"role":[{"role":"author","vocabulary":"crossref"}]},{"given":"Jan","family":"Van den Bussche","sequence":"additional","affiliation":[],"role":[{"role":"author","vocabulary":"crossref"}]},{"given":"Maurice","family":"Bruynooghe","sequence":"additional","affiliation":[],"role":[{"role":"author","vocabulary":"crossref"}]},{"given":"Hendrik","family":"Blockeel","sequence":"additional","affiliation":[],"role":[{"role":"author","vocabulary":"crossref"}]}],"member":"297","published-online":{"date-parts":[[2002,9,18]]},"reference":[{"issue":"4","key":"25_CR1","first-page":"319","volume":"2","author":"D. Angluin","year":"1988","unstructured":"D. Angluin. Queries and concept learning. Machine Learning, 2(4):319\u2013342, 1988.","journal-title":"Machine Learning"},{"key":"25_CR2","unstructured":"M. E. Cali. and R. J. Mooney. Relational learning of pattern-match rules for information extraction. In Proceedings of the Sixteenth National Conference on Artificial Intelligence and Eleventh Conference on Innovative Applications of Artificial Intelligence, pages 328\u2013334. AAAI Press \/ The MIT Press, 1999."},{"key":"25_CR3","doi-asserted-by":"crossref","unstructured":"B. Chidlovskii, J. Ragetli, and M. de Rijke. Wrapper generation via grammar induction. In 11th European Conference on Machine Learning, ECML\u201900, pages 96\u2013108, 2000.","DOI":"10.1007\/3-540-45164-1_11"},{"key":"25_CR4","unstructured":"W. W. Cohen. Recognizing structure in web pages using similarity queries. In Proceedings of the Sixteenth National Conference on Artificial Intelligence and Eleventh Conference on on Innovative Applications of Artificial Intelligence, pages 59\u201366, 1999."},{"key":"25_CR5","unstructured":"H. Comon, M. Dauchet, R. Gilleron, F. Jacquemard, D. Lugiez, S. Tison, and M. Tommasi. Tree Automata Techniques and Applications. Available on: http:\/\/www.grappa.univ-lille3.fr\/tata, 1999."},{"issue":"1","key":"25_CR6","doi-asserted-by":"publisher","first-page":"80","DOI":"10.1145\/234173.234209","volume":"39","author":"J. Cowie","year":"1996","unstructured":"J. Cowie and W. Lehnert. Information extraction. Communications of the ACM, 39(1):80\u201391, 1996.","journal-title":"Communications of the ACM"},{"key":"25_CR7","unstructured":"D. Freitag. Using grammatical inference to improve precision in information extraction. In ICML-97 Workshop on Automata Induction, Grammatical Inference, and Language Acquisition, 1997."},{"key":"25_CR8","unstructured":"D. Freitag. Information extraction from HTML: Application of a general learning approach. In Proceedings of the Fifteenth Conference on Artificial Intelligence AAAI-98, pages 517\u2013523, 1998."},{"key":"25_CR9","unstructured":"D. Freitag and N. Kushmerick. Boosted wrapper induction. In Proceedings of the Seventeenth National Conference on Artificial Intelligence and Twelfth Innovative Applications of AI Conference, pages 577\u2013583. AAAI Press, 2000."},{"key":"25_CR10","unstructured":"D. Freitag and A. McCallum. Information extraction with HMMs and shrinkage. In AAAI-99 Workshop on Machine Learning for Information Extraction, 1999."},{"issue":"5","key":"25_CR11","doi-asserted-by":"publisher","first-page":"447","DOI":"10.1016\/S0019-9958(67)91165-5","volume":"10","author":"E. M. Gold","year":"1967","unstructured":"E. M. Gold. Language identification in the limit. Information and Control, 10(5):447\u2013474, 1967.","journal-title":"Information and Control"},{"key":"25_CR12","doi-asserted-by":"crossref","unstructured":"G. Gottlob and K. Koch. Monadic datalog over trees and the expressive power of languages for web information extraction. In 21st ACM Symposium on Principles of Database Systems, June 2002. To appear.","DOI":"10.1145\/543616.543617"},{"key":"25_CR13","doi-asserted-by":"crossref","unstructured":"T.W. Hong and K. L. Clark. Using grammatical inference to automate information extraction from the web. In Principles of Data Mining and Knowledge Discovery, pages 216\u2013227, 2001.","DOI":"10.1007\/3-540-44794-6_18"},{"issue":"8","key":"25_CR14","doi-asserted-by":"publisher","first-page":"521","DOI":"10.1016\/S0306-4379(98)00027-1","volume":"23","author":"C.-N. Hsu","year":"1998","unstructured":"C.-N. Hsu and M.-T. Dung. Generating finite-state transducers for semi-structured data extraction from the Web. Information Systems, 23(8):521\u2013538, 1998.","journal-title":"Information Systems"},{"key":"25_CR15","unstructured":"I. Muslea. Extraction patterns for information extraction tasks: A survey. In AAAI-99 Workshop on Machine Learning for Information Extraction, 1999."},{"key":"25_CR16","doi-asserted-by":"publisher","first-page":"93","DOI":"10.1023\/A:1010022931168","volume":"4","author":"I. Muslea","year":"2001","unstructured":"I. Muslea, S. Minton, and C. Knoblock. Hierarchical wrapper induction for semistructured information sources. Journal of Autonomous Agents and Multi-Agent Systems, 4:93\u2013114, 2001.","journal-title":"Journal of Autonomous Agents and Multi-Agent Systems"},{"issue":"6","key":"25_CR17","doi-asserted-by":"publisher","first-page":"565","DOI":"10.1016\/S0019-9958(68)90999-6","volume":"13","author":"C. Pair","year":"1968","unstructured":"C. Pair and A. Quere. D\u00e9finition et etude des bilangages r\u00e9guliers. Information and Control, 13(6):565\u2013593, 1968.","journal-title":"Information and Control"},{"key":"25_CR18","doi-asserted-by":"crossref","unstructured":"J. Rico-Juan, J. Calera-Rubio, and R. Carrasco. Probabilistic k-testable treelanguages. In A. Oliveira, editor, Proceedings of 5th International Colloquium, ICGI 2000, Lisbon (Portugal), volume 1891 of Lecture Notes in Computer Science, pages 221\u2013228. Springer, 2000.","DOI":"10.1007\/978-3-540-45257-7_18"},{"issue":"1","key":"25_CR19","doi-asserted-by":"publisher","first-page":"23","DOI":"10.1016\/0890-5401(92)90003-X","volume":"97","author":"Y. Sakakibara","year":"1992","unstructured":"Y. Sakakibara. Efficient learning of context-free grammars from positive structural examples. Information and Computation, 97(1):23\u201360, 1992.","journal-title":"Information and Computation"},{"issue":"1","key":"25_CR20","doi-asserted-by":"publisher","first-page":"15","DOI":"10.1016\/S0304-3975(97)00014-5","volume":"185","author":"Y. Sakakibara","year":"1997","unstructured":"Y. Sakakibara. Recent advances of grammatical inference. Theoretical Computer Science, 185(1):15\u201345, 1997.","journal-title":"Theoretical Computer Science"},{"key":"25_CR21","doi-asserted-by":"crossref","unstructured":"H. Sakamoto, H. Arimura, and S. Arikawa. Knowledge discovery from semistructured texts. In S. Arikawa and A. Shinohara, editors, Progress in Discovery Science \u2014 Final Report of the Japanese Discovery Science Project, volume 2281 of LNAI, pages 586\u2013599. Springer, 2002.","DOI":"10.1007\/3-540-45884-0_45"},{"issue":"1","key":"25_CR22","doi-asserted-by":"publisher","first-page":"233","DOI":"10.1023\/A:1007562322031","volume":"34","author":"S. Soderland","year":"1999","unstructured":"S. Soderland. Learning information extraction rules for semi-structured and free text. Machine Learning, 34(1\u20133):233\u2013272, 1999.","journal-title":"Machine Learning"},{"key":"25_CR23","doi-asserted-by":"publisher","first-page":"1","DOI":"10.1016\/S0019-9958(75)90058-3","volume":"27","author":"M. Takahashi","year":"1975","unstructured":"M. Takahashi. Generalizations of regular sets and their application to a study of context-free languages. Information and Control, 27:1\u201336, 1975.","journal-title":"Information and Control"},{"issue":"11","key":"25_CR24","doi-asserted-by":"publisher","first-page":"1134","DOI":"10.1145\/1968.1972","volume":"27","author":"L. Valiant","year":"1984","unstructured":"L. Valiant. A theory of the learnable. Communications of the ACM, 27(11):1134\u20131142, 1984.","journal-title":"Communications of the ACM"},{"key":"25_CR25","unstructured":"Extensible markup language (XML) 1.0 (second edition). W3C Recommendation 6 October 2000. http:\/\/www.w3.org."}],"container-title":["Lecture Notes in Computer Science","Principles of Data Mining and Knowledge Discovery"],"original-title":[],"language":"en","link":[{"URL":"https:\/\/link.springer.com\/content\/pdf\/10.1007\/3-540-45681-3_25","content-type":"unspecified","content-version":"vor","intended-application":"similarity-checking"}],"deposited":{"date-parts":[[2025,6,10]],"date-time":"2025-06-10T16:36:13Z","timestamp":1749573373000},"score":1,"resource":{"primary":{"URL":"https:\/\/link.springer.com\/10.1007\/3-540-45681-3_25"}},"subtitle":[],"short-title":[],"issued":{"date-parts":[[2002]]},"ISBN":["9783540440376","9783540456810"],"references-count":25,"URL":"https:\/\/doi.org\/10.1007\/3-540-45681-3_25","relation":{},"ISSN":["0302-9743"],"issn-type":[{"type":"print","value":"0302-9743"}],"subject":[],"published":{"date-parts":[[2002]]},"assertion":[{"value":"18 September 2002","order":1,"name":"first_online","label":"First Online","group":{"name":"ChapterHistory","label":"Chapter History"}},{"value":"This content has been made available to all.","name":"free","label":"Free to read"}]}}