{"status":"ok","message-type":"work","message-version":"1.0.0","message":{"indexed":{"date-parts":[[2026,3,13]],"date-time":"2026-03-13T13:37:12Z","timestamp":1773409032707,"version":"3.50.1"},"publisher-location":"Berlin, Heidelberg","reference-count":14,"publisher":"Springer Berlin Heidelberg","isbn-type":[{"value":"9783642322808","type":"print"},{"value":"9783642322815","type":"electronic"}],"license":[{"start":{"date-parts":[[2012,1,1]],"date-time":"2012-01-01T00:00:00Z","timestamp":1325376000000},"content-version":"tdm","delay-in-days":0,"URL":"http:\/\/www.springer.com\/tdm"}],"content-domain":{"domain":[],"crossmark-restriction":false},"short-container-title":[],"published-print":{"date-parts":[[2012]]},"DOI":"10.1007\/978-3-642-32281-5_41","type":"book-chapter","created":{"date-parts":[[2012,8,13]],"date-time":"2012-08-13T08:59:36Z","timestamp":1344848376000},"page":"419-433","source":"Crossref","is-referenced-by-count":2,"title":["WYSIWYE: An Algebra for Expressing Spatial and Textual Rules for Information Extraction"],"prefix":"10.1007","author":[{"given":"Vijil","family":"Chenthamarakshan","sequence":"first","affiliation":[]},{"given":"Ramakrishna","family":"Varadarajan","sequence":"additional","affiliation":[]},{"given":"Prasad M.","family":"Deshpande","sequence":"additional","affiliation":[]},{"given":"Raghuram","family":"Krishnapuram","sequence":"additional","affiliation":[]},{"given":"Knut","family":"Stolze","sequence":"additional","affiliation":[]}],"member":"297","reference":[{"key":"41_CR1","unstructured":"Cai, D., Yu, S., Wen, J.R., Ma, W.Y.: Vips: a vision-based page segmentation algorithm. Technical report, Microsoft Research (2003)"},{"key":"41_CR2","doi-asserted-by":"crossref","unstructured":"Gatterbauer, W., Bohunsky, P., Herzog, M., Kr\u00fcpl, B., Pollak, B.: Towards domain-independent information extraction from web tables. In: WWW 2007, Banff, Alberta, Canada, pp. 71\u201380. ACM (2007)","DOI":"10.1145\/1242572.1242583"},{"key":"41_CR3","doi-asserted-by":"publisher","first-page":"119","DOI":"10.1145\/1007568.1007584","volume-title":"SIGMOD 2004","author":"K. Lerman","year":"2004","unstructured":"Lerman, K., Getoor, L., Minton, S., Knoblock, C.: Using the structure of web sites for automatic segmentation of tables. In: SIGMOD 2004, pp. 119\u2013130. ACM, New York (2004)"},{"key":"41_CR4","doi-asserted-by":"crossref","unstructured":"Kr\u00fcpl, B., Herzog, M., Gatterbauer, W.: Using visual cues for extraction of tabular data from arbitrary html documents. In: WWW 2005, pp. 1000\u20131001 (2005)","DOI":"10.1145\/1062745.1062838"},{"key":"41_CR5","doi-asserted-by":"crossref","unstructured":"Reiss, F., Raghavan, S., Krishnamurthy, R., Zhu, H., Vaithyanathan, S.: An algebraic approach to rule-based information extraction. In: ICDE 2008, pp. 933\u2013942 (2008)","DOI":"10.1109\/ICDE.2008.4497502"},{"key":"41_CR6","unstructured":"Shen, W., Doan, A., Naughton, J.F., Ramakrishnan, R.: Declarative information extraction using datalog with embedded extraction predicates. In: VLDB 2007, pp. 1033\u20131044. VLDB Endowment, Vienna (2007)"},{"key":"41_CR7","doi-asserted-by":"crossref","unstructured":"Appelt, D.E., Onyshkevych, B.: The common pattern specification language. In: Proceedings of a Workshop on Held at Baltimore, Maryland, Morristown, NJ, USA, pp. 23\u201330. Association for Computational Linguistics (1996)","DOI":"10.3115\/1119089.1119095"},{"key":"41_CR8","doi-asserted-by":"crossref","unstructured":"Sarawagi, S.: Information extraction. FnT Databases\u00a01(3) (2008)","DOI":"10.1561\/1900000003"},{"key":"41_CR9","doi-asserted-by":"crossref","unstructured":"Cunningham, H., Wilks, Y., Gaizauskas, R.J.: Gate - a general architecture for text engineering (1996)","DOI":"10.3115\/993268.993365"},{"issue":"3-4","key":"41_CR10","doi-asserted-by":"publisher","first-page":"327","DOI":"10.1017\/S1351324904003523","volume":"10","author":"D. Ferrucci","year":"2004","unstructured":"Ferrucci, D., Lally, A.: Uima: an architectural approach to unstructured information processing in the corporate research environment. Nat. Lang. Eng.\u00a010(3-4), 327\u2013348 (2004)","journal-title":"Nat. Lang. Eng."},{"key":"41_CR11","series-title":"Lecture Notes in Computer Science","doi-asserted-by":"publisher","first-page":"164","DOI":"10.1007\/3-540-47952-X_18","volume-title":"Adaptive Hypermedia and Adaptive Web-Based Systems","author":"X.-D. Gu","year":"2002","unstructured":"Gu, X.-D., Chen, J., Ma, W.-Y., Chen, G.-L.: Visual Based Content Understanding towards Web Adaptation. In: De Bra, P., Brusilovsky, P., Conejo, R. (eds.) AH 2002. LNCS, vol.\u00a02347, pp. 164\u2013173. Springer, Heidelberg (2002)"},{"key":"41_CR12","first-page":"250","volume-title":"ICDM 2002","author":"M. Kovacevic","year":"2002","unstructured":"Kovacevic, M., Diligenti, M., Gori, M., Milutinovic, V.: Recognition of common areas in a web page using visual information: a possible application in a page classification. In: ICDM 2002, p. 250. IEEE Computer Society, Washington, DC (2002)"},{"key":"41_CR13","doi-asserted-by":"crossref","unstructured":"Arasu, A., Garcia-Molina, H.: Extracting structured data from web pages. In: SIGMOD Conference, pp. 337\u2013348 (2003)","DOI":"10.1145\/872757.872799"},{"key":"41_CR14","doi-asserted-by":"crossref","unstructured":"Ramakrishnan, G., Balakrishnan, S., Joshi, S.: Entity annotation based on inverse index operations. In: EMNLP 2006, pp. 492\u2013500. Association for Computational Linguistics, Sydney (2006)","DOI":"10.3115\/1610075.1610143"}],"container-title":["Lecture Notes in Computer Science","Web-Age Information Management"],"original-title":[],"language":"en","link":[{"URL":"http:\/\/link.springer.com\/content\/pdf\/10.1007\/978-3-642-32281-5_41","content-type":"unspecified","content-version":"vor","intended-application":"similarity-checking"}],"deposited":{"date-parts":[[2019,5,19]],"date-time":"2019-05-19T21:01:15Z","timestamp":1558299675000},"score":1,"resource":{"primary":{"URL":"http:\/\/link.springer.com\/10.1007\/978-3-642-32281-5_41"}},"subtitle":[],"short-title":[],"issued":{"date-parts":[[2012]]},"ISBN":["9783642322808","9783642322815"],"references-count":14,"URL":"https:\/\/doi.org\/10.1007\/978-3-642-32281-5_41","relation":{},"ISSN":["0302-9743","1611-3349"],"issn-type":[{"value":"0302-9743","type":"print"},{"value":"1611-3349","type":"electronic"}],"subject":[],"published":{"date-parts":[[2012]]}}}