{"status":"ok","message-type":"work","message-version":"1.0.0","message":{"indexed":{"date-parts":[[2025,3,4]],"date-time":"2025-03-04T05:44:37Z","timestamp":1741067077929,"version":"3.38.0"},"reference-count":17,"publisher":"Springer Science and Business Media LLC","issue":"5-6","license":[{"start":{"date-parts":[[2011,3,8]],"date-time":"2011-03-08T00:00:00Z","timestamp":1299542400000},"content-version":"tdm","delay-in-days":0,"URL":"http:\/\/www.springer.com\/tdm"}],"content-domain":{"domain":[],"crossmark-restriction":false},"short-container-title":["World Wide Web"],"published-print":{"date-parts":[[2011,10]]},"DOI":"10.1007\/s11280-011-0124-6","type":"journal-article","created":{"date-parts":[[2011,3,7]],"date-time":"2011-03-07T08:04:16Z","timestamp":1299485056000},"page":"623-649","source":"Crossref","is-referenced-by-count":5,"title":["Indexing and querying segmented web pages: the BlockWeb Model"],"prefix":"10.1007","volume":"14","author":[{"given":"Emmanuel","family":"Bruno","sequence":"first","affiliation":[],"role":[{"role":"author","vocabulary":"crossref"}]},{"given":"Nicolas","family":"Faessel","sequence":"additional","affiliation":[],"role":[{"role":"author","vocabulary":"crossref"}]},{"given":"Herv\u00e9","family":"Glotin","sequence":"additional","affiliation":[],"role":[{"role":"author","vocabulary":"crossref"}]},{"given":"Jacques","family":"Le Maitre","sequence":"additional","affiliation":[],"role":[{"role":"author","vocabulary":"crossref"}]},{"given":"Michel","family":"Scholl","sequence":"additional","affiliation":[],"role":[{"role":"author","vocabulary":"crossref"}]}],"member":"297","published-online":{"date-parts":[[2011,3,8]]},"reference":[{"key":"124_CR1","doi-asserted-by":"crossref","unstructured":"Bruno, E., Faessel, N., Glotin, H., Le Maitre, J., Scholl, M.: Indexing by permeability in block structured web pages. In: Proceedings of the 9th ACM Symposium on Document Engineering (DocEng 2009), pp. 70\u201373, (2009) (short paper)","DOI":"10.1145\/1600193.1600209"},{"key":"124_CR2","doi-asserted-by":"crossref","unstructured":"Bruno, E., Faessel, N., Le Maitre, J., Scholl, M.: Blockweb: an IR model for block structured web pages. In: Proc. of 7th Int. Workshop on Content Based Multimedia Indexing (CBMI 2009), pp. 219\u2013224. Chania, Crete, June 3\u20135 (2009)","DOI":"10.1109\/CBMI.2009.36"},{"key":"124_CR3","doi-asserted-by":"crossref","first-page":"952","DOI":"10.1145\/1027527.1027747","volume-title":"Proc. of the 12th ACM Int. Conf. on Multimedia, MULTIMEDIA \u201904","author":"D Cai","year":"2004","unstructured":"Cai, D., He, X., Li, Z., Ma, W.-Y., Wen, J.-R.: Hierarchical clustering of WWW image search results using visual, textual and link information. In: Proc. of the 12th ACM Int. Conf. on Multimedia, MULTIMEDIA \u201904, pp. 952\u2013959. ACM, New York, NY, USA (2004)"},{"key":"124_CR4","unstructured":"Cai, D., Yu, S., Wen, J.-R., Ma, W.-Y.: VIPS: A Vision-Based Page Segmentation Algorithm. Technical report, Microsoft Research (2003)"},{"key":"124_CR5","doi-asserted-by":"crossref","unstructured":"Cui, H., Wen, J.: Hierarchical indexing and flexible element retrieval for structured documents. In: Proc. of the 25th European Conf. on IR Research (ECIR 2003), pp. 73\u201387. Pisa, Italy (2003)","DOI":"10.1007\/3-540-36618-0_6"},{"issue":"9","key":"124_CR6","doi-asserted-by":"crossref","first-page":"1233","DOI":"10.1109\/TKDE.2005.138","volume":"17","author":"S Debnath","year":"2005","unstructured":"Debnath, S., Mitra, P., Pal, N., Giles, C.L.: Automatic identification of informative sections of web pages. IEEE Trans. Knowl. Data Eng. 17(9), 1233\u20131246 (2005)","journal-title":"IEEE Trans. Knowl. Data Eng."},{"key":"124_CR7","unstructured":"Duda, R.O., Hart, P.E., Stork, D.G.: Pattern Classification. Wiley-Interscience (2000)"},{"key":"124_CR8","doi-asserted-by":"crossref","unstructured":"Ha, J., Haralick, R.M., Phillips, I.T.: Recursive X-Y cut using bounding boxes of connected components. In: Proc. of the Third International Conference on Document Analysis and Recognition (ICDAR\u201995), vol. 2, pp. 952\u2013955. Washington, DC, USA (1995)","DOI":"10.1109\/ICDAR.1995.602059"},{"key":"124_CR9","doi-asserted-by":"crossref","unstructured":"Lin, S.-H., Ho, J.-M.: Discovering informative content blocks from Web documents. In: Proc. of the 8th ACM SIGKDD Int. Conf. on Knowledge Discovery and Data Mining, pp. 588\u2013593. Edmonton, Alberta, Canada (2002)","DOI":"10.1145\/775047.775134"},{"key":"124_CR10","unstructured":"Mo\u00ebllic, P.A., Fluhr, C.: ImagEval 2006 official campaign. CEA List (2006)"},{"issue":"11","key":"124_CR11","doi-asserted-by":"crossref","first-page":"613","DOI":"10.1145\/361219.361220","volume":"18","author":"G Salton","year":"1975","unstructured":"Salton, G., Wong, A., Yang, C.S.: A vector space model for automatic indexing. Commun. ACM 18(11), 613\u2013620 (1975)","journal-title":"Commun. ACM"},{"key":"124_CR12","doi-asserted-by":"crossref","unstructured":"Song, R., Liu, H., Wen, J.-R., Ma, W.-Y.: Learning block importance models for web pages. In: Proc. of the 13th Int. Conf. on World Wide Web (WWW 2004), pp. 203\u2013211. Manhattan, NY, USA (2004)","DOI":"10.1145\/988672.988700"},{"key":"124_CR13","doi-asserted-by":"crossref","unstructured":"Tollari, S., Glotin, H.: Web image retrieval on ImagEVAL: Evidences on visualness and textualness concept dependency in fusion model. In: Proc. of the ACM Int. Conf. on Image and Video Retrieval (CIVR 2007), pp. 65\u201372 (2007)","DOI":"10.1145\/1282280.1282289"},{"key":"124_CR14","doi-asserted-by":"crossref","unstructured":"Tollari, S., Glotin, H.: Learning optimal visual features from web sampling in online image retrieval. In: IEEE International Conference on Acoustics, Speech and Signal Processing. ICASSP 2008, pp. 1229\u20131232. IEEE (2008)","DOI":"10.1109\/ICASSP.2008.4517838"},{"issue":"2","key":"124_CR15","doi-asserted-by":"crossref","first-page":"157","DOI":"10.1007\/s11280-007-0021-1","volume":"10","author":"S Vadrevu","year":"2007","unstructured":"Vadrevu, S., Gelgi, F., Davulcu, H.: Information extraction from web pages using presentation regularities and domain knowledge. World Wide Web 10(2), 157\u2013179 (2007)","journal-title":"World Wide Web"},{"key":"124_CR16","doi-asserted-by":"crossref","unstructured":"Yi, L., Liu, B., Li, X.: Eliminating noisy information in web pages for data mining. In: Proc of the 9th ACM SIGKDD Int. Conf. on Knowledge Discovery and Data Mining, pp. 296\u2013305. Washington, DC, USA, ACM (2003)","DOI":"10.1145\/956755.956785"},{"key":"124_CR17","doi-asserted-by":"crossref","unstructured":"Zou, J., Le, D., Thoma, G.R.: Combining DOM tree and geometric layout analysis for online medical journal article segmentation. In: Proc. of the 6th ACM\/IEEE-CS Joint Conf. on Digital Libraries, pp. 119\u2013128. Chapel Hill, North Carolina, USA (2006)","DOI":"10.1145\/1141753.1141777"}],"container-title":["World Wide Web"],"original-title":[],"language":"en","link":[{"URL":"http:\/\/link.springer.com\/content\/pdf\/10.1007\/s11280-011-0124-6.pdf","content-type":"application\/pdf","content-version":"vor","intended-application":"text-mining"},{"URL":"http:\/\/link.springer.com\/article\/10.1007\/s11280-011-0124-6\/fulltext.html","content-type":"text\/html","content-version":"vor","intended-application":"text-mining"},{"URL":"http:\/\/link.springer.com\/content\/pdf\/10.1007\/s11280-011-0124-6","content-type":"unspecified","content-version":"vor","intended-application":"similarity-checking"}],"deposited":{"date-parts":[[2025,3,3]],"date-time":"2025-03-03T15:23:21Z","timestamp":1741015401000},"score":1,"resource":{"primary":{"URL":"http:\/\/link.springer.com\/10.1007\/s11280-011-0124-6"}},"subtitle":[],"short-title":[],"issued":{"date-parts":[[2011,3,8]]},"references-count":17,"journal-issue":{"issue":"5-6","published-print":{"date-parts":[[2011,10]]}},"alternative-id":["124"],"URL":"https:\/\/doi.org\/10.1007\/s11280-011-0124-6","relation":{},"ISSN":["1386-145X","1573-1413"],"issn-type":[{"type":"print","value":"1386-145X"},{"type":"electronic","value":"1573-1413"}],"subject":[],"published":{"date-parts":[[2011,3,8]]}}}