{"status":"ok","message-type":"work","message-version":"1.0.0","message":{"indexed":{"date-parts":[[2024,9,8]],"date-time":"2024-09-08T11:02:36Z","timestamp":1725793356397},"publisher-location":"Cham","reference-count":16,"publisher":"Springer International Publishing","isbn-type":[{"type":"print","value":"9783319066042"},{"type":"electronic","value":"9783319066059"}],"content-domain":{"domain":[],"crossmark-restriction":false},"short-container-title":[],"published-print":{"date-parts":[[2014]]},"DOI":"10.1007\/978-3-319-06605-9_47","type":"book-chapter","created":{"date-parts":[[2014,5,7]],"date-time":"2014-05-07T21:56:51Z","timestamp":1399499811000},"page":"572-583","source":"Crossref","is-referenced-by-count":1,"title":["Unsupervised Analysis of Web Page Semantic Structures by Hierarchical Bayesian Modeling"],"prefix":"10.1007","author":[{"given":"Minoru","family":"Yoshida","sequence":"first","affiliation":[]},{"given":"Kazuyuki","family":"Matsumoto","sequence":"additional","affiliation":[]},{"given":"Kenji","family":"Kita","sequence":"additional","affiliation":[]},{"given":"Hiroshi","family":"Nakagawa","sequence":"additional","affiliation":[]}],"member":"297","reference":[{"key":"47_CR1","doi-asserted-by":"crossref","unstructured":"Miao, G., Tatemura, J., Hsiung, W.P., Sawires, A., Moser, L.E.: Extracting data records from the web using tag path clustering. In: Proceedings of WWW 2009, pp. 981\u2013990 (2009)","DOI":"10.1145\/1526709.1526841"},{"key":"47_CR2","doi-asserted-by":"crossref","unstructured":"Liu, B., Grossman, R.L., Zhai, Y.: Mining data records in web pages. In: Proceedings of KDD 2003, pp. 601\u2013606 (2003)","DOI":"10.1145\/956804.956826"},{"key":"47_CR3","unstructured":"Chung, C.Y., Gertz, M., Sundaresan, N.: Reverse engineering for web data: From visual to semantic structures. In: ICDE (2002)"},{"key":"47_CR4","unstructured":"Yang, Y., Zhang, H.: HTML page analysis based on visual cues. 
In: Proceedings of the Sixth International Conference on Document Analysis and Recognition, ICDAR 2001 (2001)"},{"key":"47_CR5","unstructured":"Nanno, T., Saito, S., Okumura, M.: Structuring web pages based on repetition of elements. In: Proceedings of the Second International Workshop on Web Document Analysis, WDA 2003 (2003)"},{"key":"47_CR6","unstructured":"Mukherjee, S., Yang, G., Tan, W., Ramakrishnan, I.: Automatic discovery of semantic structures in HTML documents. In: Proceedings of the Seventh International Conference on Document Analysis and Recognition, ICDAR 2003 (2003)"},{"key":"47_CR7","unstructured":"Crescenzi, V., Mecca, G., Merialdo, P.: ROADRUNNER: Towards automatic data extraction from large web sites. In: Proceedings of the 27th International Conference on Very Large Data Bases (VLDB 2001), pp. 109\u2013118 (2001)"},{"key":"47_CR8","doi-asserted-by":"crossref","unstructured":"Chang, C.H., Lui, S.C.: IEPAD: Information extraction based on pattern discovery. In: Proceedings of the 10th International WWW Conference (WWW 2001), pp. 681\u2013688 (2001)","DOI":"10.1145\/371920.372182"},{"key":"47_CR9","doi-asserted-by":"crossref","unstructured":"Nguyen, C.K., Likforman-Sulem, L., Moissinac, J.C., Faure, C., Lardon, J.: Web document analysis based on visual segmentation and page rendering. In: Proceedings of International Workshop on Document Analysis Systems (DAS 2012), pp. 354\u2013358. IEEE Computer Society (2012)","DOI":"10.1109\/DAS.2012.95"},{"key":"47_CR10","doi-asserted-by":"crossref","unstructured":"Hu, Y., Xin, G., Song, R., Hu, G., Shi, S., Cao, Y., Li, H.: Title extraction from bodies of HTML documents and its application to web page retrieval. In: Proceedings of the 28th Annual International ACM SIGIR Conference (SIGIR 2005), pp. 250\u2013257 (2005)","DOI":"10.1145\/1076034.1076079"},{"key":"47_CR11","doi-asserted-by":"crossref","unstructured":"Tatsumi, Y., Asahi, T.: Analyzing web page headings considering various presentation. 
In: Proceedings of the 14th International Conference on World Wide Web Special Interest Tracks and Posters, pp. 956\u2013957 (2005)","DOI":"10.1145\/1062745.1062816"},{"key":"47_CR12","series-title":"Lecture Notes in Computer Science","doi-asserted-by":"publisher","first-page":"406","DOI":"10.1007\/3-540-36901-5_42","volume-title":"Web Technologies and Applications","author":"D. Cai","year":"2003","unstructured":"Cai, D., Yu, S., Wen, J.R., Ma, W.Y.: Extracting content structure for web pages based on visual representation. In: Zhou, X., Zhang, Y., Orlowska, M.E. (eds.) APWeb 2003. LNCS, vol.\u00a02642, pp. 406\u2013417. Springer, Heidelberg (2003)"},{"issue":"2","key":"47_CR13","doi-asserted-by":"publisher","first-page":"26","DOI":"10.1145\/1964897.1964904","volume":"12","author":"T. Weninger","year":"2010","unstructured":"Weninger, T., Fumarola, F., Barber, R., Han, J., Malerba, D.: Unexpected results in automatic list extraction on the web. ACM SIGKDD Explorations Newsletter\u00a012(2), 26\u201330 (2010)","journal-title":"ACM SIGKDD Explorations Newsletter"},{"issue":"476","key":"47_CR14","doi-asserted-by":"publisher","first-page":"1566","DOI":"10.1198\/016214506000000302","volume":"101","author":"Y.W. Teh","year":"2006","unstructured":"Teh, Y.W., Jordan, M.I., Beal, M.J., Blei, D.M.: Hierarchical dirichlet processes. Journal of the American Statistical Association\u00a0101(476), 1566\u20131581 (2006)","journal-title":"Journal of the American Statistical Association"},{"key":"47_CR15","doi-asserted-by":"crossref","unstructured":"Artiles, J., Gonzalo, J., Sekine, S.: The semeval-2007 weps evaluation: Establishing a benchmark for the web people search task. In: Proceedings of the Workshop on Semantic Evaluation (SemEval 2007) at ACL 2007, pp. 64\u201369 (2007)","DOI":"10.3115\/1621474.1621486"},{"key":"47_CR16","unstructured":"Artiles, J., Gonzalo, J., Sekine, S.: Weps 2 evaluation campaign: overview of the web people search clustering task. 
In: Proceedings of the 2nd Web People Search Evaluation Workshop (WePS 2009), 18th WWW Conference (2009)"}],"container-title":["Lecture Notes in Computer Science","Advances in Knowledge Discovery and Data Mining"],"original-title":[],"link":[{"URL":"http:\/\/link.springer.com\/content\/pdf\/10.1007\/978-3-319-06605-9_47","content-type":"unspecified","content-version":"vor","intended-application":"similarity-checking"}],"deposited":{"date-parts":[[2019,5,26]],"date-time":"2019-05-26T15:50:18Z","timestamp":1558885818000},"score":1,"resource":{"primary":{"URL":"http:\/\/link.springer.com\/10.1007\/978-3-319-06605-9_47"}},"subtitle":[],"short-title":[],"issued":{"date-parts":[[2014]]},"ISBN":["9783319066042","9783319066059"],"references-count":16,"URL":"https:\/\/doi.org\/10.1007\/978-3-319-06605-9_47","relation":{},"ISSN":["0302-9743","1611-3349"],"issn-type":[{"type":"print","value":"0302-9743"},{"type":"electronic","value":"1611-3349"}],"subject":[],"published":{"date-parts":[[2014]]}}}