{"status":"ok","message-type":"work","message-version":"1.0.0","message":{"indexed":{"date-parts":[[2025,6,19]],"date-time":"2025-06-19T04:23:40Z","timestamp":1750307020271,"version":"3.41.0"},"publisher-location":"New York, NY, USA","reference-count":10,"publisher":"ACM","license":[{"start":{"date-parts":[[2012,6,13]],"date-time":"2012-06-13T00:00:00Z","timestamp":1339545600000},"content-version":"vor","delay-in-days":0,"URL":"https:\/\/www.acm.org\/publications\/policies\/copyright_policy#Background"}],"content-domain":{"domain":["dl.acm.org"],"crossmark-restriction":true},"short-container-title":[],"published-print":{"date-parts":[[2012,6,13]]},"DOI":"10.1145\/2254129.2254209","type":"proceedings-article","created":{"date-parts":[[2012,6,15]],"date-time":"2012-06-15T15:32:03Z","timestamp":1339774323000},"page":"1-4","update-policy":"https:\/\/doi.org\/10.1145\/crossmark-policy","source":"Crossref","is-referenced-by-count":0,"title":["Automated internal web page clustering for improved data extraction"],"prefix":"10.1145","author":[{"given":"Cornelia","family":"Gy\u0151r\u00f6di","sequence":"first","affiliation":[{"name":"University of Oradea"}]},{"given":"Robert","family":"Gy\u0151r\u00f6di","sequence":"additional","affiliation":[{"name":"University of Oradea"}]},{"given":"Mihai","family":"Cornea","sequence":"additional","affiliation":[{"name":"University of Oradea"}]},{"given":"George","family":"Pecherle","sequence":"additional","affiliation":[{"name":"University of Oradea"}]}],"member":"320","published-online":{"date-parts":[[2012,6,13]]},"reference":[{"key":"e_1_3_2_1_1_1","unstructured":"Efficient Implementation of the Levenshtein-Algorithm Fault-tolerant Search Technology Error-tolerant Search Technologies. DOI= http:\/\/www.levenshtein.net\/  Efficient Implementation of the Levenshtein-Algorithm Fault-tolerant Search Technology Error-tolerant Search Technologies. DOI= http:\/\/www.levenshtein.net\/"},{"volume-title":"Proceedings of the 27th VLDB Conference","year":"2001","author":"Crescenzi Valter","key":"e_1_3_2_1_2_1"},{"key":"e_1_3_2_1_3_1","doi-asserted-by":"publisher","DOI":"10.1145\/1066677.1067065"},{"key":"e_1_3_2_1_4_1","doi-asserted-by":"publisher","DOI":"10.1145\/775047.775134"},{"key":"e_1_3_2_1_5_1","doi-asserted-by":"publisher","DOI":"10.1145\/956750.956826"},{"key":"e_1_3_2_1_6_1","doi-asserted-by":"publisher","DOI":"10.1145\/360402.360406"},{"key":"e_1_3_2_1_7_1","unstructured":"Hotnews.ro Web Forum -- example of website with repetitive patterns http:\/\/forum.hotnews.ro\/  Hotnews.ro Web Forum -- example of website with repetitive patterns http:\/\/forum.hotnews.ro\/"},{"key":"e_1_3_2_1_8_1","unstructured":"Paul Ruhlen Husrev Tolga Ilhan V. Benjamin Livshits -- \"Unsupervised Web Page Clustering\" -- CS 224N Final Project -- Spring 2000 Stanford Univ. pag. 1--15.  Paul Ruhlen Husrev Tolga Ilhan V. Benjamin Livshits -- \"Unsupervised Web Page Clustering\" -- CS 224N Final Project -- Spring 2000 Stanford Univ. pag. 1--15."},{"key":"e_1_3_2_1_9_1","first-page":"9","article-title":"Web Page Analysis Based on HTML DOM and Its Usage for Forum Statistics, Alerts and Geo Targeted Data Retrieval","volume":"8","author":"Gyor\u00f6di Robert","year":"2010","journal-title":"Journal WSEAS TRANSACTIONS on COMPUTERS, Issue"},{"key":"e_1_3_2_1_10_1","unstructured":"Antonio LaTorre Jose M. Pena Victor Robles Maria S. Perez - \"A Survey in Web Page Clustering Techniques\"  Antonio LaTorre Jose M. Pena Victor Robles Maria S. Perez - \"A Survey in Web Page Clustering Techniques\""}],"event":{"name":"WIMS '12: 2nd International Conference on Web Intelligence, Mining and Semantics","sponsor":["UCV University of Craiova","WNRI Western Norway Research Institute"],"location":"Craiova Romania","acronym":"WIMS '12"},"container-title":["Proceedings of the 2nd International Conference on Web Intelligence, Mining and Semantics"],"original-title":[],"link":[{"URL":"https:\/\/dl.acm.org\/doi\/10.1145\/2254129.2254209","content-type":"unspecified","content-version":"vor","intended-application":"text-mining"},{"URL":"https:\/\/dl.acm.org\/doi\/pdf\/10.1145\/2254129.2254209","content-type":"unspecified","content-version":"vor","intended-application":"similarity-checking"}],"deposited":{"date-parts":[[2025,6,18]],"date-time":"2025-06-18T08:49:12Z","timestamp":1750236552000},"score":1,"resource":{"primary":{"URL":"https:\/\/dl.acm.org\/doi\/10.1145\/2254129.2254209"}},"subtitle":[],"short-title":[],"issued":{"date-parts":[[2012,6,13]]},"references-count":10,"alternative-id":["10.1145\/2254129.2254209","10.1145\/2254129"],"URL":"https:\/\/doi.org\/10.1145\/2254129.2254209","relation":{},"subject":[],"published":{"date-parts":[[2012,6,13]]},"assertion":[{"value":"2012-06-13","order":2,"name":"published","label":"Published","group":{"name":"publication_history","label":"Publication History"}}]}}