{"status":"ok","message-type":"work","message-version":"1.0.0","message":{"indexed":{"date-parts":[[2025,6,19]],"date-time":"2025-06-19T04:44:19Z","timestamp":1750308259883,"version":"3.41.0"},"publisher-location":"New York, NY, USA","reference-count":11,"publisher":"ACM","license":[{"start":{"date-parts":[[2004,11,12]],"date-time":"2004-11-12T00:00:00Z","timestamp":1100217600000},"content-version":"vor","delay-in-days":0,"URL":"https:\/\/www.acm.org\/publications\/policies\/copyright_policy#Background"}],"content-domain":{"domain":["dl.acm.org"],"crossmark-restriction":true},"short-container-title":[],"published-print":{"date-parts":[[2004,11,12]]},"DOI":"10.1145\/1031453.1031457","type":"proceedings-article","created":{"date-parts":[[2005,1,30]],"date-time":"2005-01-30T17:58:48Z","timestamp":1107107928000},"page":"9-15","update-policy":"https:\/\/doi.org\/10.1145\/crossmark-policy","source":"Crossref","is-referenced-by-count":9,"title":["SmartCrawl"],"prefix":"10.1145","author":[{"given":"Augusto de Carvalho","family":"Fontes","sequence":"first","affiliation":[{"name":"Universidade Tiradentes"}],"role":[{"role":"author","vocabulary":"crossref"}]},{"given":"F\u00e1bio Soares","family":"Silva","sequence":"additional","affiliation":[{"name":"Universidade Tiradentes"}],"role":[{"role":"author","vocabulary":"crossref"}]}],"member":"320","published-online":{"date-parts":[[2004,11,12]]},"reference":[{"key":"e_1_3_2_1_1_1","volume-title":"The Deep Web: Surfacing Hidden Value","author":"Bergman M. K.","year":"2001","unstructured":"M. K. Bergman . The Deep Web: Surfacing Hidden Value . 2001 . M. K. Bergman. The Deep Web: Surfacing Hidden Value. 2001."},{"key":"e_1_3_2_1_2_1","doi-asserted-by":"publisher","DOI":"10.1016\/S0169-7552(98)00110-X"},{"key":"e_1_3_2_1_3_1","volume-title":"Cyberneko html parser","author":"Clark A.","year":"2004","unstructured":"A. Clark . Cyberneko html parser , 2004 . http:\/\/www.apache.org\/ andyc\/. A. Clark. Cyberneko html parser, 2004. http:\/\/www.apache.org\/ andyc\/."},{"key":"e_1_3_2_1_4_1","doi-asserted-by":"publisher","DOI":"10.1145\/584931.584946"},{"key":"e_1_3_2_1_5_1","first-page":"38","volume-title":"Proceedings of the Workshop on Conceptual Modeling Approaches for e-Business","author":"Liddle S.","year":"2002","unstructured":"S. Liddle , D. Embley , D. Scott , and S. H. Yau . Extracting data behind web forms . In Proceedings of the Workshop on Conceptual Modeling Approaches for e-Business , pages 38 -- 49 , 2002 . S. Liddle, D. Embley, D. Scott, and S. H. Yau. Extracting data behind web forms. In Proceedings of the Workshop on Conceptual Modeling Approaches for e-Business, pages 38--49, 2002."},{"key":"e_1_3_2_1_6_1","first-page":"332","volume-title":"Proceedings of the The International Conference on Information Technology: Coding and Computing (ITCC'02)","author":"Lin K.-I.","year":"2002","unstructured":"K.-I. Lin and H. Chen . Automatic information discovery from the invisible web . In Proceedings of the The International Conference on Information Technology: Coding and Computing (ITCC'02) , pages 332 -- 337 , 2002 . K.-I. Lin and H. Chen. Automatic information discovery from the invisible web. In Proceedings of the The International Conference on Information Technology: Coding and Computing (ITCC'02), pages 332--337, 2002."},{"key":"e_1_3_2_1_7_1","doi-asserted-by":"publisher","DOI":"10.5555\/645927.672025"},{"key":"e_1_3_2_1_8_1","volume-title":"Checklist for search robot crawling and indexing","author":"Rappoport A.","year":"2004","unstructured":"A. Rappoport . Checklist for search robot crawling and indexing , 2004 . http:\/\/www.searchtools.com\/robots\/robot-checklist.html. A. Rappoport. Checklist for search robot crawling and indexing, 2004. http:\/\/www.searchtools.com\/robots\/robot-checklist.html."},{"key":"e_1_3_2_1_9_1","volume-title":"The Invisible Web: Uncovering Information Sources Search Engines Can't See","author":"Sherman C.","year":"2001","unstructured":"C. Sherman and G. Price . The Invisible Web: Uncovering Information Sources Search Engines Can't See . CyberAge Books , 2001 . C. Sherman and G. Price. The Invisible Web: Uncovering Information Sources Search Engines Can't See. CyberAge Books, 2001."},{"key":"e_1_3_2_1_10_1","first-page":"357","volume-title":"Proceedings of the 18th International Conference on Data Engineering","author":"Shkapenyuk V.","unstructured":"V. Shkapenyuk and T. Suel . Design and implementation of a high-performance distributed web crawler . In Proceedings of the 18th International Conference on Data Engineering , pages 357 -- 368 . V. Shkapenyuk and T. Suel. Design and implementation of a high-performance distributed web crawler. In Proceedings of the 18th International Conference on Data Engineering, pages 357--368."},{"key":"e_1_3_2_1_11_1","volume-title":"Study Finds","author":"Sullivan D.","year":"2001","unstructured":"D. Sullivan . Internet Top Information Resource , Study Finds , 2001 . D. Sullivan. Internet Top Information Resource, Study Finds, 2001."}],"event":{"name":"CIKM04: Conference on Information and Knowledge Management","sponsor":["ACM Association for Computing Machinery","SIGIR ACM Special Interest Group on Information Retrieval"],"location":"Washington DC USA","acronym":"CIKM04"},"container-title":["Proceedings of the 6th annual ACM international workshop on Web information and data management"],"original-title":[],"link":[{"URL":"https:\/\/dl.acm.org\/doi\/10.1145\/1031453.1031457","content-type":"unspecified","content-version":"vor","intended-application":"text-mining"},{"URL":"https:\/\/dl.acm.org\/doi\/pdf\/10.1145\/1031453.1031457","content-type":"unspecified","content-version":"vor","intended-application":"similarity-checking"}],"deposited":{"date-parts":[[2025,6,18]],"date-time":"2025-06-18T17:23:46Z","timestamp":1750267426000},"score":1,"resource":{"primary":{"URL":"https:\/\/dl.acm.org\/doi\/10.1145\/1031453.1031457"}},"subtitle":["a new strategy for the exploration of the hidden web"],"short-title":[],"issued":{"date-parts":[[2004,11,12]]},"references-count":11,"alternative-id":["10.1145\/1031453.1031457","10.1145\/1031453"],"URL":"https:\/\/doi.org\/10.1145\/1031453.1031457","relation":{},"subject":[],"published":{"date-parts":[[2004,11,12]]},"assertion":[{"value":"2004-11-12","order":2,"name":"published","label":"Published","group":{"name":"publication_history","label":"Publication History"}}]}}