{"status":"ok","message-type":"work","message-version":"1.0.0","message":{"indexed":{"date-parts":[[2025,6,19]],"date-time":"2025-06-19T04:32:55Z","timestamp":1750307575478,"version":"3.41.0"},"publisher-location":"New York, NY, USA","reference-count":11,"publisher":"ACM","license":[{"start":{"date-parts":[[2009,12,3]],"date-time":"2009-12-03T00:00:00Z","timestamp":1259798400000},"content-version":"vor","delay-in-days":0,"URL":"https:\/\/www.acm.org\/publications\/policies\/copyright_policy#Background"}],"content-domain":{"domain":["dl.acm.org"],"crossmark-restriction":true},"short-container-title":[],"published-print":{"date-parts":[[2009,12,3]]},"DOI":"10.1145\/1667780.1667805","type":"proceedings-article","created":{"date-parts":[[2009,12,15]],"date-time":"2009-12-15T12:55:59Z","timestamp":1260881759000},"page":"126-131","update-policy":"https:\/\/doi.org\/10.1145\/crossmark-policy","source":"Crossref","is-referenced-by-count":4,"title":["Development of a large-scale web crawler and search engine infrastructure"],"prefix":"10.1145","author":[{"given":"Susumu","family":"Akamine","sequence":"first","affiliation":[{"name":"National Institute of Information and Communications Technology, Soraku-gun, Kyoto, Japan"}],"role":[{"role":"author","vocabulary":"crossref"}]},{"given":"Yoshikiyo","family":"Kato","sequence":"additional","affiliation":[{"name":"National Institute of Information and Communications Technology, Soraku-gun, Kyoto, Japan"}],"role":[{"role":"author","vocabulary":"crossref"}]},{"given":"Daisuke","family":"Kawahara","sequence":"additional","affiliation":[{"name":"National Institute of Information and Communications Technology, Soraku-gun, Kyoto, Japan"}],"role":[{"role":"author","vocabulary":"crossref"}]},{"given":"Keiji","family":"Shinzato","sequence":"additional","affiliation":[{"name":"Kyoto University, Yoshida Honmachi, Kyoto, Japan"}],"role":[{"role":"author","vocabulary":"crossref"}]},{"given":"Kentaro","family":"Inui","sequence":"additional","affiliation":[{"name":"National Institute of Information and Communications Technology, Soraku-gun, Kyoto, Japan and Nara Institute of Science and Technology, Ikoma, Nara, Japan"}],"role":[{"role":"author","vocabulary":"crossref"}]},{"given":"Sadao","family":"Kurohashi","sequence":"additional","affiliation":[{"name":"National Institute of Information and Communications Technology, Soraku-gun, Kyoto, Japan and Kyoto University, Yoshida Honmachi, Kyoto, Japan"}],"role":[{"role":"author","vocabulary":"crossref"}]},{"given":"Yutaka","family":"Kidawara","sequence":"additional","affiliation":[{"name":"National Institute of Information and Communications Technology, Soraku-gun, Kyoto, Japan"}],"role":[{"role":"author","vocabulary":"crossref"}]}],"member":"320","published-online":{"date-parts":[[2009,12,3]]},"reference":[{"volume-title":"Corpus Workshop, http:\/\/webascorpus.sf.net\/WAC4\/","author":"Web","key":"e_1_3_2_1_1_1","unstructured":"Web as Corpus Workshop, http:\/\/webascorpus.sf.net\/WAC4\/ Web as Corpus Workshop, http:\/\/webascorpus.sf.net\/WAC4\/"},{"key":"e_1_3_2_1_2_1","doi-asserted-by":"publisher","DOI":"10.1109\/ISUC.2008.79"},{"key":"e_1_3_2_1_3_1","doi-asserted-by":"publisher","DOI":"10.1145\/1367497.1367556"},{"key":"e_1_3_2_1_4_1","doi-asserted-by":"publisher","DOI":"10.1145\/1367497.1367557"},{"key":"e_1_3_2_1_5_1","doi-asserted-by":"publisher","DOI":"10.1145\/1571941.1572041"},{"key":"e_1_3_2_1_6_1","doi-asserted-by":"publisher","DOI":"10.5555\/297805.297827"},{"key":"e_1_3_2_1_7_1","doi-asserted-by":"publisher","DOI":"10.1145\/792550.792553"},{"key":"e_1_3_2_1_8_1","doi-asserted-by":"publisher","DOI":"10.1016\/j.ipm.2004.10.007"},{"key":"e_1_3_2_1_9_1","first-page":"189","volume-title":"Proceedings of the Third International Joint Conference on Natural Language Processing","author":"Shinzato K.","year":"2008","unstructured":"K. Shinzato , T. Shibata , D. Kawahara , C. Hashimoto and S. Kurohashi : TSUBAKI: An Open Search Engine Infrastructure for Developing new Information Access Methodology , In Proceedings of the Third International Joint Conference on Natural Language Processing , pp. 189 -- 196 , 2008 . K. Shinzato, T. Shibata, D. Kawahara, C. Hashimoto and S. Kurohashi: TSUBAKI: An Open Search Engine Infrastructure for Developing new Information Access Methodology, In Proceedings of the Third International Joint Conference on Natural Language Processing, pp. 189--196, 2008."},{"key":"e_1_3_2_1_10_1","volume-title":"the Proceedings of the Sixth International Conference on Language Resources and Evaluation (LREC08)","author":"Shinzato K.","year":"2008","unstructured":"K. Shinzato , D. Kawahara , C. Hashimoto and S. Kurohashi : A Large-Scale Web Data Collection as a Natural Language Processing Infrastructure , In the Proceedings of the Sixth International Conference on Language Resources and Evaluation (LREC08) , 2008 . K. Shinzato, D. Kawahara, C. Hashimoto and S. Kurohashi: A Large-Scale Web Data Collection as a Natural Language Processing Infrastructure, In the Proceedings of the Sixth International Conference on Language Resources and Evaluation (LREC08), 2008."},{"key":"e_1_3_2_1_11_1","first-page":"787","volume-title":"the Proceedings of Third International Joint Conference on Natural Language Processing","author":"Shibata T.","year":"2008","unstructured":"T. Shibata , M. Odani , J. Harashima , T. Oonishi and S. Kurohashi : SYNGRAPH: A Flexible Matching Method based on Synonymous Expression Extraction from an Ordinary Dictionary and a Web Corpus , In the Proceedings of Third International Joint Conference on Natural Language Processing , pp. 787 -- 792 , 2008 . T. Shibata, M. Odani, J. Harashima, T. Oonishi and S. Kurohashi: SYNGRAPH: A Flexible Matching Method based on Synonymous Expression Extraction from an Ordinary Dictionary and a Web Corpus, In the Proceedings of Third International Joint Conference on Natural Language Processing, pp. 787--792, 2008."}],"event":{"name":"IUCS '09: 3rd International Universal Communication Symposium","sponsor":["NICT National Institute of Information and Communications Technology"],"location":"Tokyo Japan","acronym":"IUCS '09"},"container-title":["Proceedings of the 3rd International Universal Communication Symposium"],"original-title":[],"link":[{"URL":"https:\/\/dl.acm.org\/doi\/10.1145\/1667780.1667805","content-type":"unspecified","content-version":"vor","intended-application":"text-mining"},{"URL":"https:\/\/dl.acm.org\/doi\/pdf\/10.1145\/1667780.1667805","content-type":"unspecified","content-version":"vor","intended-application":"similarity-checking"}],"deposited":{"date-parts":[[2025,6,18]],"date-time":"2025-06-18T12:41:08Z","timestamp":1750250468000},"score":1,"resource":{"primary":{"URL":"https:\/\/dl.acm.org\/doi\/10.1145\/1667780.1667805"}},"subtitle":[],"short-title":[],"issued":{"date-parts":[[2009,12,3]]},"references-count":11,"alternative-id":["10.1145\/1667780.1667805","10.1145\/1667780"],"URL":"https:\/\/doi.org\/10.1145\/1667780.1667805","relation":{},"subject":[],"published":{"date-parts":[[2009,12,3]]},"assertion":[{"value":"2009-12-03","order":2,"name":"published","label":"Published","group":{"name":"publication_history","label":"Publication History"}}]}}