{"status":"ok","message-type":"work","message-version":"1.0.0","message":{"indexed":{"date-parts":[[2025,6,19]],"date-time":"2025-06-19T04:41:54Z","timestamp":1750308114395,"version":"3.41.0"},"publisher-location":"New York, NY, USA","reference-count":34,"publisher":"ACM","license":[{"start":{"date-parts":[[2005,6,20]],"date-time":"2005-06-20T00:00:00Z","timestamp":1119225600000},"content-version":"vor","delay-in-days":0,"URL":"https:\/\/www.acm.org\/publications\/policies\/copyright_policy#Background"}],"content-domain":{"domain":["dl.acm.org"],"crossmark-restriction":true},"short-container-title":[],"published-print":{"date-parts":[[2005,6,20]]},"DOI":"10.1145\/1088149.1088162","type":"proceedings-article","created":{"date-parts":[[2005,11,7]],"date-time":"2005-11-07T17:34:39Z","timestamp":1131384879000},"page":"91-100","update-policy":"https:\/\/doi.org\/10.1145\/crossmark-policy","source":"Crossref","is-referenced-by-count":4,"title":["Design of a next generation sampling service for large scale data analysis applications"],"prefix":"10.1145","author":[{"given":"H.","family":"Wang","sequence":"first","affiliation":[{"name":"The Ohio State University, Columbus, OH"}]},{"given":"S.","family":"Parthasarathy","sequence":"additional","affiliation":[{"name":"The Ohio State University, Columbus, OH"}]},{"given":"A.","family":"Ghoting","sequence":"additional","affiliation":[{"name":"The Ohio State University, Columbus, OH"}]},{"given":"S.","family":"Tatikonda","sequence":"additional","affiliation":[{"name":"The Ohio State University, Columbus, OH"}]},{"given":"G.","family":"Buehrer","sequence":"additional","affiliation":[{"name":"The Ohio State University, Columbus, OH"}]},{"given":"T.","family":"Kurc","sequence":"additional","affiliation":[{"name":"The Ohio State University, Columbus, OH"}]},{"given":"J.","family":"Saltz","sequence":"additional","affiliation":[{"name":"The Ohio State University, Columbus, OH"}]}],"member":"320","published-online":{"date-parts":[[2005,6,20]]},"reference":[{"key":"e_1_3_2_1_1_1","doi-asserted-by":"publisher","DOI":"10.1145\/543613.543615"},{"key":"e_1_3_2_1_2_1","doi-asserted-by":"publisher","DOI":"10.1145\/602421.602425"},{"key":"e_1_3_2_1_3_1","volume-title":"Proceedings of the Annual Linux Showcase and Conference","author":"Carns P.","year":"2000","unstructured":"P. Carns , W. Ligon , R. Ross , and R. Thakur . Pvfs: A parallel file system for linux clusters . In Proceedings of the Annual Linux Showcase and Conference , 2000 .]] P. Carns, W. Ligon, R. Ross, and R. Thakur. Pvfs: A parallel file system for linux clusters. In Proceedings of the Annual Linux Showcase and Conference, 2000.]]"},{"key":"e_1_3_2_1_4_1","doi-asserted-by":"publisher","DOI":"10.5555\/645919.672655"},{"key":"e_1_3_2_1_5_1","volume-title":"The Data Grid: Towards an Architecture For the Distributed Management and Analysis of Large Scientific Datasets","author":"Chervenak A.","year":"2001","unstructured":"A. Chervenak , I. Foster , C. Kesselman , C. Salisbury , and S. Tuecke . The Data Grid: Towards an Architecture For the Distributed Management and Analysis of Large Scientific Datasets , 2001 .]] A. Chervenak, I. Foster, C. Kesselman, C. Salisbury, and S. Tuecke. The Data Grid: Towards an Architecture For the Distributed Management and Analysis of Large Scientific Datasets, 2001.]]"},{"key":"e_1_3_2_1_6_1","doi-asserted-by":"publisher","DOI":"10.1145\/233557.233558"},{"key":"e_1_3_2_1_7_1","volume-title":"Introduction to Algorithms","author":"Cormen Thomas H.","year":"1990","unstructured":"Thomas H. Cormen , Charles E. Leiserson , and Ronald L. Rivest . Introduction to Algorithms , McGraw Hill , 1990 .]] Thomas H. Cormen, Charles E. Leiserson, and Ronald L. Rivest. Introduction to Algorithms, McGraw Hill, 1990.]]"},{"key":"e_1_3_2_1_8_1","doi-asserted-by":"publisher","DOI":"10.1145\/129888.129894"},{"key":"e_1_3_2_1_9_1","doi-asserted-by":"publisher","DOI":"10.1023\/A:1007607513941"},{"key":"e_1_3_2_1_10_1","volume-title":"Proceedings of the International Conference on Machine Learning","author":"Domingos P.","year":"2001","unstructured":"P. Domingos and G. Hulten . A general method for scaling up machine learning algorithms and its applications to clustering . In Proceedings of the International Conference on Machine Learning , 2001 .]] P. Domingos and G. Hulten. A general method for scaling up machine learning algorithms and its applications to clustering. In Proceedings of the International Conference on Machine Learning, 2001.]]"},{"key":"e_1_3_2_1_11_1","doi-asserted-by":"publisher","DOI":"10.1145\/319682.319698"},{"key":"e_1_3_2_1_12_1","doi-asserted-by":"publisher","DOI":"10.5555\/382019.382409"},{"key":"e_1_3_2_1_13_1","first-page":"181","volume-title":"Proceedings of the 12th VLDB Conference","author":"Fang M. T.","year":"1986","unstructured":"M. T. Fang , R. C. T. Lee , and C. C. Chang . The idea of de-clustering and its applications . In Proceedings of the 12th VLDB Conference , pages 181 -- 188 , 1986 .]] M. T. Fang, R. C. T. Lee, and C. C. Chang. The idea of de-clustering and its applications. In Proceedings of the 12th VLDB Conference, pages 181--188, 1986.]]"},{"key":"e_1_3_2_1_14_1","volume-title":"Morgan Kauffman","author":"Han J.","year":"2001","unstructured":"J. Han and M. Kamber . Data Mining: Concepts and Techniques . Morgan Kauffman , 2001 .]] J. Han and M. Kamber. Data Mining: Concepts and Techniques. Morgan Kauffman, 2001.]]"},{"key":"e_1_3_2_1_15_1","doi-asserted-by":"publisher","DOI":"10.1145\/1007568.1007603"},{"key":"e_1_3_2_1_16_1","volume-title":"Proceedings of the International Conference on Knowledge Discovery and Data Mining","author":"John G.","year":"1996","unstructured":"G. John and P. Langley . Static versus dynamic sampling for data mining . In Proceedings of the International Conference on Knowledge Discovery and Data Mining , 1996 .]] G. John and P. Langley. Static versus dynamic sampling for data mining. In Proceedings of the International Conference on Knowledge Discovery and Data Mining, 1996.]]"},{"key":"e_1_3_2_1_17_1","first-page":"61","volume-title":"Proceedings of the 1994 Symposium on Operating Systems Design and Implementation","author":"Kotz David","year":"1994","unstructured":"David Kotz . Disk-directed I\/ O for MIMD multiprocessors. In Proceedings of the 1994 Symposium on Operating Systems Design and Implementation , pages 61 -- 74 . ACM Press , November 1994 .]] David Kotz. Disk-directed I\/O for MIMD multiprocessors. In Proceedings of the 1994 Symposium on Operating Systems Design and Implementation, pages 61--74. ACM Press, November 1994.]]"},{"key":"e_1_3_2_1_18_1","first-page":"373","volume-title":"Proceedings of the International Conference on Data Engineering","author":"Liu Duen-Ren","year":"1995","unstructured":"Duen-Ren Liu and Shashi Shekhar . A similarity graph-based approach to declustering problems and its applications towards parallelizing grid files . In Proceedings of the International Conference on Data Engineering , pages 373 -- 381 , Taipei, Taiwan , March 1995 . IEEE Computer Society Press.]] Duen-Ren Liu and Shashi Shekhar. A similarity graph-based approach to declustering problems and its applications towards parallelizing grid files. In Proceedings of the International Conference on Data Engineering, pages 373--381, Taipei, Taiwan, March 1995. IEEE Computer Society Press.]]"},{"key":"e_1_3_2_1_19_1","doi-asserted-by":"publisher","DOI":"10.5555\/951949.952127"},{"key":"e_1_3_2_1_20_1","volume-title":"Morgan Kaufmann Publishers","author":"May John M.","year":"2000","unstructured":"John M. May . Parallel I\/O for High Performance Computing . Morgan Kaufmann Publishers , 2000 .]] John M. May. Parallel I\/O for High Performance Computing. Morgan Kaufmann Publishers, 2000.]]"},{"key":"e_1_3_2_1_21_1","doi-asserted-by":"publisher","DOI":"10.5555\/645606.661024"},{"key":"e_1_3_2_1_22_1","doi-asserted-by":"publisher","DOI":"10.1145\/237578.237639"},{"key":"e_1_3_2_1_23_1","doi-asserted-by":"publisher","DOI":"10.5555\/88169.88188"},{"key":"e_1_3_2_1_24_1","volume-title":"Proceeding of the IEEE GlobeCom Global Internet Symposium","author":"Pan J.","year":"2002","unstructured":"J. Pan , C. Faloutsos , and S. Seshan . Fastcars: Fast, correlation-aware sampling for network data mining . In Proceeding of the IEEE GlobeCom Global Internet Symposium , 2002 .]] J. Pan, C. Faloutsos, and S. Seshan. Fastcars: Fast, correlation-aware sampling for network data mining. In Proceeding of the IEEE GlobeCom Global Internet Symposium, 2002.]]"},{"key":"e_1_3_2_1_25_1","doi-asserted-by":"publisher","DOI":"10.5555\/844380.844755"},{"key":"e_1_3_2_1_26_1","doi-asserted-by":"publisher","DOI":"10.1145\/582034.582051"},{"key":"e_1_3_2_1_27_1","doi-asserted-by":"publisher","DOI":"10.1145\/312129.312188"},{"key":"e_1_3_2_1_28_1","doi-asserted-by":"publisher","DOI":"10.1023\/A:1009876119989"},{"key":"e_1_3_2_1_29_1","doi-asserted-by":"publisher","DOI":"10.1145\/224170.224371"},{"key":"e_1_3_2_1_30_1","doi-asserted-by":"publisher","DOI":"10.5555\/872748.873252"},{"issue":"6","key":"e_1_3_2_1_31_1","first-page":"70","article-title":"Optimized I\/O for parallel applications","volume":"29","author":"Thakur Rajeev","year":"1996","unstructured":"Rajeev Thakur , Alok Choudhary , Rajesh Bordawekar , Sachin More , and Sivaramakrishna Kuditipudi . Passion : Optimized I\/O for parallel applications . IEEE Computer , 29 ( 6 ): 70 -- 78 , June 1996 .]] Rajeev Thakur, Alok Choudhary, Rajesh Bordawekar, Sachin More, and Sivaramakrishna Kuditipudi. Passion: Optimized I\/O for parallel applications. IEEE Computer, 29(6):70--78, June 1996.]]","journal-title":"IEEE Computer"},{"key":"e_1_3_2_1_32_1","volume-title":"Proceedings of the International Conference on Very Large Databases","author":"Toivonen H.","year":"1996","unstructured":"H. Toivonen . Sampling large databases for associations . In Proceedings of the International Conference on Very Large Databases , 1996 .]] H. Toivonen. Sampling large databases for associations. In Proceedings of the International Conference on Very Large Databases, 1996.]]"},{"key":"e_1_3_2_1_33_1","doi-asserted-by":"publisher","DOI":"10.1145\/3147.3165"},{"key":"e_1_3_2_1_34_1","volume-title":"Proceedings of the International Conference on Knowledge Discovery and Data Mining","author":"Zaki M.","year":"1997","unstructured":"M. Zaki , S. Parthasarathy , M. Ogihara , and W. Li . New algorithms for fast discovery of association rules . In Proceedings of the International Conference on Knowledge Discovery and Data Mining , 1997 .]] M. Zaki, S. Parthasarathy, M. Ogihara, and W. Li. New algorithms for fast discovery of association rules. In Proceedings of the International Conference on Knowledge Discovery and Data Mining, 1997.]]"}],"event":{"name":"ICS05: International Conference on Supercomputing 2005","sponsor":["SIGARCH ACM Special Interest Group on Computer Architecture"],"location":"Cambridge Massachusetts","acronym":"ICS05"},"container-title":["Proceedings of the 19th annual international conference on Supercomputing"],"original-title":[],"link":[{"URL":"https:\/\/dl.acm.org\/doi\/10.1145\/1088149.1088162","content-type":"unspecified","content-version":"vor","intended-application":"text-mining"},{"URL":"https:\/\/dl.acm.org\/doi\/pdf\/10.1145\/1088149.1088162","content-type":"unspecified","content-version":"vor","intended-application":"similarity-checking"}],"deposited":{"date-parts":[[2025,6,18]],"date-time":"2025-06-18T16:08:13Z","timestamp":1750262893000},"score":1,"resource":{"primary":{"URL":"https:\/\/dl.acm.org\/doi\/10.1145\/1088149.1088162"}},"subtitle":[],"short-title":[],"issued":{"date-parts":[[2005,6,20]]},"references-count":34,"alternative-id":["10.1145\/1088149.1088162","10.1145\/1088149"],"URL":"https:\/\/doi.org\/10.1145\/1088149.1088162","relation":{},"subject":[],"published":{"date-parts":[[2005,6,20]]},"assertion":[{"value":"2005-06-20","order":2,"name":"published","label":"Published","group":{"name":"publication_history","label":"Publication History"}}]}}