{"status":"ok","message-type":"work","message-version":"1.0.0","message":{"indexed":{"date-parts":[[2024,9,5]],"date-time":"2024-09-05T15:18:44Z","timestamp":1725549524715},"reference-count":24,"publisher":"IEEE","content-domain":{"domain":[],"crossmark-restriction":false},"short-container-title":[],"published-print":{"date-parts":[[2014,6]]},"DOI":"10.1109\/msst.2014.6855542","type":"proceedings-article","created":{"date-parts":[[2014,7,29]],"date-time":"2014-07-29T20:15:45Z","timestamp":1406664945000},"page":"1-11","source":"Crossref","is-referenced-by-count":1,"title":["The case for sampling on very large file systems"],"prefix":"10.1109","author":[{"given":"George","family":"Goldberg","sequence":"first","affiliation":[],"role":[{"role":"author","vocabulary":"crossref"}]},{"given":"Danny","family":"Harnik","sequence":"additional","affiliation":[],"role":[{"role":"author","vocabulary":"crossref"}]},{"given":"Dmitry","family":"Sotnikov","sequence":"additional","affiliation":[],"role":[{"role":"author","vocabulary":"crossref"}]}],"member":"263","reference":[{"key":"19","first-page":"153","article-title":"Spyglass: Fast, scalable metadata search for large-scale storage systems","author":"leung","year":"2009","journal-title":"7th USENIX Conference on File and Storage Technologies (FAST '09)"},{"journal-title":"Introduction to IBM Real-time Compression Appliances","year":"2012","author":"tretau","key":"22"},{"key":"17","doi-asserted-by":"publisher","DOI":"10.1109\/SC.2012.82"},{"key":"23","doi-asserted-by":"publisher","DOI":"10.1145\/3147.3165"},{"journal-title":"An Introduction to Mathematical Statistics and Its Applications Student Solutions Manual","year":"2011","author":"larsen","key":"18"},{"key":"24","doi-asserted-by":"publisher","DOI":"10.1109\/MSST.2013.6558449"},{"journal-title":"Oracle Solaris ZFS Storage Management","year":"2011","author":"kay","key":"15"},{"key":"16","doi-asserted-by":"publisher","DOI":"10.1145\/1374596.1374603"},{"key":"13","first-page":"217","article-title":"Just-in-time analytics on large file systems","author":"huang","year":"2011","journal-title":"9th USENIX Conference on File and Storage Technologies (FAST 2011)"},{"journal-title":"Large Sample Techniques for Statistics","year":"2012","author":"jiang","key":"14"},{"key":"11","first-page":"229","article-title":"To zip or not to zip: Effective resource usage for real-time compression","author":"harnik","year":"2013","journal-title":"Proceedings of the 11th USENIX Conference on File and Storage Technologies (FAST 2013)"},{"key":"12","doi-asserted-by":"publisher","DOI":"10.1080\/01621459.1963.10500830"},{"key":"21","article-title":"Hierarchical file systems are dead","author":"seltzer","year":"2009","journal-title":"Proceedings of the Workshop on Hot Topics in Operating Systems - HOTOS"},{"key":"3","doi-asserted-by":"publisher","DOI":"10.1145\/335168.335230"},{"journal-title":"NetApp Data Compression and Deduplication Deployment and Implementation Guide Data ONTAP Operating in Cluster-Mode","year":"2012","author":"moulton","key":"20"},{"key":"2","doi-asserted-by":"publisher","DOI":"10.1109\/TIT.1987.1057314"},{"key":"1","first-page":"125","article-title":"Generating realistic impressions for file-system benchmarking","author":"agrawal","year":"2009","journal-title":"7th USENIX Conference on File and Storage Technologies (FAST '09)"},{"key":"10","first-page":"311","article-title":"Sampling-based estimation of the number of distinct values of an attribute","author":"haas","year":"1995","journal-title":"VLDB'95 Proceedings of 21th International Conference on Very Large Data Bases"},{"journal-title":"Weighted Random Sampling over Data Streams","year":"2010","author":"efraimidis","key":"7"},{"key":"6","doi-asserted-by":"publisher","DOI":"10.1109\/CCP.2011.41"},{"key":"5","doi-asserted-by":"publisher","DOI":"10.1145\/276304.276343"},{"key":"4","doi-asserted-by":"publisher","DOI":"10.1145\/1007568.1007602"},{"key":"9","doi-asserted-by":"publisher","DOI":"10.1145\/130283.130335"},{"key":"8","first-page":"466","article-title":"Fast incremental maintenance of approximate histograms","author":"gibbons","year":"1997","journal-title":"VLDB'97 Proceedings of 23rd International Conference on Very Large Data Bases"}],"event":{"name":"2014 30th Symposium on Mass Storage Systems and Technologies (MSST)","start":{"date-parts":[[2014,6,2]]},"location":"Santa Clara, CA, USA","end":{"date-parts":[[2014,6,6]]}},"container-title":["2014 30th Symposium on Mass Storage Systems and Technologies (MSST)"],"original-title":[],"link":[{"URL":"http:\/\/xplorestaging.ieee.org\/ielx7\/6849599\/6855532\/06855542.pdf?arnumber=6855542","content-type":"unspecified","content-version":"vor","intended-application":"similarity-checking"}],"deposited":{"date-parts":[[2017,3,23]],"date-time":"2017-03-23T19:16:41Z","timestamp":1490296601000},"score":1,"resource":{"primary":{"URL":"http:\/\/ieeexplore.ieee.org\/document\/6855542\/"}},"subtitle":[],"short-title":[],"issued":{"date-parts":[[2014,6]]},"references-count":24,"URL":"https:\/\/doi.org\/10.1109\/msst.2014.6855542","relation":{},"subject":[],"published":{"date-parts":[[2014,6]]}}}