{"status":"ok","message-type":"work","message-version":"1.0.0","message":{"indexed":{"date-parts":[[2025,10,9]],"date-time":"2025-10-09T16:32:01Z","timestamp":1760027521105,"version":"3.28.0"},"reference-count":26,"publisher":"IEEE","content-domain":{"domain":[],"crossmark-restriction":false},"short-container-title":[],"published-print":{"date-parts":[[2014,4]]},"DOI":"10.1109\/infocom.2014.6847984","type":"proceedings-article","created":{"date-parts":[[2014,7,29]],"date-time":"2014-07-29T15:18:13Z","timestamp":1406647093000},"page":"592-600","source":"Crossref","is-referenced-by-count":15,"title":["SAP: Similarity-aware partitioning for efficient cloud storage"],"prefix":"10.1109","author":[{"given":"Bharath","family":"Balasubramanian","sequence":"first","affiliation":[]},{"given":"Tian","family":"Lan","sequence":"additional","affiliation":[]},{"given":"Mung","family":"Chiang","sequence":"additional","affiliation":[]}],"member":"263","reference":[{"key":"19","doi-asserted-by":"publisher","DOI":"10.1145\/2078861.2078864"},{"key":"17","first-page":"2","article-title":"Finding similar files in a large file system","author":"manber","year":"0","journal-title":"WTEC'94 Proceedings of the USENIX Winter 1994 Technical Conference on USENIX Winter 1994 Technical Conference"},{"key":"18","first-page":"4","article-title":"Glimpse: A tool to search through entire file systems","author":"manber","year":"0","journal-title":"WTEC'94 Proceedings of the USENIX Winter 1994 Technical Conference on USENIX Winter 1994 Technical Conference"},{"key":"15","first-page":"219","article-title":"Engineering a differencing and compression data format","author":"korn","year":"2002","journal-title":"Proceedings of the General Track of the Annual Conference on USENIX Annual Technical Conference ATEC '02"},{"journal-title":"A separator theorem for planar graphs","year":"1977","author":"lipton","key":"16"},{"key":"13","doi-asserted-by":"publisher","DOI":"10.1007\/978-3-540-30538-5_29"},{"key":"14","doi-asserted-by":"publisher","DOI":"10.1145\/1644893.1644918"},{"key":"11","first-page":"1199","article-title":"Rcfile: A fast and space-efficient data placement structure in mapreducebased warehouse systems","author":"he","year":"0","journal-title":"Proceedings of the 2011 IEEE 27th International Conference on Data Engineering ICDE '11"},{"key":"12","first-page":"301","article-title":"Duplicate data elimination in a SAN file system","author":"hong","year":"2004","journal-title":"22nd IEEE \/ 13th NASA Goddard Conference on Mass Storage Systems and Technologies (MSST)"},{"key":"21","article-title":"Venti: A new approach to archival data storage","author":"quinlan","year":"2002","journal-title":"Proceedings of the 1st USENIX Conference on File and Storage Technologies FAST '02"},{"key":"20","first-page":"257","article-title":"Clusterbased delta compression of a collection of files","author":"ouyang","year":"2002","journal-title":"Proceedings of the 3rd International Conference on Web Information Systems Engineering WISE '02"},{"journal-title":"A Comparison of Document Clustering Techniques","year":"2000","author":"steinbach","key":"22"},{"key":"23","doi-asserted-by":"publisher","DOI":"10.1002\/spe.4380150703"},{"journal-title":"Compression File Collections with A Tsp-based Approach","year":"2004","author":"trendafilov","key":"24"},{"key":"25","doi-asserted-by":"publisher","DOI":"10.1016\/j.dam.2006.10.012"},{"key":"26","first-page":"181","article-title":"Avoiding the disk bottleneck in the data domain deduplication file system","author":"zhu","year":"2008","journal-title":"Proceedings of the 6th USENIX Conference on File and Storage Technologies FAST'08"},{"journal-title":"SAP Similarity-aware Partitioning for Efficient Cloud Storage","year":"2013","author":"balasubramanian","key":"3"},{"key":"2","doi-asserted-by":"publisher","DOI":"10.1109\/WCRE.1995.514697"},{"key":"10","doi-asserted-by":"crossref","first-page":"601","DOI":"10.1017\/S0305004100068857","article-title":"A new method for generating bonferronitype inequalities by iteration","volume":"107","author":"galambos","year":"1998","journal-title":"Mathematical Proceedings of the Cambridge Philosophical Society"},{"key":"1","doi-asserted-by":"publisher","DOI":"10.1109\/DCC.2001.917151"},{"key":"7","doi-asserted-by":"publisher","DOI":"10.1109\/ICDCS.2002.1022312"},{"key":"6","first-page":"8","article-title":"Decentralized deduplication in san cluster file systems","author":"clements","year":"0","journal-title":"Proceedings of the 2009 Conference on USENIX Annual Technical Conference USENIX"},{"key":"5","doi-asserted-by":"publisher","DOI":"10.1145\/266220.266223"},{"key":"4","doi-asserted-by":"publisher","DOI":"10.1145\/1879141.1879175"},{"key":"9","doi-asserted-by":"publisher","DOI":"10.1145\/1081870.1081916"},{"key":"8","first-page":"113","article-title":"Application-specific delta-encoding via resemblance detection","author":"douglis","year":"2003","journal-title":"Proc General Track 2003 Usenix Ann Technical Conf"}],"event":{"name":"IEEE INFOCOM 2014 - IEEE Conference on Computer Communications","start":{"date-parts":[[2014,4,27]]},"location":"Toronto, ON, Canada","end":{"date-parts":[[2014,5,2]]}},"container-title":["IEEE INFOCOM 2014 - IEEE Conference on Computer Communications"],"original-title":[],"link":[{"URL":"http:\/\/xplorestaging.ieee.org\/ielx7\/6839150\/6847911\/06847984.pdf?arnumber=6847984","content-type":"unspecified","content-version":"vor","intended-application":"similarity-checking"}],"deposited":{"date-parts":[[2017,6,22]],"date-time":"2017-06-22T17:29:40Z","timestamp":1498152580000},"score":1,"resource":{"primary":{"URL":"http:\/\/ieeexplore.ieee.org\/document\/6847984\/"}},"subtitle":[],"short-title":[],"issued":{"date-parts":[[2014,4]]},"references-count":26,"URL":"https:\/\/doi.org\/10.1109\/infocom.2014.6847984","relation":{},"subject":[],"published":{"date-parts":[[2014,4]]}}}