{"status":"ok","message-type":"work","message-version":"1.0.0","message":{"indexed":{"date-parts":[[2026,3,13]],"date-time":"2026-03-13T05:01:12Z","timestamp":1773378072245,"version":"3.50.1"},"reference-count":24,"publisher":"IEEE","license":[{"start":{"date-parts":[[2021,7,12]],"date-time":"2021-07-12T00:00:00Z","timestamp":1626048000000},"content-version":"stm-asf","delay-in-days":0,"URL":"https:\/\/doi.org\/10.15223\/policy-029"},{"start":{"date-parts":[[2021,7,12]],"date-time":"2021-07-12T00:00:00Z","timestamp":1626048000000},"content-version":"stm-asf","delay-in-days":0,"URL":"https:\/\/doi.org\/10.15223\/policy-037"}],"content-domain":{"domain":[],"crossmark-restriction":false},"short-container-title":[],"published-print":{"date-parts":[[2021,7,12]]},"DOI":"10.1109\/isit45174.2021.9517909","type":"proceedings-article","created":{"date-parts":[[2021,9,1]],"date-time":"2021-09-01T16:52:42Z","timestamp":1630515162000},"page":"3296-3301","source":"Crossref","is-referenced-by-count":3,"title":["Asymptotic Analysis of Data Deduplication with a Constant Number of Substitutions"],"prefix":"10.1109","author":[{"given":"Hao","family":"Lou","sequence":"first","affiliation":[{"name":"University of Virginia,Electrical and Computer Engineering,VA,USA"}],"role":[{"role":"author","vocabulary":"crossref"}]},{"given":"Farzad Farnoud","family":"Hassanzadeh","sequence":"additional","affiliation":[{"name":"University of Virginia,Electrical and Computer Engineering,VA,USA"}],"role":[{"role":"author","vocabulary":"crossref"}]}],"member":"263","reference":[{"key":"ref10","first-page":"419","article-title":"Endre: An end-system redundancy elimination service for enterprises","author":"agarwal","year":"2010","journal-title":"NSDI"},{"key":"ref11","doi-asserted-by":"publisher","DOI":"10.1109\/INFOCOM.2015.7218510"},{"key":"ref12","first-page":"1","article-title":"Leap-based content defined chunking\u2014theory and implementation","author":"yu","year":"2015","journal-title":"2015 31st Symposium on Mass Storage Systems and Technologies (MSST)"},{"key":"ref13","first-page":"239","article-title":"Bimodal content defined chunking for backup streams","author":"kruus","year":"2010","journal-title":"FAST"},{"key":"ref14","doi-asserted-by":"publisher","DOI":"10.1109\/MASCOTS.2010.37"},{"key":"ref15","doi-asserted-by":"publisher","DOI":"10.1109\/ICPP.2013.48"},{"key":"ref16","doi-asserted-by":"crossref","first-page":"860","DOI":"10.1038\/35057062","article-title":"Initial sequencing and analysis of the human genome","volume":"409","author":"lander","year":"2001","journal-title":"Nature"},{"key":"ref17","doi-asserted-by":"publisher","DOI":"10.1109\/JPROC.2016.2571298"},{"key":"ref18","doi-asserted-by":"publisher","DOI":"10.1109\/ISIT44484.2020.9174380"},{"key":"ref19","article-title":"Generalized deduplication: Bounds, convergence, and asymptotic properties","author":"vestergaard","year":"2019","journal-title":"ArXiv Preprint"},{"key":"ref4","doi-asserted-by":"publisher","DOI":"10.1145\/502059.502052"},{"key":"ref3","first-page":"285","article-title":"Primary data deduplication\u2014large scale study and system design","author":"el-shimi","year":"2012","journal-title":"Presented as part of the 2012 USENIX Annual Technical Conference"},{"key":"ref6","doi-asserted-by":"publisher","DOI":"10.1109\/TIT.2019.2916037"},{"key":"ref5","first-page":"89","article-title":"Venti: A new approach to archival storage","volume":"2","author":"quinlan","year":"2002","journal-title":"FAST"},{"key":"ref8","first-page":"1","article-title":"Fingerdiff: Improved duplicate elimination in storage systems","author":"bobbarjung","year":"2006","journal-title":"Proc of the Mass Storage Systems and Technologies (MSST)"},{"key":"ref7","doi-asserted-by":"publisher","DOI":"10.1016\/j.peva.2014.07.016"},{"key":"ref2","doi-asserted-by":"publisher","DOI":"10.1145\/2078861.2078864"},{"key":"ref1","first-page":"1","article-title":"The digital universe in 2020: Big data, bigger digital shadows, and biggest growth in the far east","volume":"2007","author":"gantz","year":"2012","journal-title":"IDC IView IDC Analyze the Future"},{"key":"ref9","author":"teodosiu","year":"2006","journal-title":"Optimizing file replication over limited bandwidth networks using remote differential compression"},{"key":"ref20","doi-asserted-by":"publisher","DOI":"10.1109\/GLOCOM.2018.8647415"},{"key":"ref22","doi-asserted-by":"publisher","DOI":"10.1145\/1210596.1210599"},{"key":"ref21","article-title":"A framework for analyzing and improving content-based chunking algorithms","volume":"30","author":"eshghi","year":"2005","journal-title":"Hewlett-packard Labs Technical Report TR"},{"key":"ref24","author":"sedgewick","year":"2013","journal-title":"An Introduction to the Analysis of Algorithms"},{"key":"ref23","doi-asserted-by":"publisher","DOI":"10.1109\/TIT.1975.1055349"}],"event":{"name":"2021 IEEE International Symposium on Information Theory (ISIT)","location":"Melbourne, Australia","start":{"date-parts":[[2021,7,12]]},"end":{"date-parts":[[2021,7,20]]}},"container-title":["2021 IEEE International Symposium on Information Theory (ISIT)"],"original-title":[],"link":[{"URL":"http:\/\/xplorestaging.ieee.org\/ielx7\/9517708\/9517709\/09517909.pdf?arnumber=9517909","content-type":"unspecified","content-version":"vor","intended-application":"similarity-checking"}],"deposited":{"date-parts":[[2026,3,12]],"date-time":"2026-03-12T20:36:09Z","timestamp":1773347769000},"score":1,"resource":{"primary":{"URL":"https:\/\/ieeexplore.ieee.org\/document\/9517909\/"}},"subtitle":[],"short-title":[],"issued":{"date-parts":[[2021,7,12]]},"references-count":24,"URL":"https:\/\/doi.org\/10.1109\/isit45174.2021.9517909","relation":{},"subject":[],"published":{"date-parts":[[2021,7,12]]}}}