{"status":"ok","message-type":"work","message-version":"1.0.0","message":{"indexed":{"date-parts":[[2026,3,7]],"date-time":"2026-03-07T19:56:33Z","timestamp":1772913393877,"version":"3.50.1"},"reference-count":28,"publisher":"Springer Science and Business Media LLC","issue":"2","license":[{"start":{"date-parts":[[2018,2,6]],"date-time":"2018-02-06T00:00:00Z","timestamp":1517875200000},"content-version":"tdm","delay-in-days":0,"URL":"http:\/\/www.springer.com\/tdm"}],"content-domain":{"domain":["link.springer.com"],"crossmark-restriction":false},"short-container-title":["J Grid Computing"],"published-print":{"date-parts":[[2018,6]]},"DOI":"10.1007\/s10723-018-9429-3","type":"journal-article","created":{"date-parts":[[2018,2,5]],"date-time":"2018-02-05T22:15:28Z","timestamp":1517868928000},"page":"195-209","update-policy":"https:\/\/doi.org\/10.1007\/springer_crossmark_policy","source":"Crossref","is-referenced-by-count":9,"title":["DCDedupe: Selective Deduplication and Delta Compression with Effective Routing for Distributed Storage"],"prefix":"10.1007","volume":"16","author":[{"ORCID":"https:\/\/orcid.org\/0000-0001-9489-7653","authenticated-orcid":false,"given":"Binqi","family":"Zhang","sequence":"first","affiliation":[]},{"given":"Chen","family":"Wang","sequence":"additional","affiliation":[]},{"given":"Bing Bing","family":"Zhou","sequence":"additional","affiliation":[]},{"given":"Dong","family":"Yuan","sequence":"additional","affiliation":[]},{"given":"Albert Y.","family":"Zomaya","sequence":"additional","affiliation":[]}],"member":"297","published-online":{"date-parts":[[2018,2,6]]},"reference":[{"key":"9429_CR1","doi-asserted-by":"crossref","unstructured":"Shvachko, K., Kuang, H., Radia, S., Chansler, R.: The Hadoop distributed file system. In: 2010 IEEE 26th Symposium on Mass Storage Systems and Technologies (MSST). IEEE, pp. 1\u201310 (2010)","DOI":"10.1109\/MSST.2010.5496972"},{"key":"9429_CR2","doi-asserted-by":"crossref","unstructured":"Meister, D., Brinkmann, A.: Multi-level comparison of data deduplication in a backup scenario. In: Proceedings of SYSTOR 2009: The Israeli Experimental Systems Conference. ACM, p 8 (2009)","DOI":"10.1145\/1534530.1534541"},{"key":"9429_CR3","unstructured":"MacDonald, J.: File system support for delta compression. Masters thesis, Department of Electrical Engineering and Computer Science, University of California at Berkeley (2000)"},{"key":"9429_CR4","unstructured":"Shilane, P., Wallace, G., Huang, M., Hsu, W.: Delta compressed and deduplicated storage using stream-informed locality. In: Proceedings of the 4th USENIX Conference on Hot Topics in Storage and File Systems. USENIX Association, pp. 10\u201310 (2012)"},{"key":"9429_CR5","doi-asserted-by":"crossref","unstructured":"Xia, W., Jiang, H., Feng, D., Tian, L.: Combining deduplication and delta compression to achieve low-overhead data reduction on backup datasets. In: Data Compression Conference (DCC), 2014. IEEE, pp. 203\u2013212 (2014)","DOI":"10.1109\/DCC.2014.38"},{"key":"9429_CR6","unstructured":"Chen, F., Luo, T., Zhang, X.: CAFTL: a content-aware flash translation layer enhancing the lifespan of flash memory based solid state drives. In: FAST, vol. 11 (2011)"},{"key":"9429_CR7","unstructured":"Broder, A.Z.: On the resemblance and containment of documents. In: Compression and Complexity of Sequences 1997. Proceedings. IEEE, pp. 21\u201329 (1997)"},{"key":"9429_CR8","doi-asserted-by":"crossref","unstructured":"Aronovich, L., Asher, R., Bachmat, E., Bitner, H., Hirsch, M., Klein, S.T.: The design of a similarity based deduplication system. In: Proceedings of SYSTOR 2009: The Israeli Experimental Systems Conference. ACM, p 6 (2009)","DOI":"10.1145\/1534530.1534539"},{"issue":"1","key":"9429_CR9","doi-asserted-by":"publisher","first-page":"11","DOI":"10.1145\/2611778","volume":"47","author":"J Paulo","year":"2014","unstructured":"Paulo, J., Pereira, J.: A survey and classification of storage deduplication systems. ACM Comput. Surv. (CSUR) 47(1), 11 (2014)","journal-title":"ACM Comput. Surv. (CSUR)"},{"key":"9429_CR10","unstructured":"Xia, W., Jiang, H., Feng, D., Hua, Y.: SiLo: a similarity-locality based near-exact deduplication scheme with low ram overhead and high throughput. In: USENIX Annual Technical Conference (2011)"},{"key":"9429_CR11","unstructured":"Fu, M., Feng, D., Hua, Y., He, X., Chen, Z., Xia, W., Zhang, Y., Tan, Y.: Design tradeoffs for data deduplication performance in backup workloads. In: 13th USENIX Conference on File and Storage Technologies (FAST 15), pp. 331\u2013344. USENIX Association, Santa Clara (2015). [Online]. Available: https:\/\/www.usenix.org\/conference\/fast15\/technical-sessions\/presentation\/fu"},{"key":"9429_CR12","doi-asserted-by":"crossref","unstructured":"Bhagwat, D., Eshghi, K., Long, D.D., Lillibridge, M.: Extreme binning: scalable, parallel deduplication for chunk-based file backup. In: IEEE International Symposium on Modeling, Analysis & Simulation of Computer and Telecommunication Systems, 2009. MASCOTS\u201909. IEEE, pp. 1\u20139 (2009)","DOI":"10.1109\/MASCOT.2009.5366623"},{"key":"9429_CR13","doi-asserted-by":"publisher","first-page":"258","DOI":"10.1016\/j.peva.2014.07.016","volume":"79","author":"W Xia","year":"2014","unstructured":"Xia, W., Jiang, H., Feng, D., Tian, L., Fu, M., Zhou, Y.: Ddelta: a deduplication-inspired fast delta compression approach. Perform. Eval. 79, 258\u2013272 (2014)","journal-title":"Perform. Eval."},{"key":"9429_CR14","unstructured":"Xdelta: Xdelta. [Online]. Available: https:\/\/xdelta.org\/"},{"issue":"4","key":"9429_CR15","first-page":"13","volume":"8","author":"P Shilane","year":"2012","unstructured":"Shilane, P., Huang, M., Wallace, G., Hsu, W.: Wan-optimized replication of backup datasets using stream-informed delta compression. ACM Trans. Storage (TOS) 8(4), 13 (2012)","journal-title":"ACM Trans. Storage (TOS)"},{"key":"9429_CR16","unstructured":"Zhu, B., Li, K., Patterson R.H.: Avoiding the disk bottleneck in the data domain deduplication file system. In: Fast, vol. 8, pp. 1\u201314 (2008)"},{"key":"9429_CR17","doi-asserted-by":"crossref","unstructured":"Meister, D., Brinkmann, A.: dedupv1: improving deduplication throughput using solid state drives (ssd). In: 2010 IEEE 26th Symposium on Mass Storage Systems and Technologies (MSST). IEEE, pp. 1\u20136 (2010)","DOI":"10.1109\/MSST.2010.5496992"},{"key":"9429_CR18","doi-asserted-by":"crossref","unstructured":"Wildani, A., Miller, E.L., Rodeh, O.: HANDS: a heuristically arranged non-backup in-line deduplication system. In: 2013 IEEE 29th International Conference on Data Engineering (ICDE). IEEE, pp. 446\u2013457 (2013)","DOI":"10.1109\/ICDE.2013.6544846"},{"key":"9429_CR19","doi-asserted-by":"crossref","unstructured":"Zhang, Y., Wu, Y., Yang, G.: Droplet: a distributed solution of data deduplication. In: Proceedings of the 2012 ACM\/IEEE 13th International Conference on Grid Computing. IEEE Computer Society, pp. 114\u2013121 (2012)","DOI":"10.1109\/Grid.2012.21"},{"key":"9429_CR20","doi-asserted-by":"crossref","unstructured":"Jin, K., Miller, E.L.: The effectiveness of deduplication on virtual machine disk images. In: Proceedings of SYSTOR 2009: The Israeli Experimental Systems Conference. ACM, p 7 (2009)","DOI":"10.1145\/1534530.1534540"},{"key":"9429_CR21","doi-asserted-by":"crossref","unstructured":"Tan, Y., Jiang, H., Feng, D., Tian, L., Yan, Z., Zhou, G.: Sam: a semantic-aware multi-tiered source de-duplication framework for cloud backup. In: 2010 39th International Conference on Parallel Processing (ICPP). IEEE, pp. 614\u2013623 (2010)","DOI":"10.1109\/ICPP.2010.69"},{"issue":"5","key":"9429_CR22","doi-asserted-by":"publisher","first-page":"1155","DOI":"10.1109\/TPDS.2013.167","volume":"25","author":"Y Fu","year":"2014","unstructured":"Fu, Y., Jiang, H., Xiao, N., Tian, L., Liu, F., Xu, L.: Application-aware local-global source deduplication for cloud backup services of personal storage. IEEE Trans. Parallel Distrib. Syst. 25 (5), 1155\u20131165 (2014)","journal-title":"IEEE Trans. Parallel Distrib. Syst."},{"key":"9429_CR23","unstructured":"Mandal, S., Kuenning, G., Ok, D., Shastry, V., Shilane, P., Zhen, S., Tarasov, V., Zadok, E.: Using hints to improve inline block-layer deduplication. In: The 14th USENIX Conference on File and Storage Technologies (FAST). Santa Clara (2016)"},{"key":"9429_CR24","unstructured":"Lin, X., Douglis, F., Li, J., Li, X., Ricci, R., Smaldone, S., Wallace, G.: Metadata considered harmful...to deduplication. In: 7th USENIX Workshop on Hot Topics in Storage and File Systems (HotStorage 15) (2015)"},{"key":"9429_CR25","unstructured":"Eshghi, K., Tang, H.K.: A framework for analyzing and improving content-based chunking algorithms. Hewlett-Packard Labs Technical Report TR, vol. 30, p. 2005 (2005)"},{"key":"9429_CR26","doi-asserted-by":"crossref","unstructured":"Zhang, B., Wang, C., Zhou, B. B., Zomaya, A.Y.: Inline data deduplication for ssd-based distributed storage. In: 2015 IEEE 21st International Conference on Parallel and Distributed Systems (ICPADS). IEEE, pp. 593\u2013600 (2015)","DOI":"10.1109\/ICPADS.2015.80"},{"key":"9429_CR27","unstructured":"EMC Corporation: Isilon Scale-Out NAS and Unstructured Data. [Online]. Available: https:\/\/emc.com\/en-us\/storage\/isilon\/index.htm"},{"key":"9429_CR28","unstructured":"Dong, W., Douglis, F., Li, K., Patterson, R.H., Reddy, S., Shilane, P.: Tradeoffs in scalable data routing for deduplication clusters. In: FAST, vol. 11, pp. 15\u201329 (2011)"}],"container-title":["Journal of Grid Computing"],"original-title":[],"language":"en","link":[{"URL":"http:\/\/link.springer.com\/article\/10.1007\/s10723-018-9429-3\/fulltext.html","content-type":"text\/html","content-version":"vor","intended-application":"text-mining"},{"URL":"http:\/\/link.springer.com\/content\/pdf\/10.1007\/s10723-018-9429-3.pdf","content-type":"application\/pdf","content-version":"vor","intended-application":"text-mining"},{"URL":"http:\/\/link.springer.com\/content\/pdf\/10.1007\/s10723-018-9429-3.pdf","content-type":"application\/pdf","content-version":"vor","intended-application":"similarity-checking"}],"deposited":{"date-parts":[[2019,10,10]],"date-time":"2019-10-10T05:22:22Z","timestamp":1570684942000},"score":1,"resource":{"primary":{"URL":"http:\/\/link.springer.com\/10.1007\/s10723-018-9429-3"}},"subtitle":[],"short-title":[],"issued":{"date-parts":[[2018,2,6]]},"references-count":28,"journal-issue":{"issue":"2","published-print":{"date-parts":[[2018,6]]}},"alternative-id":["9429"],"URL":"https:\/\/doi.org\/10.1007\/s10723-018-9429-3","relation":{},"ISSN":["1570-7873","1572-9184"],"issn-type":[{"value":"1570-7873","type":"print"},{"value":"1572-9184","type":"electronic"}],"subject":[],"published":{"date-parts":[[2018,2,6]]},"assertion":[{"value":"28 June 2017","order":1,"name":"received","label":"Received","group":{"name":"ArticleHistory","label":"Article History"}},{"value":"25 January 2018","order":2,"name":"accepted","label":"Accepted","group":{"name":"ArticleHistory","label":"Article History"}},{"value":"6 February 2018","order":3,"name":"first_online","label":"First Online","group":{"name":"ArticleHistory","label":"Article History"}}]}}