{"status":"ok","message-type":"work","message-version":"1.0.0","message":{"indexed":{"date-parts":[[2025,10,27]],"date-time":"2025-10-27T16:14:33Z","timestamp":1761581673488,"version":"3.37.3"},"reference-count":53,"publisher":"Springer Science and Business Media LLC","issue":"3","license":[{"start":{"date-parts":[[2018,3,7]],"date-time":"2018-03-07T00:00:00Z","timestamp":1520380800000},"content-version":"tdm","delay-in-days":0,"URL":"http:\/\/www.springer.com\/tdm"},{"start":{"date-parts":[[2018,3,7]],"date-time":"2018-03-07T00:00:00Z","timestamp":1520380800000},"content-version":"vor","delay-in-days":0,"URL":"http:\/\/www.springer.com\/tdm"}],"funder":[{"DOI":"10.13039\/100000181","name":"Air Force Office of Scientific Research","doi-asserted-by":"publisher","award":["FA9550-14-1-0160"],"award-info":[{"award-number":["FA9550-14-1-0160"]}],"id":[{"id":"10.13039\/100000181","id-type":"DOI","asserted-by":"publisher"}]},{"DOI":"10.13039\/100000001","name":"National Science Foundation","doi-asserted-by":"publisher","award":["CNS-1156574","CNS-1449860"],"award-info":[{"award-number":["CNS-1156574","CNS-1449860"]}],"id":[{"id":"10.13039\/100000001","id-type":"DOI","asserted-by":"publisher"}]},{"DOI":"10.13039\/100000001","name":"National Science Foundation","doi-asserted-by":"publisher","award":["CNS-1527346"],"award-info":[{"award-number":["CNS-1527346"]}],"id":[{"id":"10.13039\/100000001","id-type":"DOI","asserted-by":"publisher"}]}],"content-domain":{"domain":["link.springer.com"],"crossmark-restriction":false},"short-container-title":["Cluster Comput"],"published-print":{"date-parts":[[2018,9]]},"DOI":"10.1007\/s10586-018-2141-z","type":"journal-article","created":{"date-parts":[[2018,3,7]],"date-time":"2018-03-07T13:48:47Z","timestamp":1520430527000},"page":"1561-1579","update-policy":"https:\/\/doi.org\/10.1007\/springer_crossmark_policy","source":"Crossref","is-referenced-by-count":9,"title":["EAD: elasticity aware deduplication manager for datacenters with multi-tier storage systems"],"prefix":"10.1007","volume":"21","author":[{"ORCID":"https:\/\/orcid.org\/0000-0002-9822-5843","authenticated-orcid":false,"given":"Zhengyu","family":"Yang","sequence":"first","affiliation":[],"role":[{"role":"author","vocabulary":"crossref"}]},{"given":"Yufeng","family":"Wang","sequence":"additional","affiliation":[],"role":[{"role":"author","vocabulary":"crossref"}]},{"given":"Janki","family":"Bhamini","sequence":"additional","affiliation":[],"role":[{"role":"author","vocabulary":"crossref"}]},{"given":"Chiu C.","family":"Tan","sequence":"additional","affiliation":[],"role":[{"role":"author","vocabulary":"crossref"}]},{"given":"Ningfang","family":"Mi","sequence":"additional","affiliation":[],"role":[{"role":"author","vocabulary":"crossref"}]}],"member":"297","published-online":{"date-parts":[[2018,3,7]]},"reference":[{"issue":"12","key":"2141_CR1","first-page":"15","volume":"41","author":"D Geer","year":"2008","unstructured":"Geer, D.: Reducing the storage burden via data deduplication. IEEE Trans. Comput. 41(12), 15\u201317 (2008)","journal-title":"IEEE Trans. Comput."},{"unstructured":"Fu, M., Feng, D., Hua, Y., He, X., Chen, Z., Xia, W., Tan, Y.: Design tradeoffs for data deduplication performance in backup workloads. In: 13th USENIX Conference on File and Storage Technologies (FAST 15), pp. 331\u2013344 (2015)","key":"2141_CR2"},{"issue":"6","key":"2141_CR3","doi-asserted-by":"publisher","first-page":"1012","DOI":"10.1007\/s11390-013-1394-5","volume":"28","author":"YJ Fu","year":"2013","unstructured":"Fu, Y.J., Xiao, N., Liao, X.K., Liu, F.: Application-aware client-side data reduction and encryption of personal data in cloud backup services. J. Comput. Sci. Technol. (JCST) 28(6), 1012 (2013)","journal-title":"J. Comput. Sci. Technol. (JCST)"},{"unstructured":"Berliner, B.: Multi-tier cache and method for implementing such a system. US Patent 5,787,466 (1998)","key":"2141_CR4"},{"doi-asserted-by":"crossref","unstructured":"Spillane, R.P., Shetty, P.J., Zadok, E., Dixit, S., Archak, S.: An efficient multi-tier tablet server storage architecture. In: Proceedings of the 2nd ACM Symposium on Cloud Computing, ACM, p. 1 (2011)","key":"2141_CR5","DOI":"10.1145\/2038916.2038917"},{"unstructured":"Lillibridge, M., Eshghi, K., Bhagwat, D., Deolalikar, V., Trezise, G., Camble, P.:Sparse indexing: large scale, inline deduplication using sampling and locality. In: Proccedings of the 7th Conference on File and Storage Technologies (2009)","key":"2141_CR6"},{"unstructured":"Guo, F., Efstathopoulos, P.: Building a high performance deduplication system. In: Proceedings of the 2011 USENIX Conference on USENIX Annual Technical Conference (2011)","key":"2141_CR7"},{"key":"2141_CR8","doi-asserted-by":"publisher","first-page":"1","DOI":"10.1145\/844128.844130","volume":"36","author":"A Adya","year":"2002","unstructured":"Adya, A., Bolosky, W.J., et al.: FARSITE: federated, available, and reliable storage for an incompletely trusted environment. ACM SIGOPS Oper. Syst. Rev. 36, 1\u201314 (2002)","journal-title":"ACM SIGOPS Oper. Syst. Rev."},{"doi-asserted-by":"crossref","unstructured":"Forman, G., Eshghi, K., Chiocchetti, S.: Finding similar files in large document repositories. In: Proceedings of the Eleventh ACM SIGKDD International Conference on Knowledge Discovery in Data Mining (2005)","key":"2141_CR9","DOI":"10.1145\/1081870.1081916"},{"unstructured":"Manber, U., et\u00a0al.: Finding similar files in a large file system. In: Proceedings of the USENIX Winter 1994 Technical Conference (1994)","key":"2141_CR10"},{"doi-asserted-by":"crossref","unstructured":"Broder, A.Z.: Some applications of Rabins fingerprinting method. In: Sequences II, pp. 143\u2013152. Springer, New York (1993)","key":"2141_CR11","DOI":"10.1007\/978-1-4613-9323-8_11"},{"doi-asserted-by":"crossref","unstructured":"Bhagwat, D., Eshghi, K., Long, D.D., Lillibridge, M.: Extreme binning: scalable, parallel deduplication for chunk-based file backup. In: IEEE International Symposium on Modeling, Analysis & Simulation of Computer and Telecommunication Systems, pp. 1\u20139 (2009)","key":"2141_CR12","DOI":"10.1109\/MASCOT.2009.5366623"},{"unstructured":"Dutch, M.: Understanding data deduplication ratios. In: SNIA Data Management Forum, p. 7 (2008)","key":"2141_CR13"},{"unstructured":"Kim, C., Park, K.W., et\u00a0al.: Rethinking deduplication in cloud: From data profiling to blueprint. In: 2011 7th International Conference on Networked Computing and Advanced Information Management (NCM), pp. 101\u2013104 (2011)","key":"2141_CR14"},{"doi-asserted-by":"crossref","unstructured":"Yang, Q., Ren, J.: I-CASH: intelligently coupled array of SSD and HDD. In: 2011 IEEE 17th International Symposium on High Performance Computer Architecture (HPCA), pp. 278\u2013289. IEEE (2011)","key":"2141_CR15","DOI":"10.1109\/HPCA.2011.5749736"},{"doi-asserted-by":"crossref","unstructured":"Harnik, D., Margalit, O., Naor, D., Sotnikov, D., Vernik, G.: Estimation of deduplication ratios in large data sets. In: 2012 IEEE 28th Symposium on Mass Storage Systems and Technologies (MSST) (2012)","key":"2141_CR16","DOI":"10.1109\/MSST.2012.6232381"},{"unstructured":"Hibler, M., Stoller, L.D., et\u00a0al.: Fast, Scalable Disk Imaging with Frisbee. In: USENIX Annual Technical Conference, General Track (2003)","key":"2141_CR17"},{"issue":"7","key":"2141_CR18","doi-asserted-by":"publisher","first-page":"422","DOI":"10.1145\/362686.362692","volume":"13","author":"BH Bloom","year":"1970","unstructured":"Bloom, B.H.: Space\/time trade-offs in hash coding with allowable errors. Commun. ACM 13(7), 422\u2013426 (1970)","journal-title":"Commun. ACM"},{"unstructured":"Wikimedia Downloads Historical Archives. \n                    http:\/\/dumps.wikimedia.org\/archive\/\n                    \n                  . Accessed 04 2013","key":"2141_CR19"},{"unstructured":"OpenfMRI Datasets. \n                    https:\/\/openfmri.org\/data-sets\n                    \n                  . Accessed 05 2013","key":"2141_CR20"},{"unstructured":"Wallace, G., Douglis, F., Qian, H., Shilane, P., Smaldone, S., Chamness, M., Hsu, W.: Characteristics of backup workloads in production systems. In: FAST, vol. 12 (2012)","key":"2141_CR21"},{"doi-asserted-by":"crossref","unstructured":"Zhou, R., Liu, M., Li, T.: Characterizing the efficiency of data deduplication for big data storage management. In: 2013 IEEE International Symposium on Workload Characterization (IISWC), pp. 98\u2013108. IEEE (2013)","key":"2141_CR22","DOI":"10.1109\/IISWC.2013.6704674"},{"doi-asserted-by":"crossref","unstructured":"O\u2019Neil, E., O\u2019Neil, P., Weikum, G.: The LRU-K page replacement algorithm for database disk buffering. In: Proceedings of the 1993 ACM SIGMOD International Conference on Management of data, Washington, DC, pp. 297\u2013306 (1993)","key":"2141_CR23","DOI":"10.1145\/170036.170081"},{"issue":"2","key":"2141_CR24","doi-asserted-by":"publisher","first-page":"78","DOI":"10.1147\/sj.52.0078","volume":"5","author":"LA Belady","year":"1966","unstructured":"Belady, L.A.: A study of replacement algorithms for a virtual-storage computer. IBM Syst. J. 5(2), 78\u2013101 (1966)","journal-title":"IBM Syst. J."},{"unstructured":"Megiddo, N., Modha, D.: ARC: a self-tuning, low overhead replacement cache. In: Proceedings of the 2nd USENIX Conference on File and Storage Technologies, San Francisco, CA, pp. 115\u2013130 (2003)","key":"2141_CR25"},{"unstructured":"Bansal, S., Modha, D.S.: CAR: clock with adaptive replacement. In: Proceedings of the 2th USENIX Conference on File and Storage Technologies, vol. 4, pp. 187\u2013200 (2004)","key":"2141_CR26"},{"unstructured":"Sabaa, A., Kumar, P.D., et\u00a0al.: Inline wire speed deduplication system. US Patent App. 12\/797,032 (2010)","key":"2141_CR27"},{"unstructured":"You, L.L., Karamanolis, C.: Evaluation of efficient archival storage techniques. In: Proceedings of the 21st IEEE\/12th NASA Goddard Conference on Mass Storage Systems and Technologies (2004)","key":"2141_CR28"},{"unstructured":"Kruus, E., Ungureanu, C., Dubnicki, C.: Bimodal content defined chunking for backup streams. In: Proceedings of the 8th USENIX Conference on File and Storage Technologies (2010)","key":"2141_CR29"},{"issue":"6","key":"2141_CR30","doi-asserted-by":"publisher","first-page":"824","DOI":"10.1109\/TC.2010.263","volume":"60","author":"J Min","year":"2011","unstructured":"Min, J., Yoon, D., Won, Y.: Efficient deduplication techniques for modern backup operation. IEEE Trans. Comput. 60(6), 824\u2013840 (2011)","journal-title":"IEEE Trans. Comput."},{"issue":"5","key":"2141_CR31","doi-asserted-by":"publisher","first-page":"174","DOI":"10.1145\/502059.502052","volume":"35","author":"Athicha Muthitacharoen","year":"2001","unstructured":"Muthitacharoen, A., Chen, B., Mazieres, D.: A low-bandwidth network file system. In: ACM SIGOPS Operating Systems Review, vol. 35, pp. 174\u2013187 (2001)","journal-title":"ACM SIGOPS Operating Systems Review"},{"unstructured":"Eshghi, K., Tang, H.K.: A framework for analyzing and improving content-based chunking algorithms, Hewlett-Packard Labs Technical Report TR (2005)","key":"2141_CR32"},{"unstructured":"Xia, W., Jiang, H.D., et\u00a0al.: Silo: a similarity-locality based near-exact deduplication scheme with low ram overhead and high throughput. In: Proceedings of USENIX Annual Technical Conference (2011)","key":"2141_CR33"},{"unstructured":"Debnath, B.K., Sengupta, S., Li, J.: ChunkStash: speeding up inline storage deduplication using flash memory. In: USENIX Annual Technical Conference (2010)","key":"2141_CR34"},{"doi-asserted-by":"crossref","unstructured":"Feng, J., Schindler, J.: A deduplication study for host-side caches in virtualized data center environments. In: 2013 IEEE 29th Symposium on Mass Storage Systems and Technologies (MSST), pp. 1\u20136. IEEE (2013)","key":"2141_CR35","DOI":"10.1109\/MSST.2013.6558437"},{"unstructured":"Li, C., Shilane, P., Douglis, F., Shim, H., Smaldone, S., Wallace, G.: Nitro: a capacity-optimized SSD cache for primary storage. In: 2014 USENIX Annual Technical Conference (USENIX ATC 14), pp. 501\u2013512 (2014)","key":"2141_CR36"},{"doi-asserted-by":"crossref","unstructured":"Wang, Y., Tan, C.C., Mi, N.: Using elasticity to improve inline data deduplication storage systems. In: 2014 IEEE 7th International Conference on Cloud Computing (CLOUD), pp. 785\u2013792. IEEE (2014)","key":"2141_CR37","DOI":"10.1109\/CLOUD.2014.109"},{"unstructured":"Zhu, B., Li, K., Patterson, H.: Avoiding the disk bottleneck in the data domain deduplication file system. In: Proceedings of the 6th USENIX Conference on File and Storage Technologies (2008)","key":"2141_CR38"},{"doi-asserted-by":"crossref","unstructured":"Lu, G., Jin, Y., Du, D.H.: Frequency based chunking for data de-duplication, In: 2010 IEEE International Symposium on Modeling, Analysis and Simulation of Computer and Telecommunication Systems. MASCOTS, pp. 287\u2013296. IEEE (2010)","key":"2141_CR39","DOI":"10.1109\/MASCOTS.2010.37"},{"doi-asserted-by":"crossref","unstructured":"Kampe, M., Stenstrom, P., Dubois, M.: Self-correcting LRU Replacement Policies. In: Proceedings of the 1st Conference on Computing frontiers, Ischia, Italy, pp. 181\u2013191 (2004)","key":"2141_CR40","DOI":"10.1145\/977091.977117"},{"unstructured":"Johnson, T., Shasha, D.: 2Q: a low overhead high performance buffer management replacement algorithm. In: Proceedings of the 20th International Conference on Very Large Data Bases, San Francisco, CA, pp. 439\u2013450 (1994)","key":"2141_CR41"},{"unstructured":"Zhou, Y., Philbin, J., Li, K.: The multi-queue replacement algorithm for second level buffer caches. In: Proceedings of the 2001 USENIX Annual Technical Conference, Boston, MA, pp. 91\u2013104 (2001)","key":"2141_CR42"},{"issue":"12","key":"2141_CR43","doi-asserted-by":"publisher","first-page":"1352","DOI":"10.1109\/TC.2001.970573","volume":"50","author":"D Lee","year":"2001","unstructured":"Lee, D., Choi, J., Kim, J.H., Noh, S., Min, S.L., Cho, Y., Kim, C.S.: LRFU: a spectrum of policies that subsumes the least recently used and least frequently used policies. IEEE Trans. Comput. 50(12), 1352\u20131361 (2001)","journal-title":"IEEE Trans. Comput."},{"unstructured":"Guerra, J., Pucha, H., Glider, J., Belluomini, W., Rangaswami, R.: Cost effective storage using extent based dynamic tiering. In: Proceedings of the 9th USENIX Conference on File and Storage Technologies, San Jose, CA (2011)","key":"2141_CR44"},{"issue":"3","key":"2141_CR45","doi-asserted-by":"publisher","first-page":"537","DOI":"10.1109\/TCC.2015.2424886","volume":"5","author":"J Tai","year":"2017","unstructured":"Tai, J., Liu, D., Yang, Z., Zhu, X., Lo, J., Mi, N.: Improving flash resource utilization at minimal management cost in virtualized flash-based storage systems. IEEE Trans. Cloud Comput. 5(3), 537\u2013549 (2017)","journal-title":"IEEE Trans. Cloud Comput."},{"doi-asserted-by":"crossref","unstructured":"Yang, Z., Awasthi, M., Ghosh, M., Mi, N.: A fresh perspective on total cost of ownership models for flash storage in datacenters. In: 2016 IEEE 8th International Conference on Cloud Computing Technology and Science. IEEE (2016)","key":"2141_CR46","DOI":"10.1109\/CloudCom.2016.0049"},{"unstructured":"Yang, Z., Ghosh, M., Awasthi, M., Balakrishnan, V.: Online flash resource allocation manager based on TCO model (2016)","key":"2141_CR47"},{"unstructured":"Yang, Z., Ghosh, M., Awasthi, M., Balakrishnan, V.: Online flash resource migration, allocation, retire and replacement manager based on a cost of ownership model (2016)","key":"2141_CR48"},{"doi-asserted-by":"crossref","unstructured":"Roemer, J., Groman, M., Yang, Z., Wang, Y., Tan, C.C., Mi, N.: Improving virtual machine migration via deduplication. In: 2014 IEEE 11th International Conference on Mobile Ad Hoc and Sensor Systems, pp. 702\u2013707. IEEE (2014)","key":"2141_CR49","DOI":"10.1109\/MASS.2014.74"},{"doi-asserted-by":"crossref","unstructured":"Bhimani, J., Yang, J., Yang, Z., Mi, N., Xu, Q., Awasthi, M., Pandurangan, R., Balakrishnan, V.: Understanding performance of I\/O intensive containerized applications for NVMe SSDs. In: 35th IEEE International Performance Computing and Communications Conference (IPCCC). IEEE d(2016)","key":"2141_CR50","DOI":"10.1109\/PCCC.2016.7820650"},{"key":"2141_CR51","doi-asserted-by":"publisher","first-page":"57","DOI":"10.1016\/j.future.2016.05.028","volume":"65","author":"S Farokhi","year":"2016","unstructured":"Farokhi, S., Jamshidi, P., Lakew, E.B., Brandic, I., Elmroth, E.: A hybrid cloud controller for vertical memory elasticity: a control-theoretic approach. Future Gener. Comput. Syst. 65, 57\u201372 (2016)","journal-title":"Future Gener. Comput. Syst."},{"doi-asserted-by":"crossref","unstructured":"Tang, H., Cui, Y., Guan, C., Wu, J., Weng, J., Ren, K.: Enabling Ciphertext Deduplication for Secure Cloud Storage and Access Control. In: Proceedings of the 11th ACM on Asia Conference on Computer and Communications Security, ACM, pp. 59\u201370 (2016)","key":"2141_CR52","DOI":"10.1145\/2897845.2897846"},{"doi-asserted-by":"crossref","unstructured":"Nicolae, B.: Towards scalable checkpoint restart: A collective inline memory contents deduplication proposal. In: 2013 IEEE 27th International Symposium on Parallel & Distributed Processing (IPDPS), pp. 19\u201328. IEEE (2013)","key":"2141_CR53","DOI":"10.1109\/IPDPS.2013.14"}],"container-title":["Cluster Computing"],"original-title":[],"language":"en","link":[{"URL":"http:\/\/link.springer.com\/article\/10.1007\/s10586-018-2141-z\/fulltext.html","content-type":"text\/html","content-version":"vor","intended-application":"text-mining"},{"URL":"http:\/\/link.springer.com\/content\/pdf\/10.1007\/s10586-018-2141-z.pdf","content-type":"application\/pdf","content-version":"vor","intended-application":"text-mining"},{"URL":"http:\/\/link.springer.com\/content\/pdf\/10.1007\/s10586-018-2141-z.pdf","content-type":"application\/pdf","content-version":"vor","intended-application":"similarity-checking"}],"deposited":{"date-parts":[[2020,5,17]],"date-time":"2020-05-17T15:16:40Z","timestamp":1589728600000},"score":1,"resource":{"primary":{"URL":"http:\/\/link.springer.com\/10.1007\/s10586-018-2141-z"}},"subtitle":[],"short-title":[],"issued":{"date-parts":[[2018,3,7]]},"references-count":53,"journal-issue":{"issue":"3","published-print":{"date-parts":[[2018,9]]}},"alternative-id":["2141"],"URL":"https:\/\/doi.org\/10.1007\/s10586-018-2141-z","relation":{},"ISSN":["1386-7857","1573-7543"],"issn-type":[{"type":"print","value":"1386-7857"},{"type":"electronic","value":"1573-7543"}],"subject":[],"published":{"date-parts":[[2018,3,7]]},"assertion":[{"value":"5 May 2017","order":1,"name":"received","label":"Received","group":{"name":"ArticleHistory","label":"Article History"}},{"value":"3 January 2018","order":2,"name":"revised","label":"Revised","group":{"name":"ArticleHistory","label":"Article History"}},{"value":"10 February 2018","order":3,"name":"accepted","label":"Accepted","group":{"name":"ArticleHistory","label":"Article History"}},{"value":"7 March 2018","order":4,"name":"first_online","label":"First Online","group":{"name":"ArticleHistory","label":"Article History"}}]}}