{"status":"ok","message-type":"work","message-version":"1.0.0","message":{"indexed":{"date-parts":[[2025,10,29]],"date-time":"2025-10-29T06:29:02Z","timestamp":1761719342860,"version":"3.44.0"},"publisher-location":"New York, NY, USA","reference-count":54,"publisher":"ACM","license":[{"start":{"date-parts":[[2025,3,30]],"date-time":"2025-03-30T00:00:00Z","timestamp":1743292800000},"content-version":"vor","delay-in-days":0,"URL":"https:\/\/www.acm.org\/publications\/policies\/copyright_policy#Background"}],"content-domain":{"domain":["dl.acm.org"],"crossmark-restriction":true},"short-container-title":[],"published-print":{"date-parts":[[2025,3,30]]},"DOI":"10.1145\/3689031.3717493","type":"proceedings-article","created":{"date-parts":[[2025,3,26]],"date-time":"2025-03-26T06:25:20Z","timestamp":1742970320000},"page":"1026-1043","update-policy":"https:\/\/doi.org\/10.1145\/crossmark-policy","source":"Crossref","is-referenced-by-count":1,"title":["Garbage Collection Does Not Only Collect Garbage: Piggybacking-Style Defragmentation for Deduplicated Backup Storage"],"prefix":"10.1145","author":[{"ORCID":"https:\/\/orcid.org\/0009-0007-9702-6678","authenticated-orcid":false,"given":"Dingbang","family":"Liu","sequence":"first","affiliation":[{"name":"Harbin Institute of Technology, Shenzhen, China"}]},{"ORCID":"https:\/\/orcid.org\/0000-0001-5104-8301","authenticated-orcid":false,"given":"Xiangyu","family":"Zou","sequence":"additional","affiliation":[{"name":"Harbin Institute of Technology, Shenzhen, China"}]},{"ORCID":"https:\/\/orcid.org\/0000-0003-2362-2446","authenticated-orcid":false,"given":"Tao","family":"Lu","sequence":"additional","affiliation":[{"name":"DapuStor, Shenzhen, China"}]},{"ORCID":"https:\/\/orcid.org\/0000-0003-1235-0502","authenticated-orcid":false,"given":"Philip","family":"Shilane","sequence":"additional","affiliation":[{"name":"Dell Technologies, Boston, USA"}]},{"ORCID":"https:\/\/orcid.org\/0000-0003-4093-6391","authenticated-orcid":false,"given":"Wen","family":"Xia","sequence":"additional","affiliation":[{"name":"Harbin Institute of Technology, Shenzhen, China"}]},{"ORCID":"https:\/\/orcid.org\/0009-0005-9410-3493","authenticated-orcid":false,"given":"Wenxuan","family":"Huang","sequence":"additional","affiliation":[{"name":"Harbin Institute of Technology, Shenzhen, China"}]},{"ORCID":"https:\/\/orcid.org\/0009-0007-7832-0599","authenticated-orcid":false,"given":"Yanqi","family":"Pan","sequence":"additional","affiliation":[{"name":"Harbin Institute of Technology, Shenzhen, China"}]},{"ORCID":"https:\/\/orcid.org\/0009-0003-8305-2171","authenticated-orcid":false,"given":"Hao","family":"Huang","sequence":"additional","affiliation":[{"name":"Harbin Institute of Technology, Shenzhen, China"}]}],"member":"320","published-online":{"date-parts":[[2025,3,30]]},"reference":[{"key":"e_1_3_2_1_1_1","doi-asserted-by":"publisher","DOI":"10.1109\/MC.2017.187"},{"key":"e_1_3_2_1_2_1","doi-asserted-by":"publisher","DOI":"10.5555\/2813767.2813779"},{"key":"e_1_3_2_1_3_1","doi-asserted-by":"publisher","DOI":"10.5555\/2591272.2591282"},{"volume-title":"Proceedings of the 17th USENIX Conference on File and Storage Technologies (FAST '19)","author":"Cao Zhichao","key":"e_1_3_2_1_4_1","unstructured":"Zhichao Cao, Shiyong Liu, Fenggang Wu, Guohua Wang, Bingzhe Li, and David H. C. Du. 2019. Sliding Look-Back Window Assisted Data Chunk Rewriting for Improving Deduplication Restore Performance. In Proceedings of the 17th USENIX Conference on File and Storage Technologies (FAST '19). 129--142."},{"key":"e_1_3_2_1_5_1","doi-asserted-by":"publisher","DOI":"10.1109\/TPDS.2023.3299309"},{"key":"e_1_3_2_1_6_1","doi-asserted-by":"publisher","DOI":"10.1145\/3472456.3472485"},{"key":"e_1_3_2_1_7_1","volume-title":"The Digitization of the World From Edge to Core. IDC White Paper","author":"David Reinsel John Rydning","year":"2018","unstructured":"John Rydning David Reinsel, John Gantz. 2018. The Digitization of the World From Edge to Core. IDC White Paper (2018), 1--28."},{"key":"e_1_3_2_1_8_1","volume-title":"Proceedings of the 2010 USENIX Annual Technical Conference (USENIX ATC '10).","author":"Debnath Biplob","year":"2010","unstructured":"Biplob Debnath, Sudipta Sengupta, and Jin Li. 2010. ChunkStash: Speeding Up Inline Storage Deduplication Using Flash Memory. In Proceedings of the 2010 USENIX Annual Technical Conference (USENIX ATC '10)."},{"key":"e_1_3_2_1_9_1","doi-asserted-by":"publisher","DOI":"10.1109\/TC.2024.3363456"},{"volume-title":"Proceedings of the 15th USENIX Conference on File and Storage Technologies (FAST '17)","author":"Douglis Fred","key":"e_1_3_2_1_10_1","unstructured":"Fred Douglis, Abhinav Duggal, Philip Shilane, Tony Wong, Shiqin Yan, and Fabiano C. Botelho. 2017. The Logic of Physical Garbage Collection in Deduplicating Storage. In Proceedings of the 15th USENIX Conference on File and Storage Technologies (FAST '17). 29--44."},{"key":"e_1_3_2_1_11_1","volume-title":"Proceedings of the 2019 USENIX Annual Technical Conference (USENIX ATC '19). 647--660","author":"Duggal Abhinav","year":"2019","unstructured":"Abhinav Duggal, Fani Jenkins, Philip Shilane, Ramprasad Chinthekindi, Ritesh Shah, and Mahesh Kamat. 2019. Data Domain Cloud Tier: Backup here, backup there, deduplicated everywhere!. In Proceedings of the 2019 USENIX Annual Technical Conference (USENIX ATC '19). 647--660."},{"key":"e_1_3_2_1_12_1","doi-asserted-by":"publisher","DOI":"10.1109\/TPDS.2015.2410781"},{"key":"e_1_3_2_1_13_1","unstructured":"John Gilmore Jay Fenlason et al. 1992. GNU tar: an archiver tool. (1992)."},{"key":"e_1_3_2_1_14_1","volume-title":"The State of Data Protection and Disaster Recovery Readiness","author":"Goodwin Phil","year":"2021","unstructured":"Phil Goodwin. 2021. The State of Data Protection and Disaster Recovery Readiness: 2021. IDC White Paper (2021), 1--12."},{"key":"e_1_3_2_1_15_1","volume-title":"The State of Ransomware and Disaster Preparedness","author":"Goodwin Phil","year":"2022","unstructured":"Phil Goodwin. 2022. The State of Ransomware and Disaster Preparedness: 2022. IDC White Paper (2022), 1--12."},{"key":"e_1_3_2_1_16_1","volume-title":"The State of Disaster Recovery and Cyber-Recovery","author":"Goodwin Phil","year":"2024","unstructured":"Phil Goodwin. 2024. The State of Disaster Recovery and Cyber-Recovery, 2024--2025: Factoring in AI. IDC White Paper (2024), 1--21."},{"key":"e_1_3_2_1_17_1","volume-title":"Proceedings of 2011 USENIX Annual Technical Conference (USENIX ATC '11). 1--14","author":"Guo Fanglu","year":"2011","unstructured":"Fanglu Guo and Petros Efstathopoulos. 2011. Building a High-performance Deduplication System. In Proceedings of 2011 USENIX Annual Technical Conference (USENIX ATC '11). 1--14."},{"key":"e_1_3_2_1_18_1","volume-title":"Proceedings of the 2017 USENIX Annual Technical Conference (USENIX ATC '17). 759--771","author":"Hahn Sangwook Shane","year":"2017","unstructured":"Sangwook Shane Hahn, Sungjin Lee, Cheng Ji, Li-Pin Chang, Inhyuk Yee, Liang Shi, Chun Jason Xue, and Jihong Kim. 2017. Improving File System Performance of Mobile Storage Systems Using a Decoupled Defragmenter. In Proceedings of the 2017 USENIX Annual Technical Conference (USENIX ATC '17). 759--771."},{"key":"e_1_3_2_1_19_1","doi-asserted-by":"publisher","DOI":"10.1109\/TMC.2018.2869737"},{"key":"e_1_3_2_1_20_1","doi-asserted-by":"publisher","DOI":"10.5555\/3026852.3026868"},{"key":"e_1_3_2_1_21_1","volume-title":"Proceedings of the 22nd USENIX Conference on File and Storage Technologies (FAST '24)","author":"Jun Yuhun","year":"2024","unstructured":"Yuhun Jun, Shin-Hyun Park, Jeong-Uk Kang, Sang-Hoon Kim, and Euiseong Seo. 2024. We Ain't Afraid of No File Fragmentation: Causes and Prevention of Its Performance Impact on Modern Flash SSDs. In Proceedings of the 22nd USENIX Conference on File and Storage Technologies (FAST '24). 193--208."},{"key":"e_1_3_2_1_22_1","doi-asserted-by":"publisher","DOI":"10.1145\/2741948.2741952"},{"key":"e_1_3_2_1_23_1","doi-asserted-by":"publisher","DOI":"10.1109\/TKDE.2024.3511334"},{"key":"e_1_3_2_1_24_1","doi-asserted-by":"publisher","DOI":"10.1145\/3342195.3387531"},{"key":"e_1_3_2_1_25_1","doi-asserted-by":"publisher","DOI":"10.5555\/2591272.2591292"},{"key":"e_1_3_2_1_26_1","volume-title":"Proceedings of the 7th USENIX Conference on File and Storage Technologies (FAST '09)","author":"Lillibridge Mark","year":"2009","unstructured":"Mark Lillibridge, Kave Eshghi, Deepavali Bhagwat, Vinay Deolalikar, Greg Trezise, and Peter Camble. 2009. Sparse Indexing: Large Scale, Inline Deduplication Using Sampling and Locality. In Proceedings of the 7th USENIX Conference on File and Storage Technologies (FAST '09)."},{"key":"e_1_3_2_1_27_1","doi-asserted-by":"publisher","DOI":"10.1145\/2078861.2078864"},{"key":"e_1_3_2_1_28_1","doi-asserted-by":"publisher","DOI":"10.1145\/3357223.3362731"},{"key":"e_1_3_2_1_29_1","doi-asserted-by":"publisher","DOI":"10.1109\/TCAD.2024.3375792"},{"key":"e_1_3_2_1_30_1","doi-asserted-by":"publisher","DOI":"10.1109\/TCAD.2024.3435681"},{"key":"e_1_3_2_1_31_1","doi-asserted-by":"publisher","DOI":"10.1145\/3477132.3483593"},{"key":"e_1_3_2_1_32_1","doi-asserted-by":"publisher","DOI":"10.1109\/ICCD56317.2022.00052"},{"key":"e_1_3_2_1_33_1","doi-asserted-by":"publisher","DOI":"10.1145\/3492321.3524272"},{"key":"e_1_3_2_1_34_1","doi-asserted-by":"publisher","DOI":"10.1145\/2485732.2485753"},{"key":"e_1_3_2_1_35_1","doi-asserted-by":"publisher","DOI":"10.1145\/3664817"},{"key":"e_1_3_2_1_36_1","volume-title":"Proceedings of the 2012 USENIX Annual Technical Conference (USENIX ATC '12). 261--272","author":"Tarasov Vasily","year":"2012","unstructured":"Vasily Tarasov, Amar Mudrankit, Will Buik, Philip Shilane, Geoff Kuenning, and Erez Zadok. 2012. Generating Realistic Datasets for Deduplication Analysis. In Proceedings of the 2012 USENIX Annual Technical Conference (USENIX ATC '12). 261--272."},{"volume-title":"Purpose-Built Backup Appliance (PBBA): The Ultimate Guide. Veritas White Paper","year":"2024","key":"e_1_3_2_1_37_1","unstructured":"Veritas. 2024. Purpose-Built Backup Appliance (PBBA): The Ultimate Guide. Veritas White Paper (2024), 1--10."},{"key":"e_1_3_2_1_38_1","doi-asserted-by":"publisher","DOI":"10.5555\/2208461.2208465"},{"key":"e_1_3_2_1_39_1","doi-asserted-by":"publisher","DOI":"10.1109\/ICCD56317.2022.00034"},{"key":"e_1_3_2_1_40_1","volume-title":"A cost-efficient resemblance detection scheme for post-deduplication delta compression in backup systems. Concurrency and Computation: Practice and Experience 34, 3","author":"Wang Chunzhi","year":"2022","unstructured":"Chunzhi Wang, Yanlin Fu, Junyi Yan, Xinyun Wu, Yucheng Zhang, Huiling Xia, and Ye Yuan. 2022. A cost-efficient resemblance detection scheme for post-deduplication delta compression in backup systems. Concurrency and Computation: Practice and Experience 34, 3 (2022)."},{"key":"e_1_3_2_1_41_1","doi-asserted-by":"publisher","DOI":"10.1109\/TPDS.2024.3447221"},{"key":"e_1_3_2_1_42_1","doi-asserted-by":"publisher","DOI":"10.1109\/TPDS.2018.2852642"},{"key":"e_1_3_2_1_43_1","doi-asserted-by":"publisher","DOI":"10.1109\/JPROC.2016.2571298"},{"key":"e_1_3_2_1_44_1","volume-title":"Proceedings of the 7th USENIX Workshop on Hot Topics in Storage and File Systems (HotStorage '15)","author":"Xia Wen","year":"2015","unstructured":"Wen Xia, Chunguang Li, Hong Jiang, Dan Feng, Yu Hua, Leihua Qin, and Yucheng Zhang. 2015. Edelta: A Word-Enlarging Based Fast Delta Compression Approach. In Proceedings of the 7th USENIX Workshop on Hot Topics in Storage and File Systems (HotStorage '15)."},{"key":"e_1_3_2_1_45_1","volume-title":"Proceedings of the 2016 USENIX Annual Technical Conference (USENIX ATC '16). 101--114","author":"Xia Wen","year":"2016","unstructured":"Wen Xia, Yukun Zhou, Hong Jiang, Dan Feng, Yu Hua, Yuchong Hu, Qing Liu, and Yucheng Zhang. 2016. FastCDC: A Fast and Efficient Content-Defined Chunking Approach for Data Deduplication. In Proceedings of the 2016 USENIX Annual Technical Conference (USENIX ATC '16). 101--114."},{"key":"e_1_3_2_1_46_1","doi-asserted-by":"publisher","DOI":"10.1109\/ICCD56317.2022.00053"},{"key":"e_1_3_2_1_47_1","volume-title":"Proceedings of the 2023 USENIX Annual Technical Conference (USENIX ATC '23). 133--148","author":"Zhang Yucheng","year":"2023","unstructured":"Yucheng Zhang, Hong Jiang, Dan Feng, Nan Jiang, Taorong Qiu, and Wei Huang. 2023. LoopDelta: Embedding Locality-aware Opportunistic Delta Compression in Inline Deduplication for Highly Efficient Data Reduction. In Proceedings of the 2023 USENIX Annual Technical Conference (USENIX ATC '23). 133--148."},{"key":"e_1_3_2_1_48_1","volume-title":"Proceedings of the 17th USENIX Conference on File and Storage Technologies (FAST '19)","author":"Zhang Yucheng","year":"2019","unstructured":"Yucheng Zhang, Wen Xia, Dan Feng, Hong Jiang, Yu Hua, and Qiang Wang. 2019. Finesse: Fine-Grained Feature Locality based Fast Resemblance Detection for Post-Deduplication Delta Compression. In Proceedings of the 17th USENIX Conference on File and Storage Technologies (FAST '19). 121--128."},{"key":"e_1_3_2_1_49_1","doi-asserted-by":"publisher","DOI":"10.1109\/TPDS.2020.2991030"},{"key":"e_1_3_2_1_50_1","doi-asserted-by":"publisher","DOI":"10.1145\/3643819"},{"volume-title":"Proceedings of the 6th USENIX Conference on File and Storage Technologies (FAST '08)","author":"Zhu Benjamin","key":"e_1_3_2_1_51_1","unstructured":"Benjamin Zhu, Kai Li, and R. Hugo Patterson. 2008. Avoiding the Disk Bottleneck in the Data Domain Deduplication File System. In Proceedings of the 6th USENIX Conference on File and Storage Technologies (FAST '08). 269--282."},{"key":"e_1_3_2_1_52_1","volume-title":"Proceedings of the 6th USENIX Conference on File and Storage Technologies (FAST' 08)","volume":"8","author":"Zhu Benjamin","year":"2008","unstructured":"Benjamin Zhu, Kai Li, and R Hugo Patterson. 2008. Avoiding the Disk Bottleneck in the Data Domain Deduplication File System.. In Proceedings of the 6th USENIX Conference on File and Storage Technologies (FAST' 08), Vol. 8. 1--14."},{"key":"e_1_3_2_1_53_1","volume-title":"Proceedings of 2022 USENIX Annual Technical Conference (USENIX ATC '22). 19--36","author":"Zou Xiangyu","year":"2022","unstructured":"Xiangyu Zou, Wen Xia, Philip Shilane, Haijun Zhang, and Xuan Wang. 2022. Building a High-performance Fine-grained Deduplication Framework for Backup Storage with High Deduplication Ratio. In Proceedings of 2022 USENIX Annual Technical Conference (USENIX ATC '22). 19--36."},{"key":"e_1_3_2_1_54_1","volume-title":"Proceedings of the 19th USENIX Conference on File and Storage Technologies (FAST '21)","author":"Zou Xiangyu","year":"2021","unstructured":"Xiangyu Zou, Jingsong Yuan, Philip Shilane, Wen Xia, Haijun Zhang, and Xuan Wang. 2021. The Dilemma between Deduplication and Locality: Can Both be Achieved?. In Proceedings of the 19th USENIX Conference on File and Storage Technologies (FAST '21). 171--185."}],"event":{"name":"EuroSys '25: Twentieth European Conference on Computer Systems","sponsor":["SIGOPS ACM Special Interest Group on Operating Systems"],"location":"Rotterdam Netherlands","acronym":"EuroSys '25"},"container-title":["Proceedings of the Twentieth European Conference on Computer Systems"],"original-title":[],"link":[{"URL":"https:\/\/dl.acm.org\/doi\/10.1145\/3689031.3717493","content-type":"unspecified","content-version":"vor","intended-application":"text-mining"},{"URL":"https:\/\/dl.acm.org\/doi\/pdf\/10.1145\/3689031.3717493","content-type":"unspecified","content-version":"vor","intended-application":"similarity-checking"}],"deposited":{"date-parts":[[2025,8,21]],"date-time":"2025-08-21T11:17:44Z","timestamp":1755775064000},"score":1,"resource":{"primary":{"URL":"https:\/\/dl.acm.org\/doi\/10.1145\/3689031.3717493"}},"subtitle":[],"short-title":[],"issued":{"date-parts":[[2025,3,30]]},"references-count":54,"alternative-id":["10.1145\/3689031.3717493","10.1145\/3689031"],"URL":"https:\/\/doi.org\/10.1145\/3689031.3717493","relation":{},"subject":[],"published":{"date-parts":[[2025,3,30]]},"assertion":[{"value":"2025-03-30","order":3,"name":"published","label":"Published","group":{"name":"publication_history","label":"Publication History"}}]}}