{"status":"ok","message-type":"work","message-version":"1.0.0","message":{"indexed":{"date-parts":[[2025,12,20]],"date-time":"2025-12-20T08:39:30Z","timestamp":1766219970963,"version":"3.48.0"},"publisher-location":"New York, NY, USA","reference-count":48,"publisher":"ACM","content-domain":{"domain":["dl.acm.org"],"crossmark-restriction":true},"short-container-title":[],"published-print":{"date-parts":[[2025,9,8]]},"DOI":"10.1145\/3754598.3754617","type":"proceedings-article","created":{"date-parts":[[2025,12,20]],"date-time":"2025-12-20T08:34:32Z","timestamp":1766219672000},"page":"22-32","update-policy":"https:\/\/doi.org\/10.1145\/crossmark-policy","source":"Crossref","is-referenced-by-count":0,"title":["Origami: Efficient ML-Driven Metadata Load Balancing for Distributed File Systems"],"prefix":"10.1145","author":[{"ORCID":"https:\/\/orcid.org\/0000-0002-8787-0134","authenticated-orcid":false,"given":"Yiduo","family":"Wang","sequence":"first","affiliation":[{"name":"China Telecom Cloud Computing Research Institute, Beijing, Beijing, China"}]},{"ORCID":"https:\/\/orcid.org\/0000-0001-6684-4642","authenticated-orcid":false,"given":"Wenda","family":"Tang","sequence":"additional","affiliation":[{"name":"China Telecom Cloud Computing Research Institute, Beijing, Beijing, China"}]},{"ORCID":"https:\/\/orcid.org\/0009-0000-7384-8529","authenticated-orcid":false,"given":"Linghang","family":"Meng","sequence":"additional","affiliation":[{"name":"China Telecom Cloud Computing Research Institute, Beijing, Beijing, China"}]},{"ORCID":"https:\/\/orcid.org\/0000-0002-2527-5049","authenticated-orcid":false,"given":"Liang","family":"Li","sequence":"additional","affiliation":[{"name":"China Telecom Cloud Computing Research Institute, Beijing, Beijing, China"}]},{"ORCID":"https:\/\/orcid.org\/0000-0002-3472-1717","authenticated-orcid":false,"given":"Jie","family":"Wu","sequence":"additional","affiliation":[{"name":"China Telecom Cloud Computing Research Institute, Beijing, 
Beijing, China"}]}],"member":"320","published-online":{"date-parts":[[2025,12,20]]},"reference":[{"key":"e_1_3_3_2_2_2","doi-asserted-by":"publisher","DOI":"10.1109\/UCC.2012.27"},{"key":"e_1_3_3_2_3_2","volume-title":"FAST\u201905","author":"Abd-El-Malek Michael","year":"2005","unstructured":"Michael Abd-El-Malek, William\u00a0V Courtright\u00a0II, Chuck Cranor, et\u00a0al. 2005. Ursa Minor: Versatile Cluster-based Storage.. In FAST\u201905."},{"key":"e_1_3_3_2_4_2","doi-asserted-by":"publisher","DOI":"10.1145\/2159352.2159356"},{"key":"e_1_3_3_2_5_2","unstructured":"A.S.Foundation. 2020. Log files - apache HTTP server version 2.4. https:\/\/httpd.apache.org\/docs\/2.4\/logs.html"},{"key":"e_1_3_3_2_6_2","unstructured":"AWS. 2006. Cloud Object Storage - Amazon S3. https:\/\/aws.amazon.com\/s3\/. Accessed May 1 2025."},{"key":"e_1_3_3_2_7_2","unstructured":"Ceph Community. 2017. CephFS subtree pinning. https:\/\/ceph.io\/community\/new-luminous-cephfs-subtree-pinning\/. Accessed May 1 2025."},{"key":"e_1_3_3_2_8_2","doi-asserted-by":"publisher","DOI":"10.1109\/ICCD58817.2023.00051"},{"key":"e_1_3_3_2_9_2","doi-asserted-by":"crossref","unstructured":"Yuanning Gao Xiaofeng Gao Ruisi Zhang and Guihai Chen. 2021. An end-to-end learning-based metadata management approach for distributed file systems. IEEE TC 71 5 (2021) 1021\u20131034.","DOI":"10.1109\/TC.2021.3070471"},{"key":"e_1_3_3_2_10_2","doi-asserted-by":"publisher","DOI":"10.1145\/945445.945450"},{"key":"e_1_3_3_2_11_2","first-page":"915","volume-title":"ATC\u201923","author":"Guo Hao","year":"2023","unstructured":"Hao Guo, Youyou Lu, Wenhao Lv, Xiaojian Liao, Shaoxun Zeng, and Jiwu Shu. 2023. SingularFS: A Billion-Scale Distributed File System Using a Single Metadata Server. In ATC\u201923. 915\u2013928."},{"key":"e_1_3_3_2_12_2","unstructured":"Apache Hadoop. 2006. Hadoop distributed file system. http:\/\/hadoop.apache.org. Accessed May 1 2025."},{"key":"e_1_3_3_2_13_2","unstructured":"Hops Hadoop. 2021. 
HopsFS 3.2.0.4. https:\/\/github.com\/hopshadoop\/hops\/tree\/3.2.0.4. Accessed May 1 2025."},{"key":"e_1_3_3_2_14_2","unstructured":"Jan Heichler. 2014. An introduction to BeeGFS."},{"key":"e_1_3_3_2_15_2","doi-asserted-by":"crossref","unstructured":"Xiuqi Huang Yuanning Gao Xinyi Zhou et\u00a0al. 2023. An adaptive metadata management scheme based on deep reinforcement learning for large-scale distributed file systems. IEEE\/ACM TON 31 6 (2023) 2840\u20132853.","DOI":"10.1109\/TNET.2023.3266400"},{"key":"e_1_3_3_2_16_2","unstructured":"Guolin Ke Qi Meng Thomas Finley et\u00a0al. 2017. Lightgbm: A highly efficient gradient boosting decision tree. NeurIPS\u201917 30 (2017)."},{"key":"e_1_3_3_2_17_2","doi-asserted-by":"publisher","DOI":"10.1145\/3292500.3330858"},{"key":"e_1_3_3_2_18_2","doi-asserted-by":"publisher","DOI":"10.1145\/3477132.3483565"},{"key":"e_1_3_3_2_19_2","volume-title":"ATC\u201908","author":"Leung Andrew\u00a0W","year":"2008","unstructured":"Andrew\u00a0W Leung, Shankar Pasupathy, Garth\u00a0R Goodson, et\u00a0al. 2008. Measurement and Analysis of Large-Scale Network File System Workloads.. In ATC\u201908."},{"key":"e_1_3_3_2_20_2","first-page":"231","volume-title":"FAST\u201923","author":"Li Qiang","year":"2023","unstructured":"Qiang Li, Lulu Chen, Xiaoliang Wang, et\u00a0al. 2023. Fisc: A Large-scale Cloud-native-oriented File System. In FAST\u201923. 231\u2013246."},{"key":"e_1_3_3_2_21_2","doi-asserted-by":"publisher","DOI":"10.1145\/3126908.3126928"},{"key":"e_1_3_3_2_22_2","doi-asserted-by":"publisher","DOI":"10.1145\/3620678.3624784"},{"key":"e_1_3_3_2_23_2","doi-asserted-by":"publisher","DOI":"10.1145\/3299869.3314046"},{"key":"e_1_3_3_2_24_2","doi-asserted-by":"publisher","DOI":"10.1007\/978-3-319-55753-3_5"},{"key":"e_1_3_3_2_25_2","doi-asserted-by":"publisher","DOI":"10.1109\/SC.2016.49"},{"key":"e_1_3_3_2_26_2","unstructured":"Lustre. 2017. Lustre metadata service. https:\/\/wiki.lustre.org\/Lustre_Metadata_Service_(MDS). 
Accessed May 1 2025."},{"key":"e_1_3_3_2_27_2","first-page":"313","volume-title":"FAST\u201922","author":"Lv Wenhao","year":"2022","unstructured":"Wenhao Lv, Youyou Lu, Yiming Zhang, et\u00a0al. 2022. InfiniFS: An Efficient Metadata Service for Large-Scale Distributed Filesystems. In FAST\u201922. 313\u2013328."},{"key":"e_1_3_3_2_28_2","doi-asserted-by":"publisher","DOI":"10.1145\/3502181.3533711"},{"key":"e_1_3_3_2_29_2","doi-asserted-by":"crossref","unstructured":"Stefano Nembrini Inke\u00a0R K\u00f6nig and Marvin\u00a0N Wright. 2018. The revival of the Gini importance? Bioinformatics 34 21 (2018) 3711\u20133718.","DOI":"10.1093\/bioinformatics\/bty373"},{"key":"e_1_3_3_2_30_2","first-page":"89","volume-title":"FAST\u201917","author":"Niazi Salman","year":"2017","unstructured":"Salman Niazi, Mahmoud Ismail, Seif Haridi, Jim Dowling, Steffen Grohsschmiedt, and Mikael Ronstr\u00f6m. 2017. HopsFS: Scaling hierarchical file system metadata using newsql databases. In FAST\u201917. 89\u2013104."},{"key":"e_1_3_3_2_31_2","first-page":"217","volume-title":"FAST\u201921","author":"Pan Satadru","year":"2021","unstructured":"Satadru Pan, Theano Stavrinos, Yunqiao Zhang, Atul Sikaria, Pavel Zakharov, Abhinav Sharma, Mike Shuey, Richard Wareing, Monika Gangapuram, Guanglei Cao, et\u00a0al. 2021. Facebook\u2019s Tectonic Filesystem: Efficiency from Exascale. In FAST\u201921. 217\u2013231."},{"key":"e_1_3_3_2_32_2","doi-asserted-by":"publisher","DOI":"10.1145\/3132747.3132765"},{"key":"e_1_3_3_2_33_2","doi-asserted-by":"publisher","DOI":"10.1145\/3035918.3056100"},{"key":"e_1_3_3_2_34_2","doi-asserted-by":"publisher","DOI":"10.1109\/SC.2014.25"},{"key":"e_1_3_3_2_35_2","doi-asserted-by":"publisher","DOI":"10.1145\/2807591.2807607"},{"key":"e_1_3_3_2_36_2","unstructured":"Konstantin\u00a0V. Shvachko. 2021. The exabyte club: LinkedIn\u2019s journey of scaling the Hadoop Distributed File System. 
https:\/\/engineering.linkedin.com\/blog\/2021\/the-exabyte-club-linkedin-s-journey-of-scaling-the-hadoop-distr. Accessed May 1 2025."},{"key":"e_1_3_3_2_37_2","doi-asserted-by":"publisher","DOI":"10.1109\/CLUSTER.2017.53"},{"key":"e_1_3_3_2_38_2","first-page":"451","volume-title":"Geomatic approaches for modeling land change scenarios","author":"Taud Hind","year":"2017","unstructured":"Hind Taud and Jean-Fran\u00e7ois Mas. 2017. Multilayer perceptron (MLP). In Geomatic approaches for modeling land change scenarios. Springer, 451\u2013455."},{"key":"e_1_3_3_2_39_2","doi-asserted-by":"publisher","unstructured":"Stephen\u00a0R. Walli. 1995. The POSIX family of standards. ACM Stand. 3 1 (1995) 11\u201317. 10.1145\/210308.210315","DOI":"10.1145\/210308.210315"},{"key":"e_1_3_3_2_40_2","doi-asserted-by":"publisher","DOI":"10.1145\/3458817.3476196"},{"key":"e_1_3_3_2_41_2","doi-asserted-by":"publisher","DOI":"10.1145\/3552326.3587443"},{"key":"e_1_3_3_2_42_2","doi-asserted-by":"publisher","DOI":"10.1145\/3545008.3545057"},{"key":"e_1_3_3_2_43_2","doi-asserted-by":"publisher","DOI":"10.23919\/DATE58400.2024.10546634"},{"key":"e_1_3_3_2_44_2","volume-title":"OSDI\u201906","author":"Weil Sage\u00a0A.","year":"2006","unstructured":"Sage\u00a0A. Weil, Scott\u00a0A. Brandt, Ethan\u00a0L. Miller, Darrell D.\u00a0E. Long, and Carlos Maltzahn. 2006. Ceph: A Scalable, High-Performance Distributed File System. In OSDI\u201906. USENIX Association, Seattle, WA."},{"key":"e_1_3_3_2_45_2","doi-asserted-by":"publisher","DOI":"10.1109\/SC.2004.22"},{"key":"e_1_3_3_2_46_2","first-page":"347","volume-title":"FAST\u201924","author":"Wong Daniel Lin-Kit","year":"2024","unstructured":"Daniel Lin-Kit Wong, Hao Wu, Carson Molder, Sathya Gunasekar, Jimmy Lu, Snehal Khandkar, Abhinav Sharma, Daniel\u00a0S Berger, Nathan Beckmann, and Gregory\u00a0R Ganger. 2024. Baleen: ML Admission & Prefetching for Flash Caches. In FAST\u201924. 
347\u2013371."},{"key":"e_1_3_3_2_47_2","doi-asserted-by":"publisher","DOI":"10.1145\/1654059.1654086"},{"key":"e_1_3_3_2_48_2","unstructured":"Jingwei Xu Mingkai Dong Qiulin Tian Ziyi Tian Tong Xin and Haibo Chen. 2024. AsyncFS: Metadata Updates Made Asynchronous for Distributed Filesystems with In-Network Coordination. arXiv preprint arXiv:2410.08618 (2024). https:\/\/arXiv.org\/abs\/2410.08618"},{"key":"e_1_3_3_2_49_2","first-page":"115","volume-title":"FAST\u201923","author":"Yang Juncheng","year":"2023","unstructured":"Juncheng Yang, Ziming Mao, Yao Yue, and KV Rashmi. 2023. GL-Cache: Group-level learning for efficient and high-performance caching. In FAST\u201923. 115\u2013134."}],"event":{"name":"ICPP '25: 54th International Conference on Parallel Processing","location":"San Diego CA USA","acronym":"ICPP '25"},"container-title":["Proceedings of the 54th International Conference on Parallel Processing"],"original-title":[],"link":[{"URL":"https:\/\/dl.acm.org\/doi\/pdf\/10.1145\/3754598.3754617","content-type":"unspecified","content-version":"vor","intended-application":"similarity-checking"}],"deposited":{"date-parts":[[2025,12,20]],"date-time":"2025-12-20T08:35:12Z","timestamp":1766219712000},"score":1,"resource":{"primary":{"URL":"https:\/\/dl.acm.org\/doi\/10.1145\/3754598.3754617"}},"subtitle":[],"short-title":[],"issued":{"date-parts":[[2025,9,8]]},"references-count":48,"alternative-id":["10.1145\/3754598.3754617","10.1145\/3754598"],"URL":"https:\/\/doi.org\/10.1145\/3754598.3754617","relation":{},"subject":[],"published":{"date-parts":[[2025,9,8]]},"assertion":[{"value":"2025-12-20","order":3,"name":"published","label":"Published","group":{"name":"publication_history","label":"Publication History"}}]}}