{"status":"ok","message-type":"work","message-version":"1.0.0","message":{"indexed":{"date-parts":[[2025,8,23]],"date-time":"2025-08-23T00:08:42Z","timestamp":1755907722363,"version":"3.44.0"},"publisher-location":"New York, NY, USA","reference-count":41,"publisher":"ACM","license":[{"start":{"date-parts":[[2024,11,20]],"date-time":"2024-11-20T00:00:00Z","timestamp":1732060800000},"content-version":"vor","delay-in-days":0,"URL":"https:\/\/creativecommons.org\/licenses\/by-nc-sa\/4.0\/"}],"funder":[{"DOI":"10.13039\/501100006374","name":"National Key Research and Development Program of China","doi-asserted-by":"publisher","award":["2023YFB4502902"],"award-info":[{"award-number":["2023YFB4502902"]}],"id":[{"id":"10.13039\/501100006374","id-type":"DOI","asserted-by":"publisher"}]}],"content-domain":{"domain":["dl.acm.org"],"crossmark-restriction":true},"short-container-title":[],"published-print":{"date-parts":[[2024,11,20]]},"DOI":"10.1145\/3698038.3698526","type":"proceedings-article","created":{"date-parts":[[2024,11,14]],"date-time":"2024-11-14T06:32:43Z","timestamp":1731565963000},"page":"883-897","update-policy":"https:\/\/doi.org\/10.1145\/crossmark-policy","source":"Crossref","is-referenced-by-count":1,"title":["A Data Optimizer for Region-Aware Self-describing Files in Scientific Computing"],"prefix":"10.1145","author":[{"ORCID":"https:\/\/orcid.org\/0000-0001-6317-8461","authenticated-orcid":false,"given":"Yanjie","family":"Song","sequence":"first","affiliation":[{"name":"School of Info. Sci. &amp; Tech., ShanghaiTech University, Shanghai, China"}]},{"ORCID":"https:\/\/orcid.org\/0009-0003-1820-0828","authenticated-orcid":false,"given":"Tianyuan","family":"Wu","sequence":"additional","affiliation":[{"name":"School of Info. Sci. &amp; Tech., ShanghaiTech University, Shanghai, China"}]},{"ORCID":"https:\/\/orcid.org\/0009-0008-0955-2000","authenticated-orcid":false,"given":"Yuanhao","family":"Li","sequence":"additional","affiliation":[{"name":"School of Info. Sci. &amp; Tech., ShanghaiTech University, Shanghai, China"}]},{"ORCID":"https:\/\/orcid.org\/0000-0002-9509-2635","authenticated-orcid":false,"given":"Guancheng","family":"Li","sequence":"additional","affiliation":[{"name":"School of Info. Sci. &amp; Tech., ShanghaiTech University, Shanghai, China"}]},{"ORCID":"https:\/\/orcid.org\/0000-0001-8137-794X","authenticated-orcid":false,"given":"Yuchen","family":"Liu","sequence":"additional","affiliation":[{"name":"School of Info. Sci. &amp; Tech., ShanghaiTech University, Shanghai, China"}]},{"ORCID":"https:\/\/orcid.org\/0000-0001-6500-1790","authenticated-orcid":false,"given":"Shu","family":"Yin","sequence":"additional","affiliation":[{"name":"School of Info. Sci. &amp; Tech., ShanghaiTech University, Shanghai, China"}]},{"ORCID":"https:\/\/orcid.org\/0000-0001-9740-6581","authenticated-orcid":false,"given":"Wei","family":"Xue","sequence":"additional","affiliation":[{"name":"Dept. of Computer Sci. and Tech., Tsinghua University, Beijing, China"}]},{"ORCID":"https:\/\/orcid.org\/0000-0002-2171-661X","authenticated-orcid":false,"given":"Junchao","family":"Wang","sequence":"additional","affiliation":[{"name":"China Meteorological Administration, Basin Heavy Rainfall Key Lab\/Hubei Key Lab for HV. Rain Mtrg. &amp; WRNG., Wuhan, Hubei, China"}]}],"member":"320","published-online":{"date-parts":[[2024,11,20]]},"reference":[{"key":"e_1_3_2_1_1_1","unstructured":"2022. Community Earth System Model CESM. https:\/\/www.cesm.ucar.edu\/. Accessed: 2022-1-1."},{"key":"e_1_3_2_1_2_1","unstructured":"2022. GROMACS. https:\/\/www.gromacs.org\/. Accessed: 2022-9-20."},{"key":"e_1_3_2_1_3_1","unstructured":"2022. Large-scale Atomic\/Molecular Massively Parallel Simulator LAMMPS. https:\/\/www.lammps.org\/. Accessed: 2022-1-1."},{"key":"e_1_3_2_1_4_1","unstructured":"2022. Weather Research and Forecasting model WRF. https:\/\/ral.ucar.edu\/solutions\/products\/weather-research-and-forecasting-model-wrf. Accessed: 2022-1-1."},{"volume-title":"14th USENIX Conference on File and Storage Technologies (FAST) 16)","author":"Andersen Michael P","key":"e_1_3_2_1_5_1","unstructured":"Michael P Andersen and David E Culler. 016. Btrdb: Optimizing storage system design for timeseries processing. In 14th USENIX Conference on File and Storage Technologies (FAST) 16). 39--52."},{"key":"e_1_3_2_1_6_1","doi-asserted-by":"publisher","DOI":"10.1016\/j.softx.2020.100550"},{"key":"e_1_3_2_1_7_1","doi-asserted-by":"publisher","DOI":"10.1107\/S1600576714007626"},{"key":"e_1_3_2_1_8_1","doi-asserted-by":"publisher","DOI":"10.1109\/COM.Geo.2014.1"},{"key":"e_1_3_2_1_9_1","doi-asserted-by":"publisher","DOI":"10.1145\/1654059.1654081"},{"key":"e_1_3_2_1_10_1","doi-asserted-by":"publisher","DOI":"10.1145\/2588555.2612185"},{"key":"e_1_3_2_1_11_1","doi-asserted-by":"publisher","DOI":"10.1109\/CLUSTER.2011.86"},{"key":"e_1_3_2_1_12_1","doi-asserted-by":"publisher","DOI":"10.1109\/CLUSTER.2013.6702675"},{"key":"e_1_3_2_1_13_1","doi-asserted-by":"publisher","DOI":"10.1109\/CLUSTER.2014.6968765"},{"key":"e_1_3_2_1_14_1","doi-asserted-by":"publisher","DOI":"10.1109\/BigData.2015.7363778"},{"key":"e_1_3_2_1_15_1","unstructured":"F. Alted M. Durant S. Hoyer J. Kirkham A. Miles M. Ratsimbazafy M. Rocklin V. Schut A. Scopatz and P. Goel. 2022. Zarr. https:\/\/zarr.readthedocs.io\/. Accessed: 2021-12-31."},{"key":"e_1_3_2_1_16_1","volume-title":"Proceedings of supercomputing","volume":"99","author":"Folk Mike","year":"1999","unstructured":"Mike Folk, Albert Cheng, and Kim Yates. 1999. HDF5: A file format and I\/O library for high performance computing applications. In Proceedings of supercomputing, Vol. 99. 5--33."},{"key":"e_1_3_2_1_17_1","doi-asserted-by":"publisher","DOI":"10.1145\/1966895.1966900"},{"key":"e_1_3_2_1_18_1","doi-asserted-by":"publisher","DOI":"10.1109\/CLUSTR.2009.5289153"},{"key":"e_1_3_2_1_19_1","doi-asserted-by":"publisher","DOI":"10.1016\/j.softx.2020.100561"},{"key":"e_1_3_2_1_20_1","doi-asserted-by":"publisher","DOI":"10.1109\/SSDBM.2006.27"},{"key":"e_1_3_2_1_21_1","doi-asserted-by":"publisher","DOI":"10.1016\/j.ascom.2015.06.004"},{"key":"e_1_3_2_1_22_1","doi-asserted-by":"publisher","DOI":"10.1016\/j.newast.2015.06.003"},{"key":"e_1_3_2_1_23_1","doi-asserted-by":"publisher","DOI":"10.1109\/TC.2018.2831689"},{"key":"e_1_3_2_1_24_1","doi-asserted-by":"publisher","DOI":"10.1002\/2016MS000656"},{"key":"e_1_3_2_1_25_1","doi-asserted-by":"publisher","DOI":"10.1145\/1048935.1050189"},{"key":"e_1_3_2_1_26_1","doi-asserted-by":"publisher","DOI":"10.1145\/1383529.1383533"},{"key":"e_1_3_2_1_27_1","doi-asserted-by":"publisher","DOI":"10.1107\/S1600576716007469"},{"volume-title":"A plugin for hdf5 using plfs for improved i\/o performance and semantic analysis. In 2012 SC Companion: High Performance Computing, Networking Storage and Analysis","author":"Mehta Kshitij","key":"e_1_3_2_1_28_1","unstructured":"Kshitij Mehta, John Bent, Aaron Torres, Gary Grider, and Edgar Gabriel. 2012. A plugin for hdf5 using plfs for improved i\/o performance and semantic analysis. In 2012 SC Companion: High Performance Computing, Networking Storage and Analysis. IEEE, 746--752."},{"key":"e_1_3_2_1_29_1","volume-title":"Universit\u00e9 Libre de Bruxelles 12","author":"Zehra Naqvi Syeda Noor","year":"2017","unstructured":"Syeda Noor Zehra Naqvi, Sofia Yfantidou, and Esteban Zim\u00e1nyi. 2017. Time series databases and influxdb. Studienarbeit, Universit\u00e9 Libre de Bruxelles 12 (2017)."},{"key":"e_1_3_2_1_30_1","doi-asserted-by":"publisher","DOI":"10.1145\/3357526.3357568"},{"key":"e_1_3_2_1_31_1","volume-title":"NetCDF: an interface for scientific data access","author":"Rew Russ","year":"1990","unstructured":"Russ Rew and Glenn Davis. 1990. NetCDF: an interface for scientific data access. IEEE computer graphics and applications 10, 4 (1990), 76--82."},{"key":"e_1_3_2_1_32_1","doi-asserted-by":"publisher","DOI":"10.1109\/CCGrid.2016.15"},{"key":"e_1_3_2_1_33_1","doi-asserted-by":"publisher","DOI":"10.1109\/FMPC.1999.750599"},{"key":"e_1_3_2_1_34_1","doi-asserted-by":"publisher","DOI":"10.1145\/2063384.2063409"},{"key":"e_1_3_2_1_35_1","doi-asserted-by":"publisher","DOI":"10.1109\/TPDS.2021.3100784"},{"key":"e_1_3_2_1_36_1","unstructured":"Donald Carson Wells and Eric W Greisen. 1979. FITS-a flexible image transport system. In Image Processing in Astronomy. 445."},{"key":"e_1_3_2_1_37_1","doi-asserted-by":"publisher","DOI":"10.1002\/2017JD027008"},{"key":"e_1_3_2_1_38_1","volume-title":"SC20: International Conference for High Performance Computing, Networking, Storage and Analysis. IEEE, 1--15","author":"Zhang Jian","year":"2020","unstructured":"Jian Zhang, Tao Xie, Yuzhuo Jing, Yanjie Song, Guanzhou Hu, Si Chen, and Shu Yin. 2020. BORA: a bag optimizer for robotic analysis. In SC20: International Conference for High Performance Computing, Networking, Storage and Analysis. IEEE, 1--15."},{"key":"e_1_3_2_1_39_1","doi-asserted-by":"publisher","DOI":"10.21105\/joss.01370"},{"key":"e_1_3_2_1_40_1","doi-asserted-by":"publisher","DOI":"10.1145\/3295500.3356146"},{"key":"e_1_3_2_1_41_1","doi-asserted-by":"publisher","DOI":"10.1109\/GEOINFORMATICS.2014.6950846"}],"event":{"name":"SoCC '24: ACM Symposium on Cloud Computing","sponsor":["SIGMOD ACM Special Interest Group on Management of Data","SIGOPS ACM Special Interest Group on Operating Systems"],"location":"Redmond WA USA","acronym":"SoCC '24"},"container-title":["Proceedings of the ACM Symposium on Cloud Computing"],"original-title":[],"link":[{"URL":"https:\/\/dl.acm.org\/doi\/10.1145\/3698038.3698526","content-type":"unspecified","content-version":"vor","intended-application":"text-mining"},{"URL":"https:\/\/dl.acm.org\/doi\/pdf\/10.1145\/3698038.3698526","content-type":"unspecified","content-version":"vor","intended-application":"similarity-checking"}],"deposited":{"date-parts":[[2025,8,22]],"date-time":"2025-08-22T19:00:08Z","timestamp":1755889208000},"score":1,"resource":{"primary":{"URL":"https:\/\/dl.acm.org\/doi\/10.1145\/3698038.3698526"}},"subtitle":[],"short-title":[],"issued":{"date-parts":[[2024,11,20]]},"references-count":41,"alternative-id":["10.1145\/3698038.3698526","10.1145\/3698038"],"URL":"https:\/\/doi.org\/10.1145\/3698038.3698526","relation":{},"subject":[],"published":{"date-parts":[[2024,11,20]]},"assertion":[{"value":"2024-11-20","order":3,"name":"published","label":"Published","group":{"name":"publication_history","label":"Publication History"}}]}}