{"status":"ok","message-type":"work","message-version":"1.0.0","message":{"indexed":{"date-parts":[[2026,1,10]],"date-time":"2026-01-10T08:01:43Z","timestamp":1768032103915,"version":"3.49.0"},"publisher-location":"New York, NY, USA","reference-count":59,"publisher":"ACM","license":[{"start":{"date-parts":[[2025,8,22]],"date-time":"2025-08-22T00:00:00Z","timestamp":1755820800000},"content-version":"vor","delay-in-days":75,"URL":"http:\/\/www.acm.org\/publications\/policies\/copyright_policy#Background"}],"funder":[{"DOI":"10.13039\/100000001","name":"National Science Foundation","doi-asserted-by":"publisher","award":["2104023, 2311875, 2311876, 2326495, 2247060, 2247080, and 2211538"],"award-info":[{"award-number":["2104023, 2311875, 2311876, 2326495, 2247060, 2247080, and 2211538"]}],"id":[{"id":"10.13039\/100000001","id-type":"DOI","asserted-by":"publisher"}]},{"name":"U.S. Department of Energy, Office of Science, Advanced Scientific Computing Research (ASCR)","award":["DE-SC0024559"],"award-info":[{"award-number":["DE-SC0024559"]}]}],"content-domain":{"domain":["dl.acm.org"],"crossmark-restriction":true},"short-container-title":[],"published-print":{"date-parts":[[2025,6,8]]},"DOI":"10.1145\/3721145.3725743","type":"proceedings-article","created":{"date-parts":[[2025,8,22]],"date-time":"2025-08-22T12:57:17Z","timestamp":1755867437000},"page":"654-669","update-policy":"https:\/\/doi.org\/10.1145\/crossmark-policy","source":"Crossref","is-referenced-by-count":4,"title":["Pushing the Limits of GPU Lossy Compression: A Hierarchical Delta Approach"],"prefix":"10.1145","author":[{"ORCID":"https:\/\/orcid.org\/0009-0003-8937-4067","authenticated-orcid":false,"given":"Boyuan","family":"Zhang","sequence":"first","affiliation":[{"name":"Indiana University, Bloomington, USA"}],"role":[{"role":"author","vocabulary":"crossref"}]},{"ORCID":"https:\/\/orcid.org\/0000-0001-7370-6766","authenticated-orcid":false,"given":"Yafan","family":"Huang","sequence":"additional","affiliation":[{"name":"University of Iowa, Iowa City, USA"}],"role":[{"role":"author","vocabulary":"crossref"}]},{"ORCID":"https:\/\/orcid.org\/0000-0002-9935-5674","authenticated-orcid":false,"given":"Sheng","family":"Di","sequence":"additional","affiliation":[{"name":"Argonne National Laboratory, Lemont, USA"}],"role":[{"role":"author","vocabulary":"crossref"}]},{"ORCID":"https:\/\/orcid.org\/0000-0001-7382-093X","authenticated-orcid":false,"given":"Fengguang","family":"Song","sequence":"additional","affiliation":[{"name":"Indiana University, Bloomington, USA"}],"role":[{"role":"author","vocabulary":"crossref"}]},{"ORCID":"https:\/\/orcid.org\/0000-0001-7773-7826","authenticated-orcid":false,"given":"Guanpeng","family":"Li","sequence":"additional","affiliation":[{"name":"University of Iowa, Iowa City, USA"}],"role":[{"role":"author","vocabulary":"crossref"}]},{"ORCID":"https:\/\/orcid.org\/0000-0002-7890-3934","authenticated-orcid":false,"given":"Franck","family":"Cappello","sequence":"additional","affiliation":[{"name":"Argonne National Laboratory, Lemont, USA"}],"role":[{"role":"author","vocabulary":"crossref"}]}],"member":"320","published-online":{"date-parts":[[2025,8,22]]},"reference":[{"key":"e_1_3_3_2_2_2","unstructured":"[n. d.]. Benchmark of measuring bandwidth of multiple GPU. https:\/\/github.com\/enfiskutensykkel\/multi-gpu-bwtest."},{"key":"e_1_3_3_2_3_2","doi-asserted-by":"crossref","unstructured":"Mark Ainsworth Ozan Tugluk Ben Whitney and Scott Klasky. 2018. Multilevel techniques for compression and reduction of scientific data\u2014the univariate case. Computing and Visualization in Science 19 5 (2018) 65\u201376.","DOI":"10.1007\/s00791-018-00303-9"},{"key":"e_1_3_3_2_4_2","unstructured":"AMD. [n. d.]. HIPIFY. https:\/\/github.com\/ROCm-Developer-Tools\/HIPIFY."},{"key":"e_1_3_3_2_5_2","doi-asserted-by":"publisher","DOI":"10.1145\/3581784.3607089"},{"key":"e_1_3_3_2_6_2","doi-asserted-by":"crossref","unstructured":"Edip Baysal Dan\u00a0D Kosloff and John\u00a0WC Sherwood. 1983. Reverse time migration. Geophysics 48 11 (1983) 1514\u20131524.","DOI":"10.1190\/1.1441434"},{"key":"e_1_3_3_2_7_2","doi-asserted-by":"crossref","unstructured":"Franck Cappello Mario Acosta Emmanuel Agullo Hartwig Anzt Jon Calhoun Sheng Di Luc Giraud Thomas Gr\u00fctzmacher Sian Jin Kentaro Sano et\u00a0al. 2025. Multifacets of lossy compression for scientific data in the Joint-Laboratory of Extreme Scale Computing. Future Generation Computer Systems 163 (2025) 107323.","DOI":"10.1016\/j.future.2024.05.022"},{"key":"e_1_3_3_2_8_2","doi-asserted-by":"publisher","DOI":"10.1109\/IPDPS49936.2021.00095"},{"key":"e_1_3_3_2_9_2","unstructured":"Community Earth System Model (CESM) Atmosphere Model. 2019. http:\/\/www.cesm.ucar.edu\/models\/. Online."},{"key":"e_1_3_3_2_10_2","doi-asserted-by":"crossref","unstructured":"Andrew\u00a0W Cook William Cabot and Paul\u00a0L Miller. 2004. The mixing transition in Rayleigh\u2013Taylor instability. Journal of Fluid Mechanics 511 (2004) 333\u2013362.","DOI":"10.1017\/S0022112004009681"},{"key":"e_1_3_3_2_11_2","doi-asserted-by":"crossref","unstructured":"Luis\u00a0Rangel DaCosta Hamish\u00a0G Brown Philipp\u00a0M Pelz Alexander Rakowski Natolya Barber Peter O\u2019Donovan Patrick McBean Lewys Jones Jim Ciston MC Scott et\u00a0al. 2021. Prismatic 2.0\u2013Simulation software for scanning and high resolution transmission electron microscopy (STEM and HRTEM). Micron 151 (2021) 103141.","DOI":"10.1016\/j.micron.2021.103141"},{"key":"e_1_3_3_2_12_2","doi-asserted-by":"publisher","DOI":"10.1109\/IPDPS.2016.11"},{"key":"e_1_3_3_2_13_2","unstructured":"Sheng Di Jinyang Liu Kai Zhao Xin Liang Robert Underwood Zhaorui Zhang Milan Shah Yafan Huang Jiajun Huang Xiaodong Yu et\u00a0al. 2024. A Survey on Error-Bounded Lossy Compression for Scientific Datasets. arXiv preprint arXiv:https:\/\/arXiv.org\/abs\/2404.02840 (2024)."},{"key":"e_1_3_3_2_14_2","unstructured":"Jack\u00a0J Dongarra Hans\u00a0W Meuer Erich Strohmaier et\u00a0al. 1997. TOP500 supercomputer sites. Supercomputer 13 (1997) 89\u2013111."},{"key":"e_1_3_3_2_15_2","unstructured":"Alex Fallin Noushin Azami Sheng Di Franck Cappello and Martin Burtscher. [n. d.]. Fast and Effective Lossy Compression on GPUs and CPUs with Guaranteed Error Bounds. ([n. d.])."},{"key":"e_1_3_3_2_16_2","unstructured":"Alex Fallin and Martin Burtscher. 2024. Lessons Learned on the Path to Guaranteeing the Error Bound in Lossy Quantizers. arXiv preprint arXiv:https:\/\/arXiv.org\/abs\/2407.15037 (2024)."},{"key":"e_1_3_3_2_17_2","doi-asserted-by":"publisher","DOI":"10.1109\/SC41406.2024.00095"},{"key":"e_1_3_3_2_18_2","unstructured":"Jay Gambetta. 2020. IBM\u2019s roadmap for scaling quantum technology. https:\/\/www.ibm.com\/quantum\/blog\/ibm-quantum-roadmap?mhsrc=ibmsearch_a&mhq=condor."},{"key":"e_1_3_3_2_19_2","doi-asserted-by":"crossref","unstructured":"Ray\u00a0W Grout A Gruber H Kolla P-T Bremer JC Bennett A Gyulassy and JH Chen. 2012. A direct numerical simulation study of turbulence and flame structure in transverse jets analysed in jet-trajectory based coordinates. Journal of Fluid Mechanics 706 (2012) 351\u2013383.","DOI":"10.1017\/jfm.2012.257"},{"key":"e_1_3_3_2_20_2","doi-asserted-by":"crossref","unstructured":"Salman Habib Vitali Morozov Nicholas Frontiere Hal Finkel Adrian Pope Katrin Heitmann Kalyan Kumaran Venkatram Vishwanath Tom Peterka Joe Insley et\u00a0al. 2016. HACC: Extreme scaling and performance across diverse architectures. Commun. ACM 60 1 (2016) 97\u2013104.","DOI":"10.1145\/3015569"},{"key":"e_1_3_3_2_21_2","doi-asserted-by":"publisher","DOI":"10.1109\/ICPR.2010.579"},{"key":"e_1_3_3_2_22_2","doi-asserted-by":"publisher","DOI":"10.1109\/SC41406.2024.00021"},{"key":"e_1_3_3_2_23_2","doi-asserted-by":"publisher","DOI":"10.1145\/3581784.3607048"},{"key":"e_1_3_3_2_24_2","doi-asserted-by":"publisher","DOI":"10.1109\/CCGrid57682.2023.00066"},{"key":"e_1_3_3_2_25_2","unstructured":"Intel. [n. d.]. SYCLomatic. https:\/\/github.com\/oneapi-src\/SYCLomatic."},{"key":"e_1_3_3_2_26_2","unstructured":"Jinda Jia Cong Xie Hanlin Lu Daoce Wang Hao Feng Chengming Zhang Baixi Sun Haibin Lin Zhi Zhang Xin Liu et\u00a0al. 2024. SDP4Bit: Toward 4-bit Communication Quantization in Sharded Data Parallelism for LLM Training. arXiv preprint arXiv:https:\/\/arXiv.org\/abs\/2410.15526 (2024)."},{"key":"e_1_3_3_2_27_2","unstructured":"Wenqi Jia Youyuan Liu Zhewen Hu Jinzhen Wang Boyuan Zhang Wei Niu Junzhou Huang Stavros Kalafatis Sian Jin and Miao Yin. 2024. NeurLZ: On Enhancing Lossy Compression Performance based on Error-Controlled Neural Learning for Scientific Data. arXiv preprint arXiv:https:\/\/arXiv.org\/abs\/2409.05785 (2024)."},{"key":"e_1_3_3_2_28_2","doi-asserted-by":"publisher","DOI":"10.1145\/3431379.3460653"},{"key":"e_1_3_3_2_29_2","unstructured":"P. Klacansky. 2017. Open SciVis Datasets. https:\/\/klacansky.com\/open-scivis-datasets\/."},{"key":"e_1_3_3_2_30_2","doi-asserted-by":"publisher","DOI":"10.1109\/PacificVis53943.2022.00017"},{"key":"e_1_3_3_2_31_2","doi-asserted-by":"publisher","DOI":"10.1109\/DCC50243.2021.00018"},{"key":"e_1_3_3_2_32_2","doi-asserted-by":"publisher","DOI":"10.1145\/3458817.3476169"},{"key":"e_1_3_3_2_33_2","doi-asserted-by":"publisher","DOI":"10.1109\/IPDPS54959.2023.00104"},{"key":"e_1_3_3_2_34_2","doi-asserted-by":"publisher","DOI":"10.1109\/IPDPS57955.2024.00040"},{"key":"e_1_3_3_2_35_2","doi-asserted-by":"publisher","DOI":"10.1145\/3295500.3356193"},{"key":"e_1_3_3_2_36_2","doi-asserted-by":"publisher","DOI":"10.1109\/BigData.2018.8622520"},{"key":"e_1_3_3_2_37_2","doi-asserted-by":"crossref","unstructured":"Xin Liang Ben Whitney Jieyang Chen Lipeng Wan Qing Liu Dingwen Tao James Kress David Pugmire Matthew Wolf Norbert Podhorszki et\u00a0al. 2021. Mgard+: Optimizing multilevel methods for error-bounded scientific data reduction. IEEE Trans. Comput. 71 7 (2021) 1522\u20131536.","DOI":"10.1109\/TC.2021.3092201"},{"key":"e_1_3_3_2_38_2","doi-asserted-by":"crossref","unstructured":"Xin Liang Kai Zhao Sheng Di Sihuan Li Robert Underwood Ali\u00a0M Gok Jiannan Tian Junjing Deng Jon\u00a0C Calhoun Dingwen Tao et\u00a0al. 2022. SZ3: A modular framework for composing prediction-based error-bounded lossy compressors. IEEE Transactions on Big Data 9 2 (2022) 485\u2013498.","DOI":"10.1109\/TBDATA.2022.3201176"},{"key":"e_1_3_3_2_39_2","doi-asserted-by":"crossref","unstructured":"Guo-Yuan Lien Takemasa Miyoshi Seiya Nishizawa Ryuji Yoshida Hisashi Yashiro Sachiho\u00a0A Adachi Tsuyoshi Yamaura and Hirofumi Tomita. 2017. The near-real-time SCALE-LETKF system: A case of the September 2015 Kanto-Tohoku heavy rainfall. Sola 13 (2017) 1\u20136.","DOI":"10.2151\/sola.2017-001"},{"key":"e_1_3_3_2_40_2","doi-asserted-by":"crossref","unstructured":"Peter Lindstrom. 2014. Fixed-rate compressed floating-point arrays. IEEE transactions on visualization and computer graphics 20 12 (2014) 2674\u20132683.","DOI":"10.1109\/TVCG.2014.2346458"},{"key":"e_1_3_3_2_41_2","doi-asserted-by":"publisher","DOI":"10.1109\/SC41406.2024.00019"},{"key":"e_1_3_3_2_42_2","unstructured":"Duane Merrill and Michael Garland. 2016. Single-pass parallel prefix scan with decoupled look-back. NVIDIA Tech. Rep. NVR-2016-002 (2016)."},{"key":"e_1_3_3_2_43_2","unstructured":"nvCOMP: A library for fast lossless compression\/decompression on the GPU. [n. d.]. https:\/\/github.com\/NVIDIA\/nvcomp."},{"key":"e_1_3_3_2_44_2","unstructured":"NYX simulation. [n. d.]. https:\/\/amrex-astro.github.io\/Nyx\/. Online."},{"key":"e_1_3_3_2_45_2","doi-asserted-by":"publisher","DOI":"10.1145\/1964179.1964189"},{"key":"e_1_3_3_2_46_2","doi-asserted-by":"crossref","unstructured":"John Preskill. 2018. Quantum computing in the NISQ era and beyond. Quantum 2 (2018) 79.","DOI":"10.22331\/q-2018-08-06-79"},{"key":"e_1_3_3_2_47_2","unstructured":"QMCPACK: many-body ab initio Quantum Monte Carlo code. 2019. http:\/\/vis.computer.org\/vis2004contest\/data.html. Online."},{"key":"e_1_3_3_2_48_2","doi-asserted-by":"publisher","DOI":"10.1145\/3625549.3658691"},{"key":"e_1_3_3_2_49_2","doi-asserted-by":"publisher","DOI":"10.1109\/IPDPS64566.2025.00084"},{"key":"e_1_3_3_2_50_2","doi-asserted-by":"publisher","DOI":"10.1109\/IPDPS.2017.115"},{"key":"e_1_3_3_2_51_2","doi-asserted-by":"publisher","DOI":"10.1145\/3410463.3414624"},{"key":"e_1_3_3_2_52_2","doi-asserted-by":"publisher","DOI":"10.1145\/3295500.3356155"},{"key":"e_1_3_3_2_53_2","doi-asserted-by":"publisher","DOI":"10.1109\/CLUSTER.2015.59"},{"key":"e_1_3_3_2_54_2","unstructured":"Zhuoxun Yang Sheng Di Longtao Zhang Ruoyu Li Ximiao Li Jiajun Huang Jinyang Liu Franck Cappello and Kai Zhao. 2025. PSZ: Enhancing the SZ Scientific Lossy Compressor With Progressive Data Retrieval. arXiv preprint arXiv:https:\/\/arXiv.org\/abs\/2502.04093 (2025)."},{"key":"e_1_3_3_2_55_2","doi-asserted-by":"publisher","DOI":"10.1145\/3502181.3531473"},{"key":"e_1_3_3_2_56_2","unstructured":"Boyuan Zhang Bo Fang Fanjiang Ye Yida Gu Nathan Tallent Guangming Tan and Dingwen Tao. 2024. Overcoming memory constraints in quantum circuit simulation with a high-fidelity compression framework. arXiv preprint arXiv:https:\/\/arXiv.org\/abs\/2410.14088 (2024)."},{"key":"e_1_3_3_2_57_2","doi-asserted-by":"publisher","DOI":"10.1145\/3710848.3710851"},{"key":"e_1_3_3_2_58_2","doi-asserted-by":"publisher","DOI":"10.1145\/3588195.3592994"},{"key":"e_1_3_3_2_59_2","doi-asserted-by":"publisher","DOI":"10.1145\/3577193.3593706"},{"key":"e_1_3_3_2_60_2","doi-asserted-by":"publisher","DOI":"10.1109\/BigData50022.2020.9378449"}],"event":{"name":"ICS '25: 2025 International Conference on Supercomputing","location":"Salt Lake City USA","acronym":"ICS '25","sponsor":["SIGARCH ACM Special Interest Group on Computer Architecture"]},"container-title":["Proceedings of the 39th ACM International Conference on Supercomputing"],"original-title":[],"link":[{"URL":"https:\/\/dl.acm.org\/doi\/pdf\/10.1145\/3721145.3725743","content-type":"application\/pdf","content-version":"vor","intended-application":"syndication"},{"URL":"https:\/\/dl.acm.org\/doi\/pdf\/10.1145\/3721145.3725743","content-type":"unspecified","content-version":"vor","intended-application":"similarity-checking"}],"deposited":{"date-parts":[[2025,8,22]],"date-time":"2025-08-22T13:03:03Z","timestamp":1755867783000},"score":1,"resource":{"primary":{"URL":"https:\/\/dl.acm.org\/doi\/10.1145\/3721145.3725743"}},"subtitle":[],"short-title":[],"issued":{"date-parts":[[2025,6,8]]},"references-count":59,"alternative-id":["10.1145\/3721145.3725743","10.1145\/3721145"],"URL":"https:\/\/doi.org\/10.1145\/3721145.3725743","relation":{},"subject":[],"published":{"date-parts":[[2025,6,8]]},"assertion":[{"value":"2025-08-22","order":3,"name":"published","label":"Published","group":{"name":"publication_history","label":"Publication History"}}]}}