{"status":"ok","message-type":"work","message-version":"1.0.0","message":{"indexed":{"date-parts":[[2026,2,10]],"date-time":"2026-02-10T16:38:20Z","timestamp":1770741500742,"version":"3.49.0"},"publisher-location":"New York, NY, USA","reference-count":14,"publisher":"ACM","license":[{"start":{"date-parts":[[2024,6,23]],"date-time":"2024-06-23T00:00:00Z","timestamp":1719100800000},"content-version":"vor","delay-in-days":0,"URL":"https:\/\/creativecommons.org\/licenses\/by\/4.0\/"}],"funder":[{"DOI":"10.13039\/501100001809","name":"National Natural Science Foundation of China","doi-asserted-by":"publisher","award":["62325405"],"award-info":[{"award-number":["62325405"]}],"id":[{"id":"10.13039\/501100001809","id-type":"DOI","asserted-by":"publisher"}]},{"DOI":"10.13039\/501100001809","name":"National Natural Science Foundation of China","doi-asserted-by":"publisher","award":["62104128"],"award-info":[{"award-number":["62104128"]}],"id":[{"id":"10.13039\/501100001809","id-type":"DOI","asserted-by":"publisher"}]},{"DOI":"10.13039\/501100001809","name":"National Natural Science Foundation of China","doi-asserted-by":"publisher","award":["U19B2019"],"award-info":[{"award-number":["U19B2019"]}],"id":[{"id":"10.13039\/501100001809","id-type":"DOI","asserted-by":"publisher"}]},{"DOI":"10.13039\/501100001809","name":"National Natural Science Foundation of China","doi-asserted-by":"publisher","award":["U21B2031"],"award-info":[{"award-number":["U21B2031"]}],"id":[{"id":"10.13039\/501100001809","id-type":"DOI","asserted-by":"publisher"}]},{"DOI":"10.13039\/501100001809","name":"National Natural Science Foundation of China","doi-asserted-by":"publisher","award":["61832007"],"award-info":[{"award-number":["61832007"]}],"id":[{"id":"10.13039\/501100001809","id-type":"DOI","asserted-by":"publisher"}]},{"DOI":"10.13039\/501100001809","name":"National Natural Science Foundation of China","doi-asserted-by":"publisher","award":["62204164"],"award-info":[{"award-number":["62204164"]}],"id":[{"id":"10.13039\/501100001809","id-type":"DOI","asserted-by":"publisher"}]}],"content-domain":{"domain":["dl.acm.org"],"crossmark-restriction":true},"short-container-title":[],"published-print":{"date-parts":[[2024,6,23]]},"DOI":"10.1145\/3649329.3657362","type":"proceedings-article","created":{"date-parts":[[2024,11,7]],"date-time":"2024-11-07T19:27:22Z","timestamp":1731007642000},"page":"1-6","update-policy":"https:\/\/doi.org\/10.1145\/crossmark-policy","source":"Crossref","is-referenced-by-count":3,"title":["DySpMM: From Fix to Dynamic for Sparse Matrix-Matrix Multiplication Accelerators"],"prefix":"10.1145","author":[{"ORCID":"https:\/\/orcid.org\/0009-0008-7095-7963","authenticated-orcid":false,"given":"Hongyi","family":"Wang","sequence":"first","affiliation":[{"name":"Tsinghua University, Beijing, Beijing, China"}],"role":[{"role":"author","vocabulary":"crossref"}]},{"ORCID":"https:\/\/orcid.org\/0000-0002-8448-9530","authenticated-orcid":false,"given":"Kai","family":"Zhong","sequence":"additional","affiliation":[{"name":"Tsinghua University, Beijing, Beijing, China"}],"role":[{"role":"author","vocabulary":"crossref"}]},{"ORCID":"https:\/\/orcid.org\/0009-0003-3889-8688","authenticated-orcid":false,"given":"Haoyu","family":"Zhang","sequence":"additional","affiliation":[{"name":"Tsinghua University, Beijing, Beijing, China"}],"role":[{"role":"author","vocabulary":"crossref"}]},{"ORCID":"https:\/\/orcid.org\/0000-0002-1030-3748","authenticated-orcid":false,"given":"Shulin","family":"Zeng","sequence":"additional","affiliation":[{"name":"Tsinghua university, Beijing, Beijing, China"}],"role":[{"role":"author","vocabulary":"crossref"}]},{"ORCID":"https:\/\/orcid.org\/0009-0007-9259-7180","authenticated-orcid":false,"given":"Zhenhua","family":"Zhu","sequence":"additional","affiliation":[{"name":"Tsinghua University, Beijing, Beijing, China"}],"role":[{"role":"author","vocabulary":"crossref"}]},{"ORCID":"https:\/\/orcid.org\/0009-0001-9739-2930","authenticated-orcid":false,"given":"Xinhao","family":"Yang","sequence":"additional","affiliation":[{"name":"Tsinghua University, Beijing, Beijing, China"}],"role":[{"role":"author","vocabulary":"crossref"}]},{"ORCID":"https:\/\/orcid.org\/0009-0002-8449-6092","authenticated-orcid":false,"given":"Shuang","family":"Wang","sequence":"additional","affiliation":[{"name":"Tsinghua University, Beijing, Beijing, China"}],"role":[{"role":"author","vocabulary":"crossref"}]},{"ORCID":"https:\/\/orcid.org\/0000-0003-0849-3252","authenticated-orcid":false,"given":"Guohao","family":"Dai","sequence":"additional","affiliation":[{"name":"Shanghai Jiao Tong University, Shanghai, Shanghai, China"}],"role":[{"role":"author","vocabulary":"crossref"}]},{"ORCID":"https:\/\/orcid.org\/0000-0003-2421-353X","authenticated-orcid":false,"given":"Huazhong","family":"Yang","sequence":"additional","affiliation":[{"name":"Tsinghua University, Haidian, Beijing, China"}],"role":[{"role":"author","vocabulary":"crossref"}]},{"ORCID":"https:\/\/orcid.org\/0000-0001-6108-5157","authenticated-orcid":false,"given":"Yu","family":"Wang","sequence":"additional","affiliation":[{"name":"Tsinghua University, Beijing, Beijing, China"}],"role":[{"role":"author","vocabulary":"crossref"}]}],"member":"320","published-online":{"date-parts":[[2024,11,7]]},"reference":[{"key":"e_1_3_2_1_1_1","doi-asserted-by":"crossref","unstructured":"Bulu\u00e7 et al. 2011. The Combinatorial BLAS: Design Implementation and Applications. Int. J. High Perform. Comput. Appl. (2011).","DOI":"10.1177\/1094342011403516"},{"key":"e_1_3_2_1_2_1","doi-asserted-by":"crossref","unstructured":"Yuze Chi et al. 2021. Extending High-Level Synthesis for Task-Parallel Programs. In FCCM. 204--213.","DOI":"10.1109\/FCCM51124.2021.00032"},{"key":"e_1_3_2_1_3_1","volume-title":"Davis et al","author":"Timothy A.","year":"2011","unstructured":"Timothy A. Davis et al. 2011. The University of Florida Sparse Matrix Collection. ACM Trans. Math. Softw., Article 1 (dec 2011), 25 pages."},{"key":"e_1_3_2_1_4_1","unstructured":"Yixiao Du et al. 2022. High-Performance Sparse Linear Algebra on HBM-Equipped FPGAs Using HLS: A Case Study on SpMV. (2022)."},{"key":"e_1_3_2_1_5_1","doi-asserted-by":"crossref","unstructured":"Jeremy Fowers et al. 2014. A high memory bandwidth fpga accelerator for sparse matrix-vector multiplication. In FCCM.","DOI":"10.1109\/FCCM.2014.23"},{"key":"e_1_3_2_1_6_1","volume-title":"Hamilton et al","author":"William L.","year":"2017","unstructured":"William L. Hamilton et al. 2017. Inductive Representation Learning on Large Graphs. In NIPS."},{"key":"e_1_3_2_1_7_1","unstructured":"Yuwei Hu et al. 2021. GraphLily: Accelerating Graph Linear Algebra on HBM-Equipped FPGAs. In ICCAD."},{"key":"e_1_3_2_1_8_1","volume-title":"Ge-spmm: General-purpose sparse matrix-matrix multiplication on gpus for graph neural networks. In SC.","author":"Guyue Huang","year":"2020","unstructured":"Guyue Huang et al. 2020. Ge-spmm: General-purpose sparse matrix-matrix multiplication on gpus for graph neural networks. In SC."},{"key":"e_1_3_2_1_9_1","unstructured":"Maxim Naumov et al. 2019. Deep Learning Recommendation Model for Personalization and Recommendation Systems. CoRR (2019)."},{"key":"e_1_3_2_1_10_1","unstructured":"Nvidia. 2022. https:\/\/docs.nvidia.com\/cuda\/cusparse\/index.html."},{"key":"e_1_3_2_1_11_1","volume-title":"Sextans: A Streaming Accelerator for General-Purpose Sparse-Matrix Dense-Matrix Multiplication. FPGA","author":"Linhao Song","year":"2021","unstructured":"Linhao Song et al. 2021. Sextans: A Streaming Accelerator for General-Purpose Sparse-Matrix Dense-Matrix Multiplication. FPGA (2021)."},{"key":"e_1_3_2_1_12_1","doi-asserted-by":"crossref","unstructured":"Hanrui Wang et al. 2020. GCN-RL Circuit Designer: Transferable Transistor Sizing with Graph Neural Networks and Reinforcement Learning. CoRR (2020).","DOI":"10.1109\/DAC18072.2020.9218757"},{"key":"e_1_3_2_1_13_1","doi-asserted-by":"crossref","unstructured":"Hanrui Wang et al. 2021. SpAtten: Efficient Sparse Attention Architecture with Cascade Token and Head Pruning. HPCA (2021) 97--110.","DOI":"10.1109\/HPCA51647.2021.00018"},{"key":"e_1_3_2_1_14_1","volume-title":"Shuhai: Benchmarking high bandwidth memory on fpgas","author":"Zeke Wang","year":"2020","unstructured":"Zeke Wang et al. 2020. Shuhai: Benchmarking high bandwidth memory on fpgas. In FCCM. IEEE."}],"event":{"name":"DAC '24: 61st ACM\/IEEE Design Automation Conference","location":"San Francisco CA USA","acronym":"DAC '24","sponsor":["SIGDA ACM Special Interest Group on Design Automation","IEEE-CEDA","SIGBED ACM Special Interest Group on Embedded Systems"]},"container-title":["Proceedings of the 61st ACM\/IEEE Design Automation Conference"],"original-title":[],"link":[{"URL":"https:\/\/dl.acm.org\/doi\/10.1145\/3649329.3657362","content-type":"unspecified","content-version":"vor","intended-application":"text-mining"},{"URL":"https:\/\/dl.acm.org\/doi\/pdf\/10.1145\/3649329.3657362","content-type":"unspecified","content-version":"vor","intended-application":"similarity-checking"}],"deposited":{"date-parts":[[2025,6,19]],"date-time":"2025-06-19T01:18:01Z","timestamp":1750295881000},"score":1,"resource":{"primary":{"URL":"https:\/\/dl.acm.org\/doi\/10.1145\/3649329.3657362"}},"subtitle":[],"short-title":[],"issued":{"date-parts":[[2024,6,23]]},"references-count":14,"alternative-id":["10.1145\/3649329.3657362","10.1145\/3649329"],"URL":"https:\/\/doi.org\/10.1145\/3649329.3657362","relation":{},"subject":[],"published":{"date-parts":[[2024,6,23]]},"assertion":[{"value":"2024-11-07","order":3,"name":"published","label":"Published","group":{"name":"publication_history","label":"Publication History"}}]}}