{"status":"ok","message-type":"work","message-version":"1.0.0","message":{"indexed":{"date-parts":[[2026,1,8]],"date-time":"2026-01-08T01:31:32Z","timestamp":1767835892148,"version":"3.49.0"},"publisher-location":"New York, NY, USA","reference-count":36,"publisher":"ACM","license":[{"start":{"date-parts":[[2024,4,27]],"date-time":"2024-04-27T00:00:00Z","timestamp":1714176000000},"content-version":"vor","delay-in-days":0,"URL":"https:\/\/creativecommons.org\/licenses\/by-nc\/4.0\/"}],"content-domain":{"domain":["dl.acm.org"],"crossmark-restriction":true},"short-container-title":[],"published-print":{"date-parts":[[2024,4,27]]},"DOI":"10.1145\/3622781.3674186","type":"proceedings-article","created":{"date-parts":[[2025,4,10]],"date-time":"2025-04-10T15:31:01Z","timestamp":1744299061000},"page":"127-141","update-policy":"https:\/\/doi.org\/10.1145\/crossmark-policy","source":"Crossref","is-referenced-by-count":7,"title":["GUST: Graph Edge-Coloring Utilization for Accelerating Sparse Matrix Vector Multiplication"],"prefix":"10.1145","author":[{"ORCID":"https:\/\/orcid.org\/0009-0005-7542-5374","authenticated-orcid":false,"given":"Armin","family":"Gerami","sequence":"first","affiliation":[{"name":"Computer Science, University of Maryland, College Park, MD, USA"}]},{"ORCID":"https:\/\/orcid.org\/0000-0003-2305-9892","authenticated-orcid":false,"given":"Bahar","family":"Asgari","sequence":"additional","affiliation":[{"name":"Computer Science, University of Maryland, College Park, MD, United States of America"}]}],"member":"320","published-online":{"date-parts":[[2025,4,10]]},"reference":[{"key":"e_1_3_2_1_1_1","doi-asserted-by":"publisher","DOI":"10.1109\/HPCA51647.2021.00080"},{"key":"e_1_3_2_1_2_1","first-page":"1","volume-title":"2021 IEEE International Symposium on Workload Characterization (IISWC)","author":"Asgari Bahar","year":"2021","unstructured":"Bahar Asgari, Ramyad Hadidi, Joshua Dierberger, Charlotte Steinichen, Amaan Marfatia, and Hyesoon Kim. Copernicus: Characterizing the performance implications of compression formats used in sparse workloads. In 2021 IEEE International Symposium on Workload Characterization (IISWC), pages 1--12. IEEE, 2021."},{"key":"e_1_3_2_1_3_1","doi-asserted-by":"crossref","first-page":"277","DOI":"10.1109\/FPL57034.2022.00049","volume-title":"2022 32nd International Conference on Field-Programmable Logic and Applications (FPL)","author":"Asgari Bahar","year":"2022","unstructured":"Bahar Asgari, Dheeraj Ramchandani, Amaan Marfatia, and Hyesoon Kim. Maia: Matrix inversion acceleration near memory. In 2022 32nd International Conference on Field-Programmable Logic and Applications (FPL), pages 277--281. IEEE, 2022."},{"key":"e_1_3_2_1_4_1","doi-asserted-by":"publisher","DOI":"10.1109\/TC.1982.1675982"},{"key":"e_1_3_2_1_5_1","volume-title":"The Future of Computing: Domain-Specific Architecture. https:\/\/www.clsac.org\/uploads\/5\/0\/6\/3\/50633811\/2021-clsacdally.pdf","author":"Dally William","year":"2021","unstructured":"William Dally. The Future of Computing: Domain-Specific Architecture. https:\/\/www.clsac.org\/uploads\/5\/0\/6\/3\/50633811\/2021-clsacdally.pdf, 2021. [Online; accessed May-2023]."},{"key":"e_1_3_2_1_6_1","volume-title":"On the Model of Computation: Point: We Must Extend Our Model of Computation to Account for Cost and Location. https:\/\/cacm.acm.org\/magazines\/2022\/9\/263792-on-the-model-of-computation-point\/abstract","author":"Dally William","year":"2022","unstructured":"William Dally. On the Model of Computation: Point: We Must Extend Our Model of Computation to Account for Cost and Location. https:\/\/cacm.acm.org\/magazines\/2022\/9\/263792-on-the-model-of-computation-point\/abstract, 2022. [Online; accessed May-2023]."},{"key":"e_1_3_2_1_7_1","volume-title":"The university of florida sparse matrix collection. ACM Transactions on Mathematical Software (TOMS), 38(1):1--25","author":"Davis Timothy A","year":"2011","unstructured":"Timothy A Davis and Yifan Hu. The university of florida sparse matrix collection. ACM Transactions on Mathematical Software (TOMS), 38(1):1--25, 2011."},{"key":"e_1_3_2_1_8_1","doi-asserted-by":"publisher","DOI":"10.1145\/3490422.3502368"},{"key":"e_1_3_2_1_9_1","doi-asserted-by":"crossref","first-page":"245","DOI":"10.1145\/3470496.3527432","volume-title":"Proceedings of the 49th Annual International Symposium on Computer Architecture","author":"Feng Siying","year":"2022","unstructured":"Siying Feng, Xin He, Kuan-Yu Chen, Liu Ke, Xuan Zhang, David Blaauw, Trevor Mudge, and Ronald Dreslinski. Menda: a near-memory multi-way merge solution for sparse transposition and dataflows. In Proceedings of the 49th Annual International Symposium on Computer Architecture, pages 245--258, 2022."},{"key":"e_1_3_2_1_10_1","first-page":"148","volume-title":"Proceedings of the International Conference on Parallel Architectures and Compilation Techniques, PACT '22","author":"He Xin","year":"2023","unstructured":"Xin He, Kuan-Yu Chen, Siying Feng, Hun-Seok Kim, David Blaauw, Ronald Dreslinski, and Trevor Mudge. Squaring the circle: Executing sparse matrix computations on flextpu---a tpu-like processor. In Proceedings of the International Conference on Parallel Architectures and Compilation Techniques, PACT '22, page 148--159, New York, NY, USA, 2023. Association for Computing Machinery."},{"key":"e_1_3_2_1_11_1","doi-asserted-by":"publisher","DOI":"10.1145\/3392717.3392751"},{"key":"e_1_3_2_1_12_1","first-page":"1","volume-title":"2021 IEEE\/ACM International Conference On Computer Aided Design (ICCAD)","author":"Hu Yuwei","year":"2021","unstructured":"Yuwei Hu, Yixiao Du, Ecenur Ustun, and Zhiru Zhang. Graphlily: Accelerating graph linear algebra on hbm-equipped fpgas. In 2021 IEEE\/ACM International Conference On Computer Aided Design (ICCAD), pages 1--9. IEEE, 2021."},{"key":"e_1_3_2_1_13_1","doi-asserted-by":"crossref","first-page":"127","DOI":"10.1109\/FPL50879.2020.00031","volume-title":"2020 30th International conference on field-programmable logic and applications (FPL)","author":"Jain Abhishek Kumar","year":"2020","unstructured":"Abhishek Kumar Jain, Hossein Omidian, Henri Fraisse, Mansimran Benipal, Lisa Liu, and Dinesh Gaitonde. A domain-specific architecture for accelerating sparse matrix vector multiplication on fpgas. In 2020 30th International conference on field-programmable logic and applications (FPL), pages 127--132. IEEE, 2020."},{"key":"e_1_3_2_1_14_1","doi-asserted-by":"publisher","DOI":"10.1145\/3579371.3589350"},{"key":"e_1_3_2_1_15_1","doi-asserted-by":"publisher","DOI":"10.1145\/3140659.3080246"},{"key":"e_1_3_2_1_16_1","first-page":"600","volume-title":"Proceedings of the 52nd Annual IEEE\/ACM International Symposium on Microarchitecture, MICRO '52","author":"Kanellopoulos Konstantinos","year":"2019","unstructured":"Konstantinos Kanellopoulos, Nandita Vijaykumar, Christina Giannoula, Roknoddin Azizi, Skanda Koppula, Nika Mansouri Ghiasi, Taha Shahroodi, Juan Gomez Luna, and Onur Mutlu. Smash: Co-designing software compression and hardware-accelerated indexing for efficient sparse matrix operations. In Proceedings of the 52nd Annual IEEE\/ACM International Symposium on Microarchitecture, MICRO '52, page 600--614, New York, NY, USA, 2019. Association for Computing Machinery."},{"key":"e_1_3_2_1_17_1","first-page":"256","volume-title":"Sparse Matrix Proceedings 1978","volume":"1","author":"Kung Hsiang Tsung","year":"1979","unstructured":"Hsiang Tsung Kung and Charles E Leiserson. Systolic arrays (for vlsi). In Sparse Matrix Proceedings 1978, volume 1, pages 256--282. Society for industrial and applied mathematics Philadelphia, PA, USA, 1979."},{"key":"e_1_3_2_1_18_1","unstructured":"Jure Leskovec and Andrej Krevl. SNAP Datasets: Stanford large network dataset collection. http:\/\/snap.stanford.edu\/data June 2014."},{"key":"e_1_3_2_1_19_1","doi-asserted-by":"publisher","DOI":"10.1109\/ICCAD51958.2021.9643453"},{"key":"e_1_3_2_1_20_1","doi-asserted-by":"publisher","DOI":"10.1145\/3566097.3567839"},{"key":"e_1_3_2_1_21_1","first-page":"1","volume-title":"2019 IEEE\/ACM International Conference on Computer-Aided Design (ICCAD)","author":"Lu Kai","year":"2019","unstructured":"Kai Lu, Zhaoshi Li, Leibo Liu, Jiawei Wang, Shouyi Yin, and Shaojun Wei. Redesk: A reconfigurable dataflow engine for sparse kernels on heterogeneous platforms. In 2019 IEEE\/ACM International Conference on Computer-Aided Design (ICCAD), pages 1--8. IEEE, 2019."},{"key":"e_1_3_2_1_22_1","first-page":"1","volume-title":"2019 Spring Simulation Conference (SpringSim)","author":"Montagne Euripides","year":"2019","unstructured":"Euripides Montagne and Rina Sur\u00f3s. Systolic sparse matrix vector multiply in the age of tpus and accelerators. In 2019 Spring Simulation Conference (SpringSim), pages 1--10, 2019."},{"key":"e_1_3_2_1_23_1","first-page":"175","volume-title":"Proceedings of the ACM International Conference on Parallel Architectures and Compilation Techniques, PACT '20","author":"Pal Subhankar","year":"2020","unstructured":"Subhankar Pal, Siying Feng, Dong-hyeon Park, Sung Kim, Aporva Amarnath, Chi-Sheng Yang, Xin He, Jonathan Beaumont, Kyle May, Yan Xiong, Kuba Kaszyk, John Magnus Morton, Jiawen Sun, Michael O'Boyle, Murray Cole, Chaitali Chakrabarti, David Blaauw, Hun-Seok Kim, Trevor Mudge, and Ronald Dreslinski. Transmuter: Bridging the efficiency gap using memory and dataflow reconfiguration. In Proceedings of the ACM International Conference on Parallel Architectures and Compilation Techniques, PACT '20, page 175--190, New York, NY, USA, 2020. Association for Computing Machinery."},{"key":"e_1_3_2_1_24_1","doi-asserted-by":"publisher","DOI":"10.1145\/3394885.3431548"},{"key":"e_1_3_2_1_25_1","doi-asserted-by":"crossref","first-page":"36","DOI":"10.1109\/EDGE60047.2023.00018","volume-title":"2023 IEEE International Conference on Edge Computing and Communications (EDGE)","author":"Ramchandani Dheeraj","year":"2023","unstructured":"Dheeraj Ramchandani, Bahar Asgari, and Hyesoon Kim. Spica: Exploring fpga optimizations to enable an efficient spmv implementation for computations at edge. In 2023 IEEE International Conference on Edge Computing and Communications (EDGE), pages 36--42. IEEE, 2023."},{"key":"e_1_3_2_1_26_1","first-page":"1","volume-title":"2017 IEEE High Performance Extreme Computing Conference (HPEC)","author":"Sadi Fazle","year":"2017","unstructured":"Fazle Sadi, Larry Fileggi, and Franz Franchetti. Algorithm and hardware co-optimized solution for large spmv problems. In 2017 IEEE High Performance Extreme Computing Conference (HPEC), pages 1--7. IEEE, 2017."},{"key":"e_1_3_2_1_27_1","doi-asserted-by":"publisher","DOI":"10.1145\/3352460.3358330"},{"key":"e_1_3_2_1_28_1","doi-asserted-by":"crossref","first-page":"51","DOI":"10.1109\/ASAP.2019.00-30","volume-title":"2019 IEEE 30th International Conference on Application-specific Systems, Architectures and Processors (ASAP)","volume":"2160","author":"Sigurbergsson Bj\u00f6rn","year":"2019","unstructured":"Bj\u00f6rn Sigurbergsson, Tom Hogervorst, Tong Dong Qiu, and Razvan Nane. Sparstition: a partitioning scheme for large-scale sparse matrix vector multiplication on fpga. In 2019 IEEE 30th International Conference on Application-specific Systems, Architectures and Processors (ASAP), volume 2160, pages 51--58. IEEE, 2019."},{"key":"e_1_3_2_1_29_1","doi-asserted-by":"publisher","DOI":"10.1145\/3489517.3530420"},{"key":"e_1_3_2_1_30_1","doi-asserted-by":"publisher","DOI":"10.1145\/3490422.3502357"},{"key":"e_1_3_2_1_31_1","doi-asserted-by":"publisher","DOI":"10.1109\/HPCA47549.2020.00062"},{"key":"e_1_3_2_1_32_1","doi-asserted-by":"publisher","DOI":"10.1109\/HPCA51647.2021.00061"},{"key":"e_1_3_2_1_33_1","volume-title":"Proceedings of the 51st International Conference on Parallel Processing, ICPP '22","author":"Tang Minjin","year":"2023","unstructured":"Minjin Tang, Mei Wen, Yasong Cao, Junzhong Shen, Jianchao Yang, Jiawei Fei, Yang Guo, and Sheng Liu. Mentha: Enabling sparse-packing computation on systolic arrays. In Proceedings of the 51st International Conference on Parallel Processing, ICPP '22, New York, NY, USA, 2023. Association for Computing Machinery."},{"key":"e_1_3_2_1_34_1","first-page":"9","article-title":"Critical graphs with given chromatic class","volume":"5","author":"Vizing Vadim Georgievich","year":"1965","unstructured":"Vadim Georgievich Vizing. Critical graphs with given chromatic class. Metody Diskret. Analiz., 5: 9--17. (In Russian.), 1965.","journal-title":"Metody Diskret. Analiz."},{"key":"e_1_3_2_1_35_1","doi-asserted-by":"publisher","DOI":"10.1109\/HPCA51647.2021.00055"},{"key":"e_1_3_2_1_36_1","doi-asserted-by":"publisher","DOI":"10.1109\/HPCA47549.2020.00030"}],"event":{"name":"ASPLOS '24: 29th ACM International Conference on Architectural Support for Programming Languages and Operating Systems, Volume 4","location":"Hilton La Jolla Torrey Pines La Jolla CA USA","acronym":"ASPLOS '24","sponsor":["SIGOPS ACM Special Interest Group on Operating Systems","SIGPLAN ACM Special Interest Group on Programming Languages","SIGARCH ACM Special Interest Group on Computer Architecture","SIGBED ACM Special Interest Group on Embedded Systems"]},"container-title":["Proceedings of the 29th ACM International Conference on Architectural Support for Programming Languages and Operating Systems, Volume 4"],"original-title":[],"link":[{"URL":"https:\/\/dl.acm.org\/doi\/10.1145\/3622781.3674186","content-type":"unspecified","content-version":"vor","intended-application":"text-mining"},{"URL":"https:\/\/dl.acm.org\/doi\/pdf\/10.1145\/3622781.3674186","content-type":"unspecified","content-version":"vor","intended-application":"similarity-checking"}],"deposited":{"date-parts":[[2025,6,17]],"date-time":"2025-06-17T16:37:03Z","timestamp":1750178223000},"score":1,"resource":{"primary":{"URL":"https:\/\/dl.acm.org\/doi\/10.1145\/3622781.3674186"}},"subtitle":[],"short-title":[],"issued":{"date-parts":[[2024,4,27]]},"references-count":36,"alternative-id":["10.1145\/3622781.3674186","10.1145\/3622781"],"URL":"https:\/\/doi.org\/10.1145\/3622781.3674186","relation":{},"subject":[],"published":{"date-parts":[[2024,4,27]]},"assertion":[{"value":"2025-04-10","order":3,"name":"published","label":"Published","group":{"name":"publication_history","label":"Publication History"}}]}}