{"status":"ok","message-type":"work","message-version":"1.0.0","message":{"indexed":{"date-parts":[[2026,4,4]],"date-time":"2026-04-04T17:55:33Z","timestamp":1775325333137,"version":"3.50.1"},"publisher-location":"New York, NY, USA","reference-count":19,"publisher":"ACM","license":[{"start":{"date-parts":[[2009,11,14]],"date-time":"2009-11-14T00:00:00Z","timestamp":1258156800000},"content-version":"vor","delay-in-days":0,"URL":"https:\/\/www.acm.org\/publications\/policies\/copyright_policy#Background"}],"content-domain":{"domain":["dl.acm.org"],"crossmark-restriction":true},"short-container-title":[],"published-print":{"date-parts":[[2009,11,14]]},"DOI":"10.1145\/1654059.1654078","type":"proceedings-article","created":{"date-parts":[[2009,11,17]],"date-time":"2009-11-17T13:30:15Z","timestamp":1258464615000},"page":"1-11","update-policy":"https:\/\/doi.org\/10.1145\/crossmark-policy","source":"Crossref","is-referenced-by-count":613,"title":["Implementing sparse matrix-vector multiplication on throughput-oriented processors"],"prefix":"10.1145","author":[{"given":"Nathan","family":"Bell","sequence":"first","affiliation":[{"name":"NVIDIA Research"}]},{"given":"Michael","family":"Garland","sequence":"additional","affiliation":[{"name":"NVIDIA Research"}]}],"member":"320","published-online":{"date-parts":[[2009,11,14]]},"reference":[{"key":"e_1_3_2_1_1_1","doi-asserted-by":"crossref","unstructured":"E. Anderson Z. Bai C. Bischof S. Blackford J. Demmel J. Dongarra J. Du Croz A. Greenbaum S. Hammarling A. McKenney and D. Sorensen. LAPACK Users' Guide. Society for Industrial and Applied Mathematics Philadelphia PA third edition 1999.   E. Anderson Z. Bai C. Bischof S. Blackford J. Demmel J. Dongarra J. Du Croz A. Greenbaum S. Hammarling A. McKenney and D. Sorensen. LAPACK Users' Guide . Society for Industrial and Applied Mathematics Philadelphia PA third edition 1999.","DOI":"10.1137\/1.9780898719604"},{"key":"e_1_3_2_1_2_1","doi-asserted-by":"publisher","DOI":"10.1007\/978-3-540-85451-7_79"},{"key":"e_1_3_2_1_5_1","unstructured":"N. Bell and M. Garland. CUSP: Generic parallel algorithms for sparse matrix and graph computations. http:\/\/code.google.com\/p\/cusp-library\/ 2009-.  N. Bell and M. Garland. CUSP: Generic parallel algorithms for sparse matrix and graph computations. http:\/\/code.google.com\/p\/cusp-library\/ 2009-."},{"key":"e_1_3_2_1_6_1","doi-asserted-by":"publisher","DOI":"10.1006\/jpdc.1994.1038"},{"key":"e_1_3_2_1_8_1","doi-asserted-by":"publisher","DOI":"10.1080\/17445760802337010"},{"key":"e_1_3_2_1_9_1","unstructured":"CUDPP\n\n  \n  : CUDA Data-Parallel Primitives Library. http:\/\/www.gpgpu.org\/developer\/cudpp\/ 2009.  CUDPP: CUDA Data-Parallel Primitives Library. http:\/\/www.gpgpu.org\/developer\/cudpp\/ 2009."},{"key":"e_1_3_2_1_10_1","doi-asserted-by":"publisher","DOI":"10.1145\/1391469.1391473"},{"key":"e_1_3_2_1_12_1","doi-asserted-by":"publisher","DOI":"10.1177\/1094342004041296"},{"key":"e_1_3_2_1_13_1","doi-asserted-by":"publisher","DOI":"10.1137\/S1064827500366124"},{"key":"e_1_3_2_1_14_1","doi-asserted-by":"publisher","DOI":"10.1145\/355841.355847"},{"key":"e_1_3_2_1_15_1","doi-asserted-by":"publisher","DOI":"10.1109\/MM.2008.31"},{"key":"e_1_3_2_1_16_1","doi-asserted-by":"publisher","DOI":"10.1145\/1365490.1365500"},{"key":"e_1_3_2_1_17_1","unstructured":"NVIDIA Corporation. NVIDIA CUDA Programming Guide June 2008. Version 2.0.  NVIDIA Corporation. NVIDIA CUDA Programming Guide June 2008. Version 2.0."},{"key":"e_1_3_2_1_18_1","unstructured":"Y. Saad. SPARSKIT: A basic tool kit for sparse computations; Version 2 June 1994.  Y. Saad. SPARSKIT: A basic tool kit for sparse computations; Version 2 June 1994."},{"key":"e_1_3_2_1_19_1","doi-asserted-by":"publisher","DOI":"10.5555\/829576"},{"key":"e_1_3_2_1_20_1","first-page":"97","volume-title":"Graphics Hardware 2007","author":"Sengupta S.","year":"2007"},{"key":"e_1_3_2_1_21_1","doi-asserted-by":"publisher","DOI":"10.5555\/1413370.1413402"},{"key":"e_1_3_2_1_22_1","unstructured":"R. W. Vuduc. Automatic Performance Tuning of Sparse Matrix Kernels. PhD thesis University of California Berkeley 2003.   R. W. Vuduc. Automatic Performance Tuning of Sparse Matrix Kernels . PhD thesis University of California Berkeley 2003."},{"key":"e_1_3_2_1_23_1","doi-asserted-by":"publisher","DOI":"10.1145\/1362622.1362674"}],"event":{"name":"SC '09: International Conference for High Performance Computing, Networking, Storage and Analysis","location":"Portland Oregon","acronym":"SC '09","sponsor":["SIGARCH ACM Special Interest Group on Computer Architecture","IEEE-CS Computer Society"]},"container-title":["Proceedings of the Conference on High Performance Computing Networking, Storage and Analysis"],"original-title":[],"link":[{"URL":"https:\/\/dl.acm.org\/doi\/10.1145\/1654059.1654078","content-type":"unspecified","content-version":"vor","intended-application":"text-mining"},{"URL":"https:\/\/dl.acm.org\/doi\/pdf\/10.1145\/1654059.1654078","content-type":"unspecified","content-version":"vor","intended-application":"similarity-checking"}],"deposited":{"date-parts":[[2025,6,18]],"date-time":"2025-06-18T12:40:59Z","timestamp":1750250459000},"score":1,"resource":{"primary":{"URL":"https:\/\/dl.acm.org\/doi\/10.1145\/1654059.1654078"}},"subtitle":[],"short-title":[],"issued":{"date-parts":[[2009,11,14]]},"references-count":19,"alternative-id":["10.1145\/1654059.1654078","10.1145\/1654059"],"URL":"https:\/\/doi.org\/10.1145\/1654059.1654078","relation":{},"subject":[],"published":{"date-parts":[[2009,11,14]]},"assertion":[{"value":"2009-11-14","order":2,"name":"published","label":"Published","group":{"name":"publication_history","label":"Publication History"}}]}}