{"status":"ok","message-type":"work","message-version":"1.0.0","message":{"indexed":{"date-parts":[[2026,4,21]],"date-time":"2026-04-21T15:27:43Z","timestamp":1776785263620,"version":"3.51.2"},"reference-count":23,"publisher":"IEEE","content-domain":{"domain":[],"crossmark-restriction":false},"short-container-title":[],"published-print":{"date-parts":[[2008,11]]},"DOI":"10.1109\/sc.2008.5214359","type":"proceedings-article","created":{"date-parts":[[2009,8,28]],"date-time":"2009-08-28T10:48:47Z","timestamp":1251456527000},"page":"1-11","source":"Crossref","is-referenced-by-count":427,"title":["Benchmarking GPUs to tune dense linear algebra"],"prefix":"10.1109","author":[{"given":"V.","family":"Volkov","sequence":"first","affiliation":[]},{"given":"J.W.","family":"Demmel","sequence":"additional","affiliation":[]}],"member":"263","reference":[{"key":"19","year":"0"},{"key":"22","year":"0"},{"key":"17","doi-asserted-by":"publisher","DOI":"10.1145\/1362622.1362684"},{"key":"23","doi-asserted-by":"publisher","DOI":"10.1145\/1345206.1345220"},{"key":"18","year":"0"},{"key":"15","doi-asserted-by":"publisher","DOI":"10.1145\/1188455.1188549"},{"key":"16","doi-asserted-by":"publisher","DOI":"10.1145\/1058129.1058148"},{"key":"13","year":"0"},{"key":"14","doi-asserted-by":"publisher","DOI":"10.1109\/SC.2005.42"},{"key":"11","year":"0"},{"key":"12","doi-asserted-by":"publisher","DOI":"10.1145\/77626.79170"},{"key":"21","year":"2008","journal-title":"NVIDIA GeForce GTX 200 GPU Architectural Overview"},{"key":"3","doi-asserted-by":"crossref","first-page":"2","DOI":"10.1109\/SUPERC.1990.129995","article-title":"lapack: a portable linear algebra library for high-performance computers","volume":"90","author":"anderson","year":"1990","journal-title":"Supercomputing"},{"key":"20","year":"2008","journal-title":"NVIDIA CUDA Compute Unified Device Architecture Programming Guide"},{"key":"2","year":"0"},{"key":"1","year":"0"},{"key":"10","year":"0"},{"key":"7","doi-asserted-by":"publisher","DOI":"10.1145\/1375527.1375562"},{"key":"6","article-title":"solving dense linear systems on graphics processors","author":"barrachina","year":"2008","journal-title":"Technical Report ICC"},{"key":"5","year":"0"},{"key":"4","article-title":"linpack benchmark optimizations on a virtual processor grid","author":"anderson","year":"2004","journal-title":"Cray User Group 2004 Proceedings"},{"key":"9","year":"0"},{"key":"8","doi-asserted-by":"publisher","DOI":"10.1007\/3-540-53065-7_101"}],"event":{"name":"2008 SC - International Conference for High Performance Computing, Networking, Storage and Analysis","location":"Austin, TX","start":{"date-parts":[[2008,11,15]]},"end":{"date-parts":[[2008,11,21]]}},"container-title":["2008 SC - International Conference for High Performance Computing, Networking, Storage and Analysis"],"original-title":[],"link":[{"URL":"http:\/\/xplorestaging.ieee.org\/ielx5\/5206875\/5213127\/05214359.pdf?arnumber=5214359","content-type":"unspecified","content-version":"vor","intended-application":"similarity-checking"}],"deposited":{"date-parts":[[2017,6,18]],"date-time":"2017-06-18T19:16:52Z","timestamp":1497813412000},"score":1,"resource":{"primary":{"URL":"http:\/\/ieeexplore.ieee.org\/document\/5214359\/"}},"subtitle":[],"short-title":[],"issued":{"date-parts":[[2008,11]]},"references-count":23,"URL":"https:\/\/doi.org\/10.1109\/sc.2008.5214359","relation":{},"subject":[],"published":{"date-parts":[[2008,11]]}}}