{"status":"ok","message-type":"work","message-version":"1.0.0","message":{"indexed":{"date-parts":[[2024,9,5]],"date-time":"2024-09-05T06:04:20Z","timestamp":1725516260381},"publisher-location":"Berlin, Heidelberg","reference-count":11,"publisher":"Springer Berlin Heidelberg","isbn-type":[{"type":"print","value":"9783540693833"},{"type":"electronic","value":"9783540693840"}],"license":[{"start":{"date-parts":[[2008,1,1]],"date-time":"2008-01-01T00:00:00Z","timestamp":1199145600000},"content-version":"tdm","delay-in-days":0,"URL":"http:\/\/www.springer.com\/tdm"}],"content-domain":{"domain":[],"crossmark-restriction":false},"short-container-title":[],"published-print":{"date-parts":[[2008]]},"DOI":"10.1007\/978-3-540-69384-0_98","type":"book-chapter","created":{"date-parts":[[2008,7,31]],"date-time":"2008-07-31T06:39:15Z","timestamp":1217486355000},"page":"935-944","source":"Crossref","is-referenced-by-count":2,"title":["Fast and Small Short Vector SIMD Matrix Multiplication Kernels for the Synergistic Processing Element of the CELL Processor"],"prefix":"10.1007","author":[{"given":"Wesley","family":"Alvaro","sequence":"first","affiliation":[]},{"given":"Jakub","family":"Kurzak","sequence":"additional","affiliation":[]},{"given":"Jack","family":"Dongarra","sequence":"additional","affiliation":[]}],"member":"297","reference":[{"key":"98_CR1","unstructured":"IBM Corporation: Cell Broadband Engine Programming Handbook, Version 1.1 (April 2007)"},{"issue":"5","key":"98_CR2","doi-asserted-by":"publisher","first-page":"11","DOI":"10.1109\/MC.2005.160","volume":"38","author":"D. Geer","year":"2005","unstructured":"Geer, D.: Industry Trends: Chip Makers Turn to Multicore Processors. Computer\u00a038(5), 11\u201313 (2005)","journal-title":"Computer"},{"key":"98_CR3","unstructured":"Asanovic, K., Bodik, R., Catanzaro, B.C., Gebis, J.J., Husbands, P., Keutzer, K., Patterson, D.A., Plishker, W.L., Shalf, J., Williams, S.W., Yelick, K.A.: The Landscape of Parallel Computing Research: A View from Berkeley. Technical Report UCB\/EECS-2006-183, Electrical Engineering and Computer Sciences Department, University of California, Berkeley (2006)"},{"key":"98_CR4","doi-asserted-by":"crossref","DOI":"10.1137\/1.9780898719611","volume-title":"Numerical Linear Algebra for High-Performance Computers","author":"J.J. Dongarra","year":"1998","unstructured":"Dongarra, J.J., Duff, I.S., Sorensen, D.C., van der Vorst, H.A.: Numerical Linear Algebra for High-Performance Computers. SIAM, Philadelphia (1998)"},{"key":"98_CR5","doi-asserted-by":"crossref","DOI":"10.1137\/1.9781611971446","volume-title":"Applied Numerical Linear Algebra","author":"J.W. Demmel","year":"1997","unstructured":"Demmel, J.W.: Applied Numerical Linear Algebra. SIAM, Philadelphia (1997)"},{"issue":"3","key":"98_CR6","doi-asserted-by":"publisher","first-page":"268","DOI":"10.1145\/292395.292412","volume":"24","author":"B. K\u00e5gstr\u00f6m","year":"1998","unstructured":"K\u00e5gstr\u00f6m, B., Ling, P., van Loan, C.: GEMM-Based Level 3 BLAS: High-Performance Model Implementations and Performance Evaluation Benchmark. ACM Trans. Math. Soft.\u00a024(3), 268\u2013302 (1998)","journal-title":"ACM Trans. Math. Soft."},{"issue":"2","key":"98_CR7","doi-asserted-by":"publisher","first-page":"103","DOI":"10.1002\/cpe.549","volume":"13","author":"D. Aberdeen","year":"2001","unstructured":"Aberdeen, D., Baxter, J.: Emmerald: A Fast Matrix-Matrix Multiply Using Intel\u2019s SSE Instructions. Concurrency Computat.: Pract. Exper.\u00a013(2), 103\u2013119 (2001)","journal-title":"Concurrency Computat.: Pract. Exper."},{"key":"98_CR8","doi-asserted-by":"crossref","unstructured":"Williams, S., Shalf, J., Oliker, L., Kamil, S., Husbands, P., Yelick, K.: The Potential of the Cell Processor for Scientific Computing. In: ACM International Conference on Computing Frontiers (2006)","DOI":"10.1145\/1128022.1128027"},{"key":"98_CR9","unstructured":"Chen, T., Raghavan, R., Dale, J., Iwata, E.: Cell Broadband Engine architecture and its first implementation, A performance view (November 2005), \n                    \n                      http:\/\/www-128.ibm.com\/developerworks\/power\/library\/pa-cellperf\/"},{"key":"98_CR10","unstructured":"Hackenberg, D.: Einsatz und Leistungsanalyse der Cell Broadband Engine. Institut f\u00fcr Technische Informatik, Fakult\u00e4t Informatik, Technische Universit\u00e4t Dresden, Gro\u00dfer Beleg (February 2007)"},{"key":"98_CR11","unstructured":"Hackenberg, D.: Fast matrix multiplication on CELL systems (July 2007), \n                    \n                      http:\/\/tu-dresden.de\/die_tu_dresden\/zentrale_einrichtungen\/zih\/forschun\/architektur_und_leistungsanalyse_von_hochleistungsrechnern\/cell\/"}],"container-title":["Lecture Notes in Computer Science","Computational Science \u2013 ICCS 2008"],"original-title":[],"language":"en","link":[{"URL":"http:\/\/link.springer.com\/content\/pdf\/10.1007\/978-3-540-69384-0_98","content-type":"unspecified","content-version":"vor","intended-application":"similarity-checking"}],"deposited":{"date-parts":[[2019,5,19]],"date-time":"2019-05-19T15:44:41Z","timestamp":1558280681000},"score":1,"resource":{"primary":{"URL":"http:\/\/link.springer.com\/10.1007\/978-3-540-69384-0_98"}},"subtitle":[],"short-title":[],"issued":{"date-parts":[[2008]]},"ISBN":["9783540693833","9783540693840"],"references-count":11,"URL":"https:\/\/doi.org\/10.1007\/978-3-540-69384-0_98","relation":{},"ISSN":["0302-9743","1611-3349"],"issn-type":[{"type":"print","value":"0302-9743"},{"type":"electronic","value":"1611-3349"}],"subject":[],"published":{"date-parts":[[2008]]}}}