{"status":"ok","message-type":"work","message-version":"1.0.0","message":{"indexed":{"date-parts":[[2024,9,9]],"date-time":"2024-09-09T16:00:41Z","timestamp":1725897641229},"publisher-location":"Berlin, Heidelberg","reference-count":16,"publisher":"Springer Berlin Heidelberg","isbn-type":[{"type":"print","value":"9783642368028"},{"type":"electronic","value":"9783642368035"}],"content-domain":{"domain":[],"crossmark-restriction":false},"short-container-title":[],"published-print":{"date-parts":[[2013]]},"DOI":"10.1007\/978-3-642-36803-5_22","type":"book-chapter","created":{"date-parts":[[2013,2,11]],"date-time":"2013-02-11T06:05:03Z","timestamp":1360562703000},"page":"309-318","source":"Crossref","is-referenced-by-count":0,"title":["Numprof: A Performance Analysis Framework for Numerical Libraries"],"prefix":"10.1007","author":[{"given":"Olli-Pekka","family":"Lehto","sequence":"first","affiliation":[]}],"member":"297","reference":[{"key":"22_CR1","first-page":"117","volume":"14","author":"J.J. Dongarra","year":"1986","unstructured":"Dongarra, J.J., Croz, J.D., Hammarling, S., Hanson, R.J.: An extended set of Fortran basic linear algebra subprograms. ACM Transactions on Mathematical Software\u00a014, 117 (1986)","journal-title":"ACM Transactions on Mathematical Software"},{"key":"22_CR2","doi-asserted-by":"crossref","unstructured":"Frigo, M., Johnson, S.G.: The design and implementation of fftw3. In: Proceedings of the IEEE, pp. 216\u2013231 (2005)","DOI":"10.1109\/JPROC.2004.840301"},{"key":"22_CR3","doi-asserted-by":"crossref","unstructured":"Graham, S.L., Kessler, P.B., McKusick, M.K.: gprof: a call graph execution profiler (1982)","DOI":"10.1145\/800230.806987"},{"key":"22_CR4","unstructured":"Myers, D.S., Bazinet, A.L.: Intercepting arbitrary functions on Windows, UNIX, and Macintosh OS X platforms. Institute for Advanced Computer Studies. University of Maryland, CS-TR-4585, UMIACS-TR-2004-28 (2004)"},{"key":"22_CR5","doi-asserted-by":"publisher","first-page":"50","DOI":"10.1145\/1374596.1374609","volume-title":"Proceedings of the 2nd International Workshop on Petascale Data Storage: held in Conjunction with Supercomputing 2007 (PDSW 2007)","author":"P.C. Roth","year":"2007","unstructured":"Roth, P.C.: Characterizing the i\/o behavior of scientific applications on the cray xt. In: Proceedings of the 2nd International Workshop on Petascale Data Storage: held in Conjunction with Supercomputing 2007 (PDSW 2007), pp. 50\u201355. ACM, New York (2007)"},{"key":"22_CR6","unstructured":"Sunderland, A., Pickles, S., Nikolic, M., Jovic, A., Jakic, J., Slavnic, V., Girotto, I., Nash, P., Lysaght, M.: An Analysis of FFT Performance in PRACE Application Codes, PRACE whitepaper (2012)"},{"key":"22_CR7","unstructured":"Benchmarking Single- and Multi-Core BLAS Implementations and GPUs for use with R, \n                    \n                      http:\/\/cran.r-project.org\/web\/packages\/gcbd\/vignettes\/gcbd.pdf"},{"key":"22_CR8","unstructured":"Boisvert, R.F., Boisvert, R.F., Pozo, R., Pozo, R., Remington, K.A., Remington, K.A.: The matrix market exchange formats: Initial design. NISTIR, 5935"},{"key":"22_CR9","doi-asserted-by":"crossref","unstructured":"Vetter, J.S., Mueller, F.: Communication characteristics of large-scale scientific applications for contemporary cluster architectures. In: International Parallel and Distributed Processing Symposium (2002)","DOI":"10.1109\/IPDPS.2002.1015504"},{"key":"22_CR10","series-title":"Lecture Notes in Computer Science","doi-asserted-by":"publisher","first-page":"83","DOI":"10.1007\/978-3-642-19328-6_10","volume-title":"High Performance Computing for Computational Science \u2013 VECPAR 2010","author":"R. Nath","year":"2011","unstructured":"Nath, R., Tomov, S., Dongarra, J.: Accelerating GPU Kernels for Dense Linear Algebra. In: Palma, J.M.L.M., Dayd\u00e9, M., Marques, O., Lopes, J.C. (eds.) VECPAR 2010. LNCS, vol.\u00a06449, pp. 83\u201392. Springer, Heidelberg (2011)"},{"key":"22_CR11","unstructured":"NVidia CUDA FFT Library, \n                    \n                      http:\/\/developer.nvidia.com\/cuda\/cufft"},{"key":"22_CR12","unstructured":"NVidia CUDA BLAS Library, \n                    \n                      http:\/\/developer.nvidia.com\/cublas"},{"key":"22_CR13","first-page":"2","volume-title":"Proceedings of the 1990 ACM\/IEEE Conference on Supercomputing, Supercomputing 1990","author":"E. Anderson","year":"1990","unstructured":"Anderson, E., Bai, Z., Dongarra, J., Greenbaum, A., McKenney, A., Du Croz, J., Hammerling, S., Demmel, J., Bischof, C., Sorensen, D.: Lapack: a portable linear algebra library for high-performance computers. In: Proceedings of the 1990 ACM\/IEEE Conference on Supercomputing, Supercomputing 1990, pp. 2\u201311. IEEE Computer Society Press, Los Alamitos (1990)"},{"key":"22_CR14","unstructured":"Simpson, A.D., Bull, M., Hill, J.: Identification and Categorisation of Applications and Initial Benchmarks Suite. PRACE Technical Report (2008)"},{"issue":"3","key":"22_CR15","doi-asserted-by":"publisher","first-page":"189","DOI":"10.1177\/109434200001400303","volume":"14","author":"S. Browne","year":"2000","unstructured":"Browne, S., Dongarra, J., Garner, N., Ho, G., Mucci, P.: A Portable Programming Interface for Performance Evaluation on Modern Processors. International Journal of High Performance Computing Applications\u00a014(3), 189\u2013204 (2000) (Fall)","journal-title":"International Journal of High Performance Computing Applications"},{"key":"22_CR16","unstructured":"Koziol, Q., Matzke, R.: HDF5 - A New Generation of HDF: Reference Manual and User\u2019s Guide. NCSA (1998)"}],"container-title":["Lecture Notes in Computer Science","Applied Parallel and Scientific Computing"],"original-title":[],"link":[{"URL":"http:\/\/link.springer.com\/content\/pdf\/10.1007\/978-3-642-36803-5_22","content-type":"unspecified","content-version":"vor","intended-application":"similarity-checking"}],"deposited":{"date-parts":[[2019,5,11]],"date-time":"2019-05-11T01:35:05Z","timestamp":1557538505000},"score":1,"resource":{"primary":{"URL":"http:\/\/link.springer.com\/10.1007\/978-3-642-36803-5_22"}},"subtitle":[],"short-title":[],"issued":{"date-parts":[[2013]]},"ISBN":["9783642368028","9783642368035"],"references-count":16,"URL":"https:\/\/doi.org\/10.1007\/978-3-642-36803-5_22","relation":{},"ISSN":["0302-9743","1611-3349"],"issn-type":[{"type":"print","value":"0302-9743"},{"type":"electronic","value":"1611-3349"}],"subject":[],"published":{"date-parts":[[2013]]}}}