{"status":"ok","message-type":"work","message-version":"1.0.0","message":{"indexed":{"date-parts":[[2025,9,29]],"date-time":"2025-09-29T08:11:59Z","timestamp":1759133519951},"publisher-location":"Berlin, Heidelberg","reference-count":25,"publisher":"Springer Berlin Heidelberg","isbn-type":[{"type":"print","value":"9783642314636"},{"type":"electronic","value":"9783642314643"}],"content-domain":{"domain":[],"crossmark-restriction":false},"short-container-title":[],"published-print":{"date-parts":[[2012]]},"DOI":"10.1007\/978-3-642-31464-3_67","type":"book-chapter","created":{"date-parts":[[2012,7,2]],"date-time":"2012-07-02T15:20:38Z","timestamp":1341242438000},"page":"661-670","source":"Crossref","is-referenced-by-count":11,"title":["Enhancing Parallelism of Tile Bidiagonal Transformation on Multicore Architectures Using Tree Reduction"],"prefix":"10.1007","author":[{"given":"Hatem","family":"Ltaief","sequence":"first","affiliation":[]},{"given":"Piotr","family":"Luszczek","sequence":"additional","affiliation":[]},{"given":"Jack","family":"Dongarra","sequence":"additional","affiliation":[]}],"member":"297","reference":[{"key":"67_CR1","doi-asserted-by":"publisher","DOI":"10.1137\/1.9780898719604","volume-title":"LAPACK User\u2019s Guide","author":"E. Anderson","year":"1999","unstructured":"Anderson, E., Bai, Z., Bischof, C., Blackford, S.L., Demmel, J.W., Dongarra, J.J., Du Croz, J., Greenbaum, A., Hammarling, S., McKenney, A., Sorensen, D.C.: LAPACK User\u2019s Guide, 3rd edn. Society for Industrial and Applied Mathematics, Philadelphia (1999)","edition":"3"},{"doi-asserted-by":"crossref","unstructured":"Anderson, M., Ballard, G., Demmel, J., Keutzer, K.: Communication-avoiding QR decomposition for GPUs. In: Proceedings of IPDPS 2011, Anchorage, AK USA. ACM (2011)","key":"#cr-split#-67_CR2.1","DOI":"10.1109\/IPDPS.2011.15"},{"unstructured":"Also available as Technical Report UCB\/EECS-2010-131, February 18, 2011 and LAWN 240","key":"#cr-split#-67_CR2.2"},{"unstructured":"Ballard, G., Demmel, J., Dumitriu, I.: Minimizing communication for eigenproblems and the singular value decomposition (2010), arXiv:1011.3077","key":"67_CR3"},{"unstructured":"Balmino, G., Bruinsma, S., Marty, J.-C.: Numerical simulation of the gravity field recovery from GOCE mission data. In: Proceedings of the Second International GOCE User Workshop \u201dGOCE, The Geoid and Oceanography\u201d, March 8-10, ESA-ESRIN, Frascati, Italy (2004)","key":"67_CR4"},{"doi-asserted-by":"crossref","unstructured":"Bientinesi, P., Igual, F., Kressner, D., Quintana-Orti, E.: Reduction to Condensed Forms for Symmetric Eigenvalue Problems on Multi-core Architectures. In: Parallel Processing and Applied Mathemetics, pp. 387\u2013395 (2010)","key":"67_CR5","DOI":"10.1007\/978-3-642-14390-8_40"},{"issue":"4","key":"67_CR6","doi-asserted-by":"publisher","first-page":"602","DOI":"10.1145\/365723.365736","volume":"26","author":"C.H. Bischof","year":"2000","unstructured":"Bischof, C.H., Lang, B., Sun, X.: Algorithm 807: The SBR Toolbox\u2014software for successive band reduction. ACM Trans. Math. Softw.\u00a026(4), 602\u2013616 (2000)","journal-title":"ACM Trans. Math. Softw."},{"doi-asserted-by":"crossref","unstructured":"Bouwmeester, H., Jacquelin, M., Langou, J., Robert, Y.: Tiled QR factorization algorithms. Technical Report RR-7601, INRIA (2011)","key":"67_CR7","DOI":"10.1145\/2063384.2063393"},{"unstructured":"Demmel, J.W., Grigori, L., Hoemmen, M.F., Langou, J.: Communication-optimal parallel and sequential QR and LU factorizations. Technical Report 204, LAPACK Working Note (August 2008)","key":"67_CR8"},{"key":"67_CR9","volume-title":"Matrix Computations","author":"G. Golub","year":"1996","unstructured":"Golub, G., Van Loan, C.: Matrix Computations, 3rd edn. Johns Hopkins University Press, Baltimore (1996)","edition":"3"},{"issue":"3","key":"67_CR10","doi-asserted-by":"publisher","first-page":"799","DOI":"10.1137\/0907053","volume":"7","author":"G.H. Golub","year":"1986","unstructured":"Golub, G.H., Manneback, P., Toint, P.L.: A comparison between some direct and iterative methods for certain large scale geodetic least squares problems. SIAM J. Scientific Computing\u00a07(3), 799\u2013816 (1986)","journal-title":"SIAM J. Scientific Computing"},{"key":"67_CR11","doi-asserted-by":"publisher","first-page":"403","DOI":"10.1007\/BF02163027","volume":"14","author":"G.H. Golub","year":"1970","unstructured":"Golub, G.H., Reinsch, C.: Singular value decomposition and least squares solutions. Numer. Math.\u00a014, 403\u2013420 (1970)","journal-title":"Numer. Math."},{"doi-asserted-by":"crossref","unstructured":"Hadri, B., Ltaief, H., Agullo, E., Dongarra, J.: Tile QR factorization with parallel panel processing for multicore architectures. In: IPDPS, pp. 1\u201310. IEEE (2010)","key":"67_CR12","DOI":"10.1109\/IPDPS.2010.5470443"},{"key":"67_CR13","doi-asserted-by":"crossref","first-page":"417","DOI":"10.1037\/h0071325","volume":"24","author":"H. Hotelling","year":"1933","unstructured":"Hotelling, H.: Analysis of a complex of statistical variables into principal components. J. Educ. Psych.\u00a024, 417\u2013441, 498\u2013520 (1933)","journal-title":"J. Educ. Psych."},{"key":"67_CR14","doi-asserted-by":"publisher","first-page":"27","DOI":"10.1007\/BF02287921","volume":"1","author":"H. Hotelling","year":"1935","unstructured":"Hotelling, H.: Simplified calculation of principal components. Psychometrica\u00a01, 27\u201335 (1935)","journal-title":"Psychometrica"},{"doi-asserted-by":"crossref","unstructured":"Householder, A.S.: Unitary triangularization of a nonsymmetric matrix. Journal of the ACM (JACM)\u00a05(4) (October 1958), doi:10.1145\/320941.320947","key":"67_CR15","DOI":"10.1145\/320941.320947"},{"key":"67_CR16","doi-asserted-by":"publisher","first-page":"563","DOI":"10.1007\/s10543-008-0180-1","volume":"48","author":"B. K\u00e5gstr\u00f6m","year":"2008","unstructured":"K\u00e5gstr\u00f6m, B., Kressner, D., Quintana-Orti, E., Quintana-Orti, G.: Blocked Algorithms for the Reduction to Hessenberg-Triangular Form Revisited. BIT Numerical Mathematics\u00a048, 563\u2013584 (2008)","journal-title":"BIT Numerical Mathematics"},{"unstructured":"Ltaief, H., Luszczek, P., Dongarra, J.: High performance bidiagonal reduction using tile algorithms on homogeneous multicore architectures. Technical report, LAPACK Working Note 247 (2011)","key":"67_CR17"},{"doi-asserted-by":"crossref","unstructured":"Luszczek, P., Ltaief, H., Dongarra, J.: Two-stage tridiagonal reduction for dense symmetric matrices using tile algorithms on multicore architectures. In: Proceedings of IPDPS 2011, Anchorage, AK, USA. ACM (2011)","key":"67_CR18","DOI":"10.1109\/IPDPS.2011.91"},{"doi-asserted-by":"crossref","unstructured":"Moore, B.C.: Principal component analysis in linear systems: Controllability, observability, and model reduction. IEEE Transactions on Automatic Control\u00a0AC-26(1) (February 1981)","key":"67_CR19","DOI":"10.1109\/TAC.1981.1102568"},{"unstructured":"Song, F., Ltaief, H., Hadri, B., Dongarra, J.: Scalable tile communication-avoiding QR factorization on multicore cluster systems. In: Proceedings of SC 2010, New Orleans, Louisiana. ACM (November 2010), Also available as Technical Report UT-CS-10-653 March, 2011 and LAWN 241","key":"67_CR20"},{"issue":"1","key":"67_CR21","doi-asserted-by":"publisher","first-page":"50","DOI":"10.1109\/5992.814658","volume":"2","author":"G.W. Stewart","year":"2000","unstructured":"Stewart, G.W.: The decompositional approach to matrix computation. Computing in Science & Engineering\u00a02(1), 50\u201359 (2000), doi:10.1109\/5992.814658, ISSN: 1521-9615","journal-title":"Computing in Science & Engineering"},{"key":"67_CR22","doi-asserted-by":"publisher","DOI":"10.1137\/1.9780898719574","volume-title":"Numerical Linear Algebra","author":"L.N. Trefethen","year":"1997","unstructured":"Trefethen, L.N., Bau, D.: Numerical Linear Algebra. SIAM, Philadelphia (1997), \n                    \n                      http:\/\/www.siam.org\/books\/OT50\/Index.htm"},{"unstructured":"University of Tennessee. PLASMA Users\u2019 Guide, Parallel Linear Algebra Software for Multicore Archtectures, Version 2.2 (November 2009)","key":"67_CR23"},{"unstructured":"YarKhan, A., Kurzak, J., Dongarra, J.: QUARK users\u2019 guide: Queueing and runtime for kernels. Technical Report ICL-UT-11-02, University of Tennessee, Innovative Computing Laboratory (2011)","key":"67_CR24"}],"container-title":["Lecture Notes in Computer Science","Parallel Processing and Applied Mathematics"],"original-title":[],"link":[{"URL":"http:\/\/link.springer.com\/content\/pdf\/10.1007\/978-3-642-31464-3_67.pdf","content-type":"unspecified","content-version":"vor","intended-application":"similarity-checking"}],"deposited":{"date-parts":[[2021,5,4]],"date-time":"2021-05-04T12:02:28Z","timestamp":1620129748000},"score":1,"resource":{"primary":{"URL":"http:\/\/link.springer.com\/10.1007\/978-3-642-31464-3_67"}},"subtitle":[],"short-title":[],"issued":{"date-parts":[[2012]]},"ISBN":["9783642314636","9783642314643"],"references-count":25,"URL":"https:\/\/doi.org\/10.1007\/978-3-642-31464-3_67","relation":{},"ISSN":["0302-9743","1611-3349"],"issn-type":[{"type":"print","value":"0302-9743"},{"type":"electronic","value":"1611-3349"}],"subject":[],"published":{"date-parts":[[2012]]}}}