{"status":"ok","message-type":"work","message-version":"1.0.0","message":{"indexed":{"date-parts":[[2025,3,28]],"date-time":"2025-03-28T10:06:43Z","timestamp":1743156403874,"version":"3.40.3"},"publisher-location":"Cham","reference-count":45,"publisher":"Springer International Publishing","isbn-type":[{"type":"print","value":"9783319065472"},{"type":"electronic","value":"9783319065489"}],"license":[{"start":{"date-parts":[[2014,1,1]],"date-time":"2014-01-01T00:00:00Z","timestamp":1388534400000},"content-version":"tdm","delay-in-days":0,"URL":"https:\/\/www.springernature.com\/gp\/researchers\/text-and-data-mining"},{"start":{"date-parts":[[2014,1,1]],"date-time":"2014-01-01T00:00:00Z","timestamp":1388534400000},"content-version":"vor","delay-in-days":0,"URL":"https:\/\/www.springernature.com\/gp\/researchers\/text-and-data-mining"}],"content-domain":{"domain":["link.springer.com"],"crossmark-restriction":false},"short-container-title":[],"published-print":{"date-parts":[[2014]]},"DOI":"10.1007\/978-3-319-06548-9_3","type":"book-chapter","created":{"date-parts":[[2014,7,3]],"date-time":"2014-07-03T08:32:46Z","timestamp":1404376366000},"page":"45-67","update-policy":"https:\/\/doi.org\/10.1007\/springer_crossmark_policy","source":"Crossref","is-referenced-by-count":3,"title":["Batch Matrix Exponentiation"],"prefix":"10.1007","author":[{"given":"M. Graham","family":"Lopez","sequence":"first","affiliation":[]},{"given":"Mitchel D.","family":"Horton","sequence":"additional","affiliation":[]}],"member":"297","published-online":{"date-parts":[[2014,6,9]]},"reference":[{"key":"3_CR1","unstructured":"AMD Core Math Library (ACML): www.amd.com\/acml. Cited 16 Dec 2013"},{"key":"3_CR2","doi-asserted-by":"publisher","DOI":"10.1016\/S0045-7825(99)00242X","author":"P.R. Amestoy","year":"2000","unstructured":"Amestoy, P.R., Duff, I.S., L\u2019Excellent, J.Y.: Multifrontal parallel distributed symmetric and unsymmetric solvers. Comput. Methods Appl. Mech. Eng. (2000). doi: 10.1016\/S0045-7825(99)00242X","journal-title":"Comput. Methods Appl. Mech. Eng."},{"key":"3_CR3","doi-asserted-by":"crossref","unstructured":"Anderson, E., Bai, Z., Bischof, C., Blackford, L.S., Demmel, J.W., Dongarra, J.J., Du Croz, J., Greenbaum, A., Hamarling, S., McKenney, A., Sorensen, D.: LAPACK Users\u2019 Guide. SIAM (1992). http:\/\/www.netlib.org\/lapack\/lug\/. Cited 16 Dec 2013","DOI":"10.2172\/5604546"},{"issue":"1","key":"3_CR4","doi-asserted-by":"publisher","first-page":"170","DOI":"10.1093\/sysbio\/syr100","volume":"61","author":"D.L. Ayres","year":"2012","unstructured":"Ayres, D.L., Darling, A., Zwickl, D.J., Beerli, P., Holder, M.T., Lewis, P.O., Huelsenbeck, J.P., Ronquist, F., Swofford, D.L., Cummings, M.P., Rambaut, A., Suchard, M.A.: BEAGLE: an application programming interface and high-performance computing library for statistical phylogenetics. Syst. Biol. 61(1), 170\u2013173 (2012)","journal-title":"Syst. Biol."},{"key":"3_CR5","unstructured":"Basic Linear Algebra Technical Forum: http:\/\/www.netlib.org\/blas\/blast-forum\/blas-report.pdf. Cited 16 Dec 2013"},{"key":"3_CR6","doi-asserted-by":"crossref","unstructured":"Blackford, L.S., Choi, J., Cleary, A., D\u2019Azevodo, E., Demmel, J., Dhillon, I., Dongarra, J.J., Hammarling, S., Henry, G., Petitet, A., Stanley, K., Walker, D., Whaley, R.C.: ScaLAPACK Users\u2019 Guide. SIAM (1997). http:\/\/www.netlib.org\/scalapack\/slug\/. Cited 16 Dec 2013","DOI":"10.1137\/1.9780898719642"},{"key":"3_CR7","unstructured":"CUBLAS: https:\/\/developer.nvidia.com\/cuBLAS. Cited 16 Dec 2013"},{"key":"3_CR8","unstructured":"CUBLAS Documentation: http:\/\/docs.nvidia.com\/cuda\/cublas\/. Cited 16 Dec 2013"},{"key":"3_CR9","unstructured":"CUDA C Programming Guide: http:\/\/docs.nvidia.com\/cuda\/cuda-c-programming-guide\/index.html. Cited 16 Dec 2013"},{"key":"3_CR10","unstructured":"CUDA Toolkit Documentation: http:\/\/docs.nvidia.com\/cuda\/cuda-samples\/. Cited 16 Dec 2013"},{"key":"3_CR11","unstructured":"CULA Tools: http:\/\/www.culatools.com\/blog\/2011\/12\/09\/batched-operations\/. Cited 16 Dec 2013"},{"key":"3_CR12","doi-asserted-by":"crossref","unstructured":"Demmel, J., Volkov, V.: Benchmarking GPUs to tune dense linear algebra. In: Proceedings of the 2008 ACM\/IEEE Conference on Supercomputing, vol. 31. IEEE Press, Piscataway (2008)","DOI":"10.1109\/SC.2008.5214359"},{"key":"3_CR13","doi-asserted-by":"publisher","DOI":"10.1137\/S0895479895291765","author":"J.W. Demmel","year":"1999","unstructured":"Demmel, J.W., Eisenstat, S.C., Gilbert, J.R., Li, X.S., Liu, J.W.H.: A supernodal approach to sparse partial pivoting. SIAM J. Matrix Anal. Appl. (1999). doi: 10.1137\/S0895479895291765","journal-title":"SIAM J. Matrix Anal. Appl."},{"key":"3_CR14","volume-title":"LAPACK working note 280: On Algorithmic Variants of Parallel Gaussian Elimination: Comparison of Implementations in Terms of Performance and Numerical Properties","author":"S. Donfack","year":"2013","unstructured":"Donfack, S., Dongarra, J., Faverge, M., Gates, M., Kurzak, J., Luszczek, P., Yamzaki, I.: LAPACK working note 280: On Algorithmic Variants of Parallel Gaussian Elimination: Comparison of Implementations in Terms of Performance and Numerical Properties. Innovative Computing Laboratory, University of Tennessee, Knoxville (2013)"},{"key":"3_CR15","volume-title":"Hydrodynamic Computation with Hybrid Programming on CPU-GPU Clusters","author":"T. Dong","year":"2013","unstructured":"Dong, T., Dovrev, V., Kolev, T., Rieben, R., Tomov, S., Dongarra, J.: Hydrodynamic Computation with Hybrid Programming on CPU-GPU Clusters. Innovative Computing Laboratory, University of Tennessee (2013)"},{"key":"3_CR16","doi-asserted-by":"publisher","DOI":"10.1002\/cpe.728","author":"J.J. Dongarra","year":"2003","unstructured":"Dongarra, J.J., Luszczek, P., Petitet, A.: The LINPACK benchmark: past, present and future. Concurr. Comput. Pract. Exp. (2003). doi: 10.1002\/cpe.728","journal-title":"Concurr. Comput. Pract. Exp."},{"key":"3_CR17","doi-asserted-by":"publisher","first-page":"214","DOI":"10.1186\/1471-2148-7-214","volume":"7","author":"A. Drummond","year":"2007","unstructured":"Drummond, A., Rambaut, A.: BEAST: Bayesian evolutionary analysis by sampling trees. BMC Evol. Biol. 7, 214 (2007)","journal-title":"BMC Evol. Biol."},{"key":"3_CR18","doi-asserted-by":"crossref","unstructured":"Drummond, A., Suchard, M., Xie, D., Rambaut, A.: Bayesian phylogenetics with BEAUti and the BEAST 1.7. Mol. Biol. Evol. 29(8), 1969\u20131973 (2012)","DOI":"10.1093\/molbev\/mss075"},{"key":"3_CR19","volume-title":"Biological Sequence Analysis: Probabilistic Models of Proteins and Nucleic Acids","author":"R. Durbin","year":"1997","unstructured":"Durbin, R., Eddy, S., Mitchison, G.: Biological Sequence Analysis: Probabilistic Models of Proteins and Nucleic Acids, 1st edn. Cambridge University Press, Cambridge (1997)","edition":"1"},{"key":"3_CR20","doi-asserted-by":"publisher","first-page":"368","DOI":"10.1007\/BF01734359","volume":"17","author":"J. Felsenstein","year":"1981","unstructured":"Felsenstein, J.: Evolutionary trees from DNA sequences: a maximum likelihood approach. J. Mol. Evol. 17, 368\u2013376 (1981)","journal-title":"J. Mol. Evol."},{"key":"3_CR21","volume-title":"Inferring Phylogenies","author":"J. Felsenstein","year":"2003","unstructured":"Felsenstein, J.: Inferring Phylogenies. Sinauer Associates, Sunderland (2003)"},{"key":"3_CR22","doi-asserted-by":"publisher","first-page":"707","DOI":"10.1016\/S0743-7315(03)00079-0","volume":"63","author":"X. Feng","year":"2003","unstructured":"Feng, X., Buell, D., Rose, J., Waddell, P.: Parallel algorithms for Bayesian phylogenetic inference. J. Parallel Distrib. Comput. 63, 707\u2013718 (2003)","journal-title":"J. Parallel Distrib. Comput."},{"key":"3_CR23","doi-asserted-by":"crossref","unstructured":"Feng, X., Cameron, K., Sosa, C., Smith, B.: Building the tree of life on terascale systems. In: Parallel Distributed Processing Symposium (IPDPS 2007), Washington (2007)","DOI":"10.1109\/IPDPS.2007.370214"},{"key":"3_CR24","unstructured":"GoToBLAS: Texas Advanced Computing Center. http:\/\/www.tacc.utexas.edu\/. Cited 16 Dec 2013"},{"issue":"2","key":"3_CR25","doi-asserted-by":"publisher","first-page":"160","DOI":"10.1007\/BF02101694","volume":"22","author":"M. Hasegawa","year":"1985","unstructured":"Hasegawa, M., Kishino, H., Yano, T.: Dating of the human-ape splitting by a molecular clock of mitochondrial DNA. J. Mol. Evol. 22(2), 160\u2013174 (1985)","journal-title":"J. Mol. Evol."},{"key":"3_CR26","doi-asserted-by":"publisher","first-page":"754","DOI":"10.1093\/bioinformatics\/17.8.754","volume":"17","author":"J.P. Huelsenbeck","year":"2001","unstructured":"Huelsenbeck, J.P., Ronquist, F.: MrBayes: Bayesian inference of phylogenetic trees. Bioinformatics 17, 754\u2013755 (2001)","journal-title":"Bioinformatics"},{"issue":"5550","key":"3_CR27","doi-asserted-by":"publisher","first-page":"2310","DOI":"10.1126\/science.1065889","volume":"294","author":"J.P. Huelsenbeck","year":"2001","unstructured":"Huelsenbeck, J.P., Ronquist, F., Nielsen, R., Bollback, J.P.: Bayesian inference of phylogeny and its impact on evolutionary biology. Science 294(5550), 2310\u20132314 (2001)","journal-title":"Science"},{"key":"3_CR28","unstructured":"IBM: Engineering and Scientific Subroutine Library (ESSL) and parallel ESSL. http:\/\/www-03.ibm.com\/systems\/p\/software\/essl. Cited 16 Dec 2013"},{"key":"3_CR29","unstructured":"Jhurani, C., Mullowney, P.: A GEMM interface and implementation on NVIDIA GPUs for multiple small matrices. www.ices.utexas.edu\/$\\char126$chetan\/preprints\/2013-CJ-PM-GEMM.pdf. Cited 16 Dec 2013"},{"key":"3_CR30","first-page":"969974","volume":"21","author":"T. Keane","year":"2005","unstructured":"Keane, T., Naughton, T., Travers, S., McInerney, J., McCormack, G.: DPRml: distributed phylogeny reconstruction by maximum likelihood. Bioinformatics 21, 969974 (2005)","journal-title":"Bioinformatics"},{"key":"3_CR31","unstructured":"Keeneland: http:\/\/keeneland.gatech.edu\/. Cited 29 Jan 2014"},{"key":"3_CR32","unstructured":"Kepler Whitepaper: http:\/\/www.nvidia.com\/content\/PDF\/kepler\/NVIDIA-Kepler-GK110-Architecture-Whitepaper.pdf. Cited 16 Dec 2013"},{"key":"3_CR33","volume-title":"LAPACK Working Note 245: Autotuning GEMMs for Fermi","author":"J. Kurzak","year":"2011","unstructured":"Kurzak, J., Tomov, S., Dongarra, J.: LAPACK Working Note 245: Autotuning GEMMs for Fermi. Innovative Computing Laboratory, University of Tennessee (2011)"},{"key":"3_CR34","doi-asserted-by":"crossref","DOI":"10.2172\/1173292","volume-title":"LAPACK Working Note 267: Preliminary Results of Autotuning Gemm Kernels for the NVIDIA Kepler Architecture","author":"J. Kurzak","year":"2012","unstructured":"Kurzak, J., Luszczek, P., Tomov, S., Dongarra, J.: LAPACK Working Note 267: Preliminary Results of Autotuning Gemm Kernels for the NVIDIA Kepler Architecture. Innovative Computing Laboratory, University of Tennessee (2012)"},{"key":"3_CR35","unstructured":"Math Kernel Library (MKL): Intel(R). http:\/\/www.intel.com\/cd\/software\/products\/asmo-na\/eng.347757.htm. Cited 16 Dec 2013"},{"key":"3_CR36","doi-asserted-by":"publisher","first-page":"3794","DOI":"10.1093\/bioinformatics\/bti594","volume":"21","author":"B. Minh","year":"2005","unstructured":"Minh, B., Vinh, L., Haeseler, A., Schmidt, H.: pIQPNNI: parallel reconstruction of large maximum likelihood phylogenies. Bioinformatics 21, 3794\u20133796 (2005)","journal-title":"Bioinformatics"},{"key":"3_CR37","doi-asserted-by":"publisher","DOI":"10.1137\/S00361445024180","author":"C. Moler","year":"2003","unstructured":"Moler, C., Van Loan, C.: Nineteen dubious ways to compute the exponential of a matrix, twenty-five years later. SIAM Rev. (2003). doi: 10.1137\/S00361445024180","journal-title":"SIAM Rev."},{"key":"3_CR38","doi-asserted-by":"publisher","first-page":"99","DOI":"10.1023\/A:1014362705613","volume":"22","author":"B. Moret","year":"2002","unstructured":"Moret, B., Badar, D., Warnow, T.: High-performance algorithm engineering for computational phylogenetics. J. Supercomput. 22, 99\u201311 (2002)","journal-title":"J. Supercomput."},{"issue":"4","key":"3_CR39","doi-asserted-by":"publisher","first-page":"511","DOI":"10.1177\/1094342010385729","volume":"24","author":"R. Nath","year":"2010","unstructured":"Nath, R., Tomov, S., Dongarra, J.: An improved MAGMA GEMM for Fermi GPUs. Int. J. High Perform. Comput. 24(4), 511\u2013515 (2010)","journal-title":"Int. J. High Perform. Comput."},{"issue":"2","key":"3_CR40","first-page":"503","volume":"18","author":"H. Schmidt","year":"2002","unstructured":"Schmidt, H., Strimmer, K., Vingron, M., Haeseler, A.: TREE-PUZZLE: maximum likelihood phylogenetic analysis using quartets and parallel computing. Bioinformatics 18(2), 503\u2013504 (2002)","journal-title":"Bioinformatics"},{"issue":"4","key":"3_CR41","doi-asserted-by":"publisher","first-page":"456","DOI":"10.1093\/bioinformatics\/bti191","volume":"21","author":"A. Stamatakis","year":"2005","unstructured":"Stamatakis, A., Meier, L.T.: RAxML-III: a fast program for maximum likelihood-based inference of large phylogenetic trees. Bioinformatics 21(4), 456\u2013463 (2005)","journal-title":"Bioinformatics"},{"key":"3_CR42","doi-asserted-by":"publisher","first-page":"1370","DOI":"10.1093\/bioinformatics\/btp244","volume":"25","author":"M. Suchard","year":"2009","unstructured":"Suchard, M., Rambaut, A.: Many-core algorithms for statistical phylogenetics. Bioinformatics 25, 1370\u20131376 (2009)","journal-title":"Bioinformatics"},{"issue":"4","key":"3_CR43","doi-asserted-by":"publisher","first-page":"1701","DOI":"10.1214\/aos\/1176325750","volume":"22","author":"L. Tierney","year":"1994","unstructured":"Tierney, L.: Markov chains for exploring posterior distributions. Ann. Stat. 22(4), 1701\u20131728 (1994)","journal-title":"Ann. Stat."},{"issue":"1\u20132","key":"3_CR44","doi-asserted-by":"publisher","first-page":"3","DOI":"10.1016\/S0167-8191(00)00087-9","volume":"27","author":"C.R. Whaley","year":"2001","unstructured":"Whaley, C.R., Petitet, A., Dongarra, J.: Automated empirical optimizations of software and the ATLAS project. Parallel Comput. 27(1\u20132), 3\u201335 (2001)","journal-title":"Parallel Comput."},{"key":"3_CR45","volume-title":"Genetic algorithm approaches for the phylogenetic analysis of large biological sequence datasets under the maximum likelihood criterion","author":"D. Zwickl","year":"2006","unstructured":"Zwickl, D.: Genetic algorithm approaches for the phylogenetic analysis of large biological sequence datasets under the maximum likelihood criterion. Ph.D. dissertation, University of Texas, Austin (2006)"}],"container-title":["Numerical Computations with GPUs"],"original-title":[],"language":"en","link":[{"URL":"https:\/\/link.springer.com\/content\/pdf\/10.1007\/978-3-319-06548-9_3","content-type":"unspecified","content-version":"vor","intended-application":"similarity-checking"}],"deposited":{"date-parts":[[2023,1,19]],"date-time":"2023-01-19T20:57:59Z","timestamp":1674161879000},"score":1,"resource":{"primary":{"URL":"https:\/\/link.springer.com\/10.1007\/978-3-319-06548-9_3"}},"subtitle":[],"short-title":[],"issued":{"date-parts":[[2014]]},"ISBN":["9783319065472","9783319065489"],"references-count":45,"URL":"https:\/\/doi.org\/10.1007\/978-3-319-06548-9_3","relation":{},"subject":[],"published":{"date-parts":[[2014]]},"assertion":[{"value":"9 June 2014","order":1,"name":"first_online","label":"First Online","group":{"name":"ChapterHistory","label":"Chapter History"}}]}}