{"status":"ok","message-type":"work","message-version":"1.0.0","message":{"indexed":{"date-parts":[[2025,9,29]],"date-time":"2025-09-29T08:05:55Z","timestamp":1759133155627},"publisher-location":"Cham","reference-count":32,"publisher":"Springer International Publishing","isbn-type":[{"type":"print","value":"9783319143125"},{"type":"electronic","value":"9783319143132"}],"license":[{"start":{"date-parts":[[2014,1,1]],"date-time":"2014-01-01T00:00:00Z","timestamp":1388534400000},"content-version":"tdm","delay-in-days":0,"URL":"http:\/\/www.springer.com\/tdm"}],"content-domain":{"domain":["link.springer.com"],"crossmark-restriction":false},"short-container-title":[],"published-print":{"date-parts":[[2014]]},"DOI":"10.1007\/978-3-319-14313-2_49","type":"book-chapter","created":{"date-parts":[[2014,12,11]],"date-time":"2014-12-11T01:56:46Z","timestamp":1418263006000},"page":"577-588","update-policy":"http:\/\/dx.doi.org\/10.1007\/springer_crossmark_policy","source":"Crossref","is-referenced-by-count":6,"title":["ESSEX: Equipping Sparse Solvers for Exascale"],"prefix":"10.1007","author":[{"given":"Andreas","family":"Alvermann","sequence":"first","affiliation":[],"role":[{"role":"author","vocabulary":"crossref"}]},{"given":"Achim","family":"Basermann","sequence":"additional","affiliation":[],"role":[{"role":"author","vocabulary":"crossref"}]},{"given":"Holger","family":"Fehske","sequence":"additional","affiliation":[],"role":[{"role":"author","vocabulary":"crossref"}]},{"given":"Martin","family":"Galgon","sequence":"additional","affiliation":[],"role":[{"role":"author","vocabulary":"crossref"}]},{"given":"Georg","family":"Hager","sequence":"additional","affiliation":[],"role":[{"role":"author","vocabulary":"crossref"}]},{"given":"Moritz","family":"Kreutzer","sequence":"additional","affiliation":[],"role":[{"role":"author","vocabulary":"crossref"}]},{"given":"Lukas","family":"Kr\u00e4mer","sequence":"additional","affiliation":[],"role":[{"role":"author","vocabulary":"crossref"}]},{"given":"Bruno","family":"Lang","sequence":"additional","affiliation":[],"role":[{"role":"author","vocabulary":"crossref"}]},{"given":"Andreas","family":"Pieper","sequence":"additional","affiliation":[],"role":[{"role":"author","vocabulary":"crossref"}]},{"given":"Melven","family":"R\u00f6hrig-Z\u00f6llner","sequence":"additional","affiliation":[],"role":[{"role":"author","vocabulary":"crossref"}]},{"given":"Faisal","family":"Shahzad","sequence":"additional","affiliation":[],"role":[{"role":"author","vocabulary":"crossref"}]},{"given":"Jonas","family":"Thies","sequence":"additional","affiliation":[],"role":[{"role":"author","vocabulary":"crossref"}]},{"given":"Gerhard","family":"Wellein","sequence":"additional","affiliation":[],"role":[{"role":"author","vocabulary":"crossref"}]}],"member":"297","reference":[{"key":"49_CR1","unstructured":"Threading and GPGPU support in PETSc, \n                    \n                      http:\/\/www.mcs.anl.gov\/petsc\/features\/"},{"key":"49_CR2","unstructured":"Parallel Arnoldi package (PARPACK) homepage, \n                    \n                      http:\/\/www.caam.rice.edu\/~kristyn\/parpack_home.html"},{"key":"49_CR3","unstructured":"Anasazi package homepage, \n                    \n                      http:\/\/trilinos.sandia.gov\/packages\/anasazi\/"},{"key":"49_CR4","unstructured":"LAMA \u2014 Library for Accelerated Math Applications, \n                    \n                      http:\/\/www.libama.org"},{"key":"49_CR5","doi-asserted-by":"publisher","first-page":"221","DOI":"10.1007\/s00450-011-0159-z","volume":"26","author":"M. F\u00f6rster","year":"2011","unstructured":"F\u00f6rster, M., Kraus, J.: Scalable parallel AMG on ccNUMA machines with OpenMP. Computer Science - Research and Development\u00a026, 221\u2013228 (2011) ISSN 1865-2034","journal-title":"Computer Science - Research and Development"},{"key":"49_CR6","unstructured":"pOSKI: parallel optimized sparse kernel interface, \n                    \n                      http:\/\/bebop.cs.berkeley.edu\/poski"},{"key":"49_CR7","doi-asserted-by":"crossref","unstructured":"Bautista-Gomez, L., Tsuboi, S., Komatitsch, D., Cappello, F., Maruyama, N., Matsuoka, S.: FTI: high performance fault tolerance interface for hybrid systems. In: Proceedings of 2011 International Conference for High Performance Computing, Networking, Storage and Analysis, SC 2011, pp. 32:1\u201332:32. ACM, New York (2011)","DOI":"10.1145\/2063384.2063427"},{"key":"49_CR8","first-page":"351","volume-title":"Proceedings of the Twenty-Fifth International Symposium on Fault-Tolerant Computing, FTCS 1995","author":"J.S. Plank","year":"1995","unstructured":"Plank, J.S., Kim, Y., Dongarra, J.J.: Algorithm-based diskless checkpointing for fault-tolerant matrix operations. In: Proceedings of the Twenty-Fifth International Symposium on Fault-Tolerant Computing, FTCS 1995, pp. 351\u2013360. IEEE Computer Society, Washington, DC (1995)"},{"key":"49_CR9","first-page":"150","volume-title":"Symposium on Application Accelerators in High-Performance Computing","author":"M. Horton","year":"2011","unstructured":"Horton, M., Tomov, S., Dongarra, J.: A class of hybrid LAPACK algorithms for multicore and GPU architectures. In: Symposium on Application Accelerators in High-Performance Computing, pp. 150\u2013158. IEEE Computer Society, Los Alamitos (2011)"},{"key":"49_CR10","doi-asserted-by":"crossref","unstructured":"Hager, G., Treibig, J., Habich, J., Wellein, G.: Exploring performance and power properties of modern multicore chips via simple machine models. Concurrency Computat. Pract. Exper. (2013), doi:10.1002\/cpe.3180","DOI":"10.1002\/cpe.3180"},{"key":"49_CR11","doi-asserted-by":"publisher","first-page":"115112","DOI":"10.1103\/PhysRevB.79.115112","volume":"79","author":"E. Polizzi","year":"2009","unstructured":"Polizzi, E.: Density-matrix-based algorithm for solving eigenvalue problems. Phys. Rev. B\u00a079, 115112 (2009)","journal-title":"Phys. Rev. B"},{"key":"49_CR12","doi-asserted-by":"publisher","first-page":"275","DOI":"10.1103\/RevModPhys.78.275","volume":"78","author":"A. Wei\u00dfe","year":"2006","unstructured":"Wei\u00dfe, A., Wellein, G., Alvermann, A., Fehske, H.: The kernel polynomial method. Rev. Mod. Phys.\u00a078, 275 (2006)","journal-title":"Rev. Mod. Phys."},{"key":"49_CR13","doi-asserted-by":"publisher","first-page":"3967","DOI":"10.1063\/1.448136","volume":"81","author":"H. Tal-Ezer","year":"1984","unstructured":"Tal-Ezer, H., Kosloff, R.: An accurate and efficient scheme for propagating the time dependent Schr\u00f6dinger equation. J. Chem. Phys.\u00a081, 3967 (1984)","journal-title":"J. Chem. Phys."},{"key":"49_CR14","doi-asserted-by":"publisher","first-page":"2182","DOI":"10.1016\/j.physleta.2009.04.022","volume":"373","author":"H. Fehske","year":"2009","unstructured":"Fehske, H., Schleede, J., Schubert, G., Wellein, G., Filinov, V.S., Bishop, A.R.: Numerical approaches to time evolution of complex quantum systems. Phys. Lett. A\u00a0373, 2182 (2009)","journal-title":"Phys. Lett. A"},{"key":"49_CR15","doi-asserted-by":"publisher","first-page":"5930","DOI":"10.1016\/j.jcp.2011.04.006","volume":"230","author":"A. Alvermann","year":"2011","unstructured":"Alvermann, A., Fehske, H.: High-order commutator-free exponential time-propagation of driven quantum systems. J. Comp. Phys.\u00a0230, 5930 (2011)","journal-title":"J. Comp. Phys."},{"key":"49_CR16","unstructured":"di Napoli, E., Polizzi, E., Saad, Y.: Efficient estimation of eigenvalue counts in an interval, Preprint arXiv:1308.4275 (2013)"},{"key":"49_CR17","unstructured":"Bhardwaj, O., Ineichen, Y., Bekas, C., Curioni, A.: Highly scalable linear time estimation of spectrograms - a tool for very large scale data analysis. Poster at 2013 ACM\/IEEE International Conference on High Performance Computing Networking, Storage and Analysis (2013)"},{"key":"49_CR18","doi-asserted-by":"publisher","first-page":"195409","DOI":"10.1103\/PhysRevB.88.195409","volume":"88","author":"A. Pieper","year":"2013","unstructured":"Pieper, A., Schubert, G., Wellein, G., Fehske, H.: Effects of disorder and contacts on transport through graphene nanoribbons. Phys. Rev. B\u00a088, 195409 (2013)","journal-title":"Phys. Rev. B"},{"key":"49_CR19","doi-asserted-by":"publisher","first-page":"165121","DOI":"10.1103\/PhysRevB.89.165121","volume":"89","author":"A. Pieper","year":"2014","unstructured":"Pieper, A., Heinisch, R.L., Wellein, G., Fehske, H.: Dot-bound and dispersive states in graphene quantum dot superlattices. Phys. Rev. B\u00a089, 165121 (2014)","journal-title":"Phys. Rev. B"},{"key":"49_CR20","doi-asserted-by":"crossref","unstructured":"Kr\u00e4mer, L., Galgon, M., Lang, B., Alvermann, A., Fehske, H., Pieper, A.: Improving robustness of the FEAST algorithm and solving eigenvalue problems from graphene nanoribbons (Submitted to PAMM 2014)","DOI":"10.1002\/pamm.201410391"},{"key":"49_CR21","doi-asserted-by":"publisher","first-page":"1","DOI":"10.1016\/j.cam.2012.11.014","volume":"244","author":"L. Kr\u00e4mer","year":"2013","unstructured":"Kr\u00e4mer, L., Di Napoli, E., Galgon, M., Lang, B., Bientinesi, P.: Dissecting the FEAST algorithm for generalized eigenproblems. J. Comput. Appl. Math.\u00a0244, 1\u20139 (2013)","journal-title":"J. Comput. Appl. Math."},{"key":"49_CR22","unstructured":"Kr\u00e4mer, L.: Integration Based Solvers for Standard and Generalized Eigenvalue Problems. Ph.D. thesis, Bergische Universit\u00e4t Wuppertal (2014)"},{"key":"49_CR23","unstructured":"R\u00f6hrig-Z\u00f6llner, M., Thies, J., Kreutzer, M., Alvermann, A., Pieper, A., Basermann, A., Hager, G., Wellein, G., Fehske, H.: Increasing the performance of the Jacobi-Davidson method by blocking. SIAM J. Sci. Comput. (Submitted)"},{"key":"49_CR24","series-title":"Lecture Notes in Computer Science","doi-asserted-by":"publisher","first-page":"289","DOI":"10.1007\/978-3-642-33518-1_36","volume-title":"Recent Advances in the Message Passing Interface","author":"F. Shahzad","year":"2012","unstructured":"Shahzad, F., Wittmann, M., Zeiser, T., Wellein, G.: Asynchronous checkpointing by dedicated checkpoint threads. In: Tr\u00e4ff, J.L., Benkner, S., Dongarra, J.J. (eds.) EuroMPI 2012. LNCS, vol.\u00a07490, pp. 289\u2013290. Springer, Heidelberg (2012)"},{"issue":"04","key":"49_CR25","doi-asserted-by":"publisher","first-page":"13400111","DOI":"10.1142\/S0129626413400112","volume":"23","author":"F. Shahzad","year":"2013","unstructured":"Shahzad, F., Wittmann, M., Kreutzer, M., Zeiser, T., Hager, G., Wellein, G.: A survey of checkpoint\/restart techniques on distributed memory systems. Parallel Processing Letters\u00a023(04), 13400111\u2013134001120 (2013)","journal-title":"Parallel Processing Letters"},{"key":"49_CR26","doi-asserted-by":"crossref","unstructured":"Shahzad, F., Wittmann, M., Zeiser, T., Hager, G., Wellein, G.: An evaluation of different I\/O techniques for checkpoint\/restart. In: Proceedings of the 2013 IEEE 27th International Parallel and Distributed Processing Symposium Workshops & PhD Forum (IPDPSW), pp. 1708\u20131716. IEEE Computer Society (2013)","DOI":"10.1109\/IPDPSW.2013.145"},{"key":"49_CR27","unstructured":"Shahzad, F., Wittmann, M., Kreutzer, M., Zeiser, T., Hager, G., Wellein, G.: PGAS implementation of SPMVM and LBM with GPI. In: Proceedings of the 7th International Conference on PGAS Programming Models, pp. 172\u2013184 (2013)"},{"key":"49_CR28","doi-asserted-by":"crossref","unstructured":"Bell, N., Garland, M.: Implementing sparse matrix-vector multiplication on throughput-oriented processors. In:Proceedings of the Conference on High Performance Computing Networking, Storage and Analysis, SC 2009, pp. 18:1\u201318:11. ACM, New York (2009)","DOI":"10.1145\/1654059.1654078"},{"key":"49_CR29","doi-asserted-by":"crossref","unstructured":"Kreutzer, M., Hager, G., Wellein, G., Fehske, H., Bishop, A.: A unified sparse matrix data format for efficient general sparse matrix-vector multiplication on modern processors with wide SIMD units. SIAM Journal on Scientific Computing\u00a036(5), C401\u2013C423 (2014)","DOI":"10.1137\/130930352"},{"key":"49_CR30","doi-asserted-by":"crossref","unstructured":"M\u00fcthing, S., Ribbrock, D., G\u00f6ddeke, D.: Integrating multi-threading and accelerators into DUNE-ISTL. In: Proceedings of ENUMATH 2013 (accepted 2014)","DOI":"10.1007\/978-3-319-10705-9_59"},{"key":"49_CR31","unstructured":"Anzt, H., Tomov, S., Dongarra, J.: Implementing a sparse matrix vector product for the SELL-C\/SELL-C-\u03c3 formats on NVIDIA GPUs. Tech. rep. (March 2014), \n                    \n                      http:\/\/www.eecs.utk.edu\/resources\/library\/585"},{"key":"49_CR32","unstructured":"Intel Math Kernel Library (MKL), \n                    \n                      https:\/\/software.intel.com\/en-us\/intel-mkl"}],"container-title":["Lecture Notes in Computer Science","Euro-Par 2014: Parallel Processing Workshops"],"original-title":[],"language":"en","link":[{"URL":"http:\/\/link.springer.com\/content\/pdf\/10.1007\/978-3-319-14313-2_49","content-type":"unspecified","content-version":"vor","intended-application":"similarity-checking"}],"deposited":{"date-parts":[[2020,4,20]],"date-time":"2020-04-20T00:26:41Z","timestamp":1587342401000},"score":1,"resource":{"primary":{"URL":"http:\/\/link.springer.com\/10.1007\/978-3-319-14313-2_49"}},"subtitle":[],"short-title":[],"issued":{"date-parts":[[2014]]},"ISBN":["9783319143125","9783319143132"],"references-count":32,"URL":"https:\/\/doi.org\/10.1007\/978-3-319-14313-2_49","relation":{},"ISSN":["0302-9743","1611-3349"],"issn-type":[{"type":"print","value":"0302-9743"},{"type":"electronic","value":"1611-3349"}],"subject":[],"published":{"date-parts":[[2014]]},"assertion":[{"value":"This content has been made available to all.","name":"free","label":"Free to read"}]}}