{"status":"ok","message-type":"work","message-version":"1.0.0","message":{"indexed":{"date-parts":[[2024,9,15]],"date-time":"2024-09-15T14:21:55Z","timestamp":1726410115957},"publisher-location":"Berlin, Heidelberg","reference-count":32,"publisher":"Springer Berlin Heidelberg","isbn-type":[{"type":"print","value":"9783642233968"},{"type":"electronic","value":"9783642233975"}],"license":[{"start":{"date-parts":[[2011,1,1]],"date-time":"2011-01-01T00:00:00Z","timestamp":1293840000000},"content-version":"tdm","delay-in-days":0,"URL":"http:\/\/www.springer.com\/tdm"}],"content-domain":{"domain":["link.springer.com"],"crossmark-restriction":false},"short-container-title":[],"published-print":{"date-parts":[[2011]]},"DOI":"10.1007\/978-3-642-23397-5_34","type":"book-chapter","created":{"date-parts":[[2011,8,18]],"date-time":"2011-08-18T07:40:06Z","timestamp":1313653206000},"page":"340-352","update-policy":"http:\/\/dx.doi.org\/10.1007\/springer_crossmark_policy","source":"Crossref","is-referenced-by-count":3,"title":["Application-Specific Fault Tolerance via Data Access Characterization"],"prefix":"10.1007","author":[{"given":"Nawab","family":"Ali","sequence":"first","affiliation":[],"role":[{"role":"author","vocabulary":"crossref"}]},{"given":"Sriram","family":"Krishnamoorthy","sequence":"additional","affiliation":[],"role":[{"role":"author","vocabulary":"crossref"}]},{"given":"Niranjan","family":"Govind","sequence":"additional","affiliation":[],"role":[{"role":"author","vocabulary":"crossref"}]},{"given":"Karol","family":"Kowalski","sequence":"additional","affiliation":[],"role":[{"role":"author","vocabulary":"crossref"}]},{"given":"Ponnuswamy","family":"Sadayappan","sequence":"additional","affiliation":[],"role":[{"role":"author","vocabulary":"crossref"}]}],"member":"297","reference":[{"key":"34_CR1","unstructured":"EMSL Basis Set Exchange, \n                    \n                      https:\/\/bse.pnl.gov\/bse\/portal"},{"key":"34_CR2","unstructured":"HPCToolkit, \n                    \n                      http:\/\/hpctoolkit.org"},{"key":"34_CR3","unstructured":"MPI, \n                    \n                      http:\/\/www.mpi-forum.org"},{"key":"34_CR4","doi-asserted-by":"crossref","unstructured":"Ali, N., Krishnamoorthy, S., Govind, N., Palmer, B.: A redundant communication approach to scalable fault tolerance in PGAS programming models. In: 19th Euromicro International Conference on Parallel, Distributed, and Network-Based Computing, pp. 24\u201331 (February 2011)","DOI":"10.1109\/PDP.2011.72"},{"key":"34_CR5","doi-asserted-by":"crossref","unstructured":"Ali, N., Krishnamoorthy, S., Halappanavar, M., Daily, J.: Tolerating correlated failures for generalized cartesian distributions via bipartite matching. In: ACM International Conference on Computing Frontiers (May 2011)","DOI":"10.1145\/2016604.2016649"},{"issue":"1","key":"34_CR6","doi-asserted-by":"publisher","first-page":"291","DOI":"10.1103\/RevModPhys.79.291","volume":"79","author":"R.J. Bartlett","year":"2007","unstructured":"Bartlett, R.J., Musia\u0142, M.: Coupled-cluster theory in quantum chemistry. Reviews of Modern Physics\u00a079(1), 291\u2013352 (2007)","journal-title":"Reviews of Modern Physics"},{"issue":"4","key":"34_CR7","doi-asserted-by":"publisher","first-page":"410","DOI":"10.1016\/j.jpdc.2008.12.002","volume":"69","author":"G. Bosilca","year":"2009","unstructured":"Bosilca, G., Delmas, R., Dongarra, J., Langou, J.: Algorithm-based fault tolerance applied to high performance computing. Journal of Parallel and Distributed Computing\u00a069(4), 410\u2013416 (2009)","journal-title":"Journal of Parallel and Distributed Computing"},{"key":"34_CR8","doi-asserted-by":"crossref","unstructured":"Cappello, F., Guermouche, A., Snir, M.: On communication determinism in parallel HPC applications. In: 19th International Conference on Computer Communications and Networks, pp. 1\u20138 (August 2010)","DOI":"10.1109\/ICCCN.2010.5560143"},{"key":"34_CR9","doi-asserted-by":"crossref","unstructured":"Carns, P.H., Latham, R., Ross, R.B., Iskra, K., Lang, S., Riley, K.: 24\/7 characterization of petascale I\/O workloads. In: Proceedings of the First Workshop on Interfaces and Architectures for Scientific Data Storage, pp. 1\u201310 ( September 2009)","DOI":"10.1109\/CLUSTR.2009.5289150"},{"key":"34_CR10","unstructured":"Chen, Z., Dongarra, J.: Algorithm-based checkpoint-free fault tolerance for parallel matrix computations on volatile resources. In: Proceedings of the 20th International Parallel & Distributed Processing Symposium (April 2006)"},{"issue":"8","key":"34_CR11","doi-asserted-by":"publisher","first-page":"4088","DOI":"10.1063\/1.444319","volume":"77","author":"J.M. Cullen","year":"1982","unstructured":"Cullen, J.M., Zerner, M.C.: The linked singles and doubles model\u2013an approximate theory of electron correlation based on the coupled-cluster ansatz. The Journal of Chemical Physics\u00a077(8), 4088\u20134109 (1982)","journal-title":"The Journal of Chemical Physics"},{"issue":"3","key":"34_CR12","doi-asserted-by":"publisher","first-page":"375","DOI":"10.1145\/568522.568525","volume":"34","author":"E.N. Elnozahy","year":"2002","unstructured":"Elnozahy, E.N., Alvisi, L., Wang, Y.M., Johnson, D.B.: A survey of rollback-recovery protocols in message-passing systems. ACM Computing Surveys\u00a034(3), 375\u2013408 (2002)","journal-title":"ACM Computing Surveys"},{"issue":"2","key":"34_CR13","doi-asserted-by":"publisher","first-page":"97","DOI":"10.1109\/TDSC.2004.15","volume":"1","author":"E.N. Elnozahy","year":"2004","unstructured":"Elnozahy, E.N., Plank, J.S.: Checkpointing for peta-scale systems: A look into the future of practical rollback-recovery. IEEE Transactions on Dependable and Secure Computing\u00a01(2), 97\u2013108 (2004)","journal-title":"IEEE Transactions on Dependable and Secure Computing"},{"key":"34_CR14","doi-asserted-by":"crossref","unstructured":"Graham, S.L., Kessler, P.B., McKusick, M.K.: Gprof: A call graph execution profiler. In: Proceedings of the 1982 SIGPLAN Symposium on Compiler Construction, vol.\u00a017(6), pp. 120\u2013126 (1982)","DOI":"10.1145\/872726.806987"},{"issue":"1","key":"34_CR15","doi-asserted-by":"publisher","first-page":"124","DOI":"10.1002\/(SICI)1096-987X(19960115)17:1<124::AID-JCC10>3.0.CO;2-N","volume":"17","author":"R.J. Harrison","year":"1996","unstructured":"Harrison, R.J., et al.: Toward high-performance computational chemistry: II. a scalable self-consistent field program. Journal of Computational Chemistry\u00a017(1), 124\u2013132 (1996)","journal-title":"Journal of Computational Chemistry"},{"key":"34_CR16","volume-title":"Molecular Electronic-Structure Theory","author":"T. Helgaker","year":"2004","unstructured":"Helgaker, T., Jorgensen, P., Olsen, J.: Molecular Electronic-Structure Theory. John Wiley & Sons Ltd., Chichester (2004)"},{"issue":"26","key":"34_CR17","doi-asserted-by":"publisher","first-page":"6896","DOI":"10.1039\/c002859b","volume":"12","author":"W.A. Jong","year":"2010","unstructured":"Jong, W.A., et al.: Utilizing high performance computing for chemistry: parallel computational chemistry. Physical Chemistry Chemical Physics\u00a012(26), 6896\u20136920 (2010)","journal-title":"Physical Chemistry Chemical Physics"},{"issue":"4A","key":"34_CR18","doi-asserted-by":"publisher","first-page":"1133","DOI":"10.1103\/PhysRev.140.A1133","volume":"140","author":"W. Kohn","year":"1965","unstructured":"Kohn, W., Sham, L.J.: Self-consistent equations including exchange and correlation effects. Physical Review\u00a0140(4A), A1133\u2013A1138 (1965)","journal-title":"Physical Review"},{"key":"34_CR19","doi-asserted-by":"publisher","DOI":"10.1017\/CBO9780511805769","volume-title":"Electronic Structure: Basic Theory and Practical Methods","author":"R.M. Martin","year":"2004","unstructured":"Martin, R.M.: Electronic Structure: Basic Theory and Practical Methods. Cambridge University Press, Cambridge (2004)"},{"issue":"2","key":"34_CR20","doi-asserted-by":"publisher","first-page":"203","DOI":"10.1177\/1094342006064503","volume":"20","author":"J. Nieplocha","year":"2006","unstructured":"Nieplocha, J., Palmer, B., Tipparaju, V., Krishnan, M., Trease, H., Apr\u00e0, E.: Advances, applications and performance of the global arrays shared memory programming toolkit. International Journal of High Performance Computing Applications\u00a020(2), 203\u2013231 (2006)","journal-title":"International Journal of High Performance Computing Applications"},{"issue":"10","key":"34_CR21","doi-asserted-by":"publisher","first-page":"1075","DOI":"10.1109\/71.539739","volume":"7","author":"N. Nieuwejaar","year":"1996","unstructured":"Nieuwejaar, N., Kotz, D., Purakayastha, A., Sclatter Ellis, C., Best, M.: File-access characteristics of parallel scientific workloads. IEEE Transactions on Parallel and Distributed Systems\u00a07(10), 1075\u20131089 (1996)","journal-title":"IEEE Transactions on Parallel and Distributed Systems"},{"key":"34_CR22","volume-title":"Density-Functional Theory of Atoms and Molecules","author":"R.G. Parr","year":"1989","unstructured":"Parr, R.G., Yang, W.: Density-Functional Theory of Atoms and Molecules. Oxford University Press, Inc., New York (1989)"},{"key":"34_CR23","doi-asserted-by":"crossref","unstructured":"Perdew, J.P., Schmidt, K.: Jacob\u2019s ladder of density functional approximations for the exchange-correlation energy. In: AIP Conference Proceedings, vol.\u00a0577(1), pp. 1\u201320 (2001)","DOI":"10.1063\/1.1390175"},{"key":"34_CR24","unstructured":"PETSc, \n                    \n                      http:\/\/www.mcs.anl.gov\/petsc\/petsc-as\/"},{"issue":"4","key":"34_CR25","doi-asserted-by":"publisher","first-page":"1910","DOI":"10.1063\/1.443164","volume":"76","author":"G.D. Purvis","year":"1982","unstructured":"Purvis, G.D., Bartlett, R.J.: A full coupled-cluster singles and doubles model\u2013the inclusion of disconnected triples. The Journal of Chemical Physics\u00a076(4), 1910\u20131918 (1982)","journal-title":"The Journal of Chemical Physics"},{"key":"34_CR26","doi-asserted-by":"crossref","unstructured":"Roth, P.C.: Characterizing the I\/O behavior of scientific applications on the Cray XT. In: Proceedings of the International Workshop on Petascale Data Storage, Reno, NV, pp. 50\u201355 (2007)","DOI":"10.1145\/1374596.1374609"},{"key":"34_CR27","doi-asserted-by":"crossref","unstructured":"Schroeder, B., Gibson, G.A.: Understanding failures in petascale computers. Journal of Physics: Conference Series\u00a078(1) (2007)","DOI":"10.1088\/1742-6596\/78\/1\/012022"},{"key":"34_CR28","doi-asserted-by":"crossref","unstructured":"Schulz, M., de Supinski, B.R.: P\n                    N\n                  MPI tools: A whole lot greater than the sum of their parts. In: Proceedings of the ACM\/IEEE Conference on Supercomputing, pp. 1\u201310 (2007)","DOI":"10.1145\/1362622.1362663"},{"issue":"2","key":"34_CR29","doi-asserted-by":"publisher","first-page":"287","DOI":"10.1177\/1094342006064482","volume":"20","author":"S.S. Shende","year":"2006","unstructured":"Shende, S.S., Malony, A.D.: The TAU parallel performance system. International Journal of High Performance Computing Applications\u00a020(2), 287\u2013311 (2006)","journal-title":"International Journal of High Performance Computing Applications"},{"key":"34_CR30","volume-title":"Modern Quantum Chemistry","author":"A. Szabo","year":"1996","unstructured":"Szabo, A., Ostlund, N.S.: Modern Quantum Chemistry. McGraw-Hill Inc., New York (1996)"},{"issue":"1","key":"34_CR31","doi-asserted-by":"publisher","first-page":"49","DOI":"10.1177\/1094342005051521","volume":"19","author":"R. Thakur","year":"2005","unstructured":"Thakur, R., Rabenseifner, R., Gropp, W.: Optimization of collective communication operations in mpich. International Journal of High Performance Computing Applications\u00a019(1), 49\u201366 (2005)","journal-title":"International Journal of High Performance Computing Applications"},{"issue":"9","key":"34_CR32","doi-asserted-by":"publisher","first-page":"1477","DOI":"10.1016\/j.cpc.2010.04.018","volume":"181","author":"M. Valiev","year":"2010","unstructured":"Valiev, M., et al.: NWChem: A comprehensive and scalable open-source solution for large scale molecular simulations. Computer Physics Communications\u00a0181(9), 1477\u20131489 (2010)","journal-title":"Computer Physics Communications"}],"container-title":["Lecture Notes in Computer Science","Euro-Par 2011 Parallel Processing"],"original-title":[],"language":"en","link":[{"URL":"http:\/\/link.springer.com\/content\/pdf\/10.1007\/978-3-642-23397-5_34","content-type":"unspecified","content-version":"vor","intended-application":"similarity-checking"}],"deposited":{"date-parts":[[2020,4,20]],"date-time":"2020-04-20T00:46:09Z","timestamp":1587343569000},"score":1,"resource":{"primary":{"URL":"http:\/\/link.springer.com\/10.1007\/978-3-642-23397-5_34"}},"subtitle":[],"short-title":[],"issued":{"date-parts":[[2011]]},"ISBN":["9783642233968","9783642233975"],"references-count":32,"URL":"https:\/\/doi.org\/10.1007\/978-3-642-23397-5_34","relation":{},"ISSN":["0302-9743","1611-3349"],"issn-type":[{"type":"print","value":"0302-9743"},{"type":"electronic","value":"1611-3349"}],"subject":[],"published":{"date-parts":[[2011]]},"assertion":[{"value":"This content has been made available to all.","name":"free","label":"Free to read"}]}}