{"status":"ok","message-type":"work","message-version":"1.0.0","message":{"indexed":{"date-parts":[[2025,6,13]],"date-time":"2025-06-13T06:05:59Z","timestamp":1749794759443},"publisher-location":"Berlin, Heidelberg","reference-count":20,"publisher":"Springer Berlin Heidelberg","isbn-type":[{"type":"print","value":"9783642037696"},{"type":"electronic","value":"9783642037702"}],"license":[{"start":{"date-parts":[[2009,1,1]],"date-time":"2009-01-01T00:00:00Z","timestamp":1230768000000},"content-version":"unspecified","delay-in-days":0,"URL":"http:\/\/www.springer.com\/tdm"}],"content-domain":{"domain":[],"crossmark-restriction":false},"short-container-title":[],"published-print":{"date-parts":[[2009]]},"DOI":"10.1007\/978-3-642-03770-2_15","type":"book-chapter","created":{"date-parts":[[2009,9,2]],"date-time":"2009-09-02T07:52:09Z","timestamp":1251877929000},"page":"84-93","source":"Crossref","is-referenced-by-count":3,"title":["In-Memory Checkpointing for MPI Programs by XOR-Based Double-Erasure Codes"],"prefix":"10.1007","author":[{"given":"Gang","family":"Wang","sequence":"first","affiliation":[]},{"given":"Xiaoguang","family":"Liu","sequence":"additional","affiliation":[]},{"given":"Ang","family":"Li","sequence":"additional","affiliation":[]},{"given":"Fan","family":"Zhang","sequence":"additional","affiliation":[]}],"member":"297","reference":[{"key":"15_CR1","unstructured":"http:\/\/www.top500.org"},{"issue":"3","key":"15_CR2","first-page":"12","volume":"1","author":"F. Wu-Chun","year":"2005","unstructured":"Wu-Chun, F.: The Importance of Being Low Power in High Performance Computing. Cyberinfrastructure Technology Watch Quarterly\u00a01(3), 12\u201321 (2005)","journal-title":"Cyberinfrastructure Technology Watch Quarterly"},{"key":"15_CR3","unstructured":"Message Passing Interface Forum: MPI: A Message Passing Interface Standard. Technical report, University of Tennessee (1994)"},{"key":"15_CR4","doi-asserted-by":"crossref","unstructured":"Stellner, G.: CoCheck: Checkpointing and Process Migration for MPI. In: 10th International Parallel Processing Symposium, Honolulu, USA, pp. 526\u2013531 (1996)","DOI":"10.1109\/IPPS.1996.508106"},{"key":"15_CR5","doi-asserted-by":"crossref","unstructured":"Agbaria, A., Friedman, R.: Starfish: Fault-Tolerant Dynamic MPI Programs on Clusters of Workstations. In: 8th IEEE International Symposium on High Performance Distributed Computing, Redondo Beach, California, USA, pp. 167\u2013176 (1999)","DOI":"10.1109\/HPDC.1999.805295"},{"key":"15_CR6","doi-asserted-by":"crossref","unstructured":"Bosilca, G., Bouteiller, A., Cappello, F., Djilali, S., Fedak, G., Germain, C., Herault, T., Lemarinier, P., Lodygensky, O., Magniette, F., Neri, V., Selikhov, A.: MPICH-V: Toward a scalable fault tolerant MPI for volatile nodes. In: 2002 ACM\/IEEE conference on Supercomputing, Baltimore, Maryland, USA, pp. 1\u201318 (2002)","DOI":"10.1109\/SC.2002.10048"},{"key":"15_CR7","series-title":"Lecture Notes in Computer Science","doi-asserted-by":"publisher","first-page":"346","DOI":"10.1007\/3-540-45255-9_47","volume-title":"Recent Advances in Parallel Virtual Machine and Message Passing Interface","author":"G.E. Fagg","year":"2000","unstructured":"Fagg, G.E., Dongarra, J.: FT-MPI: Fault tolerant MPI, supporting dynamic applications in a dynamic world. In: Dongarra, J., Kacsuk, P., Podhorszki, N. (eds.) PVM\/MPI 2000. LNCS, vol.\u00a01908, pp. 346\u2013353. Springer, Heidelberg (2000)"},{"issue":"10","key":"15_CR8","doi-asserted-by":"publisher","first-page":"972","DOI":"10.1109\/71.730527","volume":"9","author":"J.S. Plank","year":"1998","unstructured":"Plank, J.S., Li, K., Puening, M.A.: Diskless checkpointing. IEEE Trans. Parallel Distrib. Syst.\u00a09(10), 972\u2013986 (1998)","journal-title":"IEEE Trans. Parallel Distrib. Syst."},{"key":"15_CR9","doi-asserted-by":"crossref","unstructured":"Chen, Z., Fagg, G., Gabriel, E., Langou, J., Angskun, T., Bosilca, G., Dongarra, J.: Fault Tolerant High Performance Computing by a Coding Approach. In: 10th ACM SIGPLAN Symposium on Principles and Practice of Parallel Programming, Chicago, IL, USA, pp. 213\u2013223 (2005)","DOI":"10.1145\/1065944.1065973"},{"key":"15_CR10","unstructured":"Liu, X.G., Wang, G., Zhang, Y., Li, A., Xie, F.: The Performance Of Erasure Codes Used In FT-MPI. In: 2nd International Forum on Information Technology and Applications, Chengdu, China (2005)"},{"key":"15_CR11","unstructured":"Plank, J.S.: Erasure Codes for Storage Applications. Tutorial. In: 4th Usenix Conference on File and Storage Technologies, San Francisco, CA, USA (2005)"},{"issue":"2","key":"15_CR12","doi-asserted-by":"publisher","first-page":"143","DOI":"10.1145\/176979.176981","volume":"26","author":"P.M. Chen","year":"1994","unstructured":"Chen, P.M., Lee, E.K., Gibson, G.A., Katz, R.H., Patterson, D.A.: RAID: High-Performance, Reliable Secondary Storage. ACM Computing Surveys\u00a026(2), 143\u2013185 (1994)","journal-title":"ACM Computing Surveys"},{"issue":"9","key":"15_CR13","doi-asserted-by":"publisher","first-page":"995","DOI":"10.1002\/(SICI)1097-024X(199709)27:9<995::AID-SPE111>3.0.CO;2-6","volume":"27","author":"J.S. Plank","year":"1997","unstructured":"Plank, J.S.: A Tutorial on Reed-Solomon Coding for Fault-Tolerance in RAID-like Systems. Software - Practice & Experience\u00a027(9), 995\u20131012 (1997)","journal-title":"Software - Practice & Experience"},{"key":"15_CR14","unstructured":"Corbett, P., English, B., Goel, A., Grcanac, T., Kleiman, S., Leong, J., Sankar, S.: Row-Diagonal Parity for Double Disk Failure Correction. In: 3rd USENIX Conference on File and Storage Technologies, San Francisco, CA, USA, pp. 1\u201314 (2004)"},{"key":"15_CR15","doi-asserted-by":"crossref","unstructured":"Blaum, M.: A Family of MDS Array Codes with Minimal Number of Encoding Operations. In: 2006 IEEE International Symposium on Information Theory, Washington, USA, pp. 2784\u20132788 (2006)","DOI":"10.1109\/ISIT.2006.261569"},{"issue":"6","key":"15_CR16","doi-asserted-by":"publisher","first-page":"1817","DOI":"10.1109\/18.782102","volume":"45","author":"L. Xu","year":"1999","unstructured":"Xu, L., Bohossian, V., Bruck, J., Wagner, D.G.: Low-Density MDS Codes and Factors of Complete Graphs. IEEE Trans. on Information Theory\u00a045(6), 1817\u20131826 (1999)","journal-title":"IEEE Trans. on Information Theory"},{"key":"15_CR17","volume-title":"Handbook of Combinatorial Designs","author":"C.J. Colbourn","year":"2007","unstructured":"Colbourn, C.J., Dinitz, J.H., et al.: Handbook of Combinatorial Designs, 2nd edn. CRC Press, Boca Raton (2007)","edition":"2"},{"key":"15_CR18","unstructured":"Plank, J.S.: The RAID-6 Liberation Codes. In: 6th USENIX Conference on File and Storage Technologies, San Francisco, USA, pp. 97\u2013110 (2008)"},{"key":"15_CR19","volume-title":"Introduction to Parallel Computing","author":"A. Grama","year":"2003","unstructured":"Grama, A., Gupta, A., Karypis, G., Kumar, V.: Introduction to Parallel Computing, 2nd edn. Addison Wesley, Edinburgh Gate (2003)","edition":"2"},{"key":"15_CR20","unstructured":"http:\/\/math.nist.gov\/MatrixMarket\/data\/Harwell-Boeing\/bcsstruc3\/bcsstk23.html"}],"container-title":["Lecture Notes in Computer Science","Recent Advances in Parallel Virtual Machine and Message Passing Interface"],"original-title":[],"link":[{"URL":"http:\/\/link.springer.com\/content\/pdf\/10.1007\/978-3-642-03770-2_15","content-type":"unspecified","content-version":"vor","intended-application":"similarity-checking"}],"deposited":{"date-parts":[[2019,5,22]],"date-time":"2019-05-22T09:57:05Z","timestamp":1558519025000},"score":1,"resource":{"primary":{"URL":"http:\/\/link.springer.com\/10.1007\/978-3-642-03770-2_15"}},"subtitle":[],"short-title":[],"issued":{"date-parts":[[2009]]},"ISBN":["9783642037696","9783642037702"],"references-count":20,"URL":"https:\/\/doi.org\/10.1007\/978-3-642-03770-2_15","relation":{},"ISSN":["0302-9743","1611-3349"],"issn-type":[{"type":"print","value":"0302-9743"},{"type":"electronic","value":"1611-3349"}],"subject":[],"published":{"date-parts":[[2009]]}}}