{"status":"ok","message-type":"work","message-version":"1.0.0","message":{"indexed":{"date-parts":[[2026,1,21]],"date-time":"2026-01-21T14:18:41Z","timestamp":1769005121064,"version":"3.49.0"},"reference-count":37,"publisher":"IEEE","content-domain":{"domain":[],"crossmark-restriction":false},"short-container-title":[],"published-print":{"date-parts":[[2014,9]]},"DOI":"10.1109\/cluster.2014.6968768","type":"proceedings-article","created":{"date-parts":[[2014,12,2]],"date-time":"2014-12-02T22:40:03Z","timestamp":1417560003000},"page":"103-112","source":"Crossref","is-referenced-by-count":32,"title":["Digging deeper into cluster system logs for failure prediction and root cause diagnosis"],"prefix":"10.1109","author":[{"given":"Xiaoyu","family":"Fu","sequence":"first","affiliation":[]},{"given":"Rui","family":"Ren","sequence":"additional","affiliation":[]},{"given":"Sally A.","family":"McKee","sequence":"additional","affiliation":[]},{"given":"Jianfeng","family":"Zhan","sequence":"additional","affiliation":[]},{"given":"Ninghui","family":"Sun","sequence":"additional","affiliation":[]}],"member":"263","reference":[{"key":"19","first-page":"476","article-title":"Filtering failure logs for a bluegene\/l prototype","author":"liang","year":"2005","journal-title":"International Conference on Dependable Systems and Networks"},{"key":"35","doi-asserted-by":"publisher","DOI":"10.1109\/DSN.2009.5270289"},{"key":"17","doi-asserted-by":"crossref","first-page":"652","DOI":"10.1016\/j.jpdc.2009.03.007","article-title":"An analysis of clustered failures on large supercomputing systems","volume":"69","author":"hacker","year":"2009","journal-title":"Elsever Trans Journal of Parallel and Distributed Computing"},{"key":"36","doi-asserted-by":"publisher","DOI":"10.1109\/DSNW.2010.5542627"},{"key":"18","doi-asserted-by":"publisher","DOI":"10.1145\/1401890.1401938"},{"key":"33","doi-asserted-by":"publisher","DOI":"10.1109\/DSNW.2011.5958823"},{"key":"15","doi-asserted-by":"publisher","DOI":"10.1109\/ICPP.2008.17"},{"key":"34","first-page":"28","article-title":"Context-based online configuration-error detection","author":"yuan","year":"2011","journal-title":"USENIX Annual Technical Conference"},{"key":"16","first-page":"40","article-title":"A meta-learning failure predictor for blue gene\/l systems","author":"gujrati","year":"2007","journal-title":"International Conference on Parallel Processing"},{"key":"13","doi-asserted-by":"publisher","DOI":"10.1007\/978-3-642-23400-2_6"},{"key":"14","doi-asserted-by":"publisher","DOI":"10.1109\/IPDPS.2012.107"},{"key":"37","doi-asserted-by":"publisher","DOI":"10.1145\/2371536.2371571"},{"key":"11","doi-asserted-by":"publisher","DOI":"10.1109\/SRDS.2012.40"},{"key":"12","first-page":"4","article-title":"Adaptive event prediction strategy with dynamic time window for largescale hpc systems","author":"gainaru","year":"2011","journal-title":"SOSP Workshop on Managing Large-Scale Systems Via the Analysis of System Logs and the Application of Machine Learning Techniques"},{"key":"21","first-page":"398","article-title":"A log mining approach to failure analysis of enterprise telephony systems","author":"lim","year":"2008","journal-title":"International Conference on Dependable Systems and Networks"},{"key":"20","doi-asserted-by":"publisher","DOI":"10.1109\/ICDM.2007.46"},{"key":"22","year":"0"},{"key":"23","doi-asserted-by":"publisher","DOI":"10.1145\/1592568.1592596"},{"key":"24","doi-asserted-by":"publisher","DOI":"10.1109\/DSN.2004.1311948"},{"key":"25","doi-asserted-by":"publisher","DOI":"10.1109\/DSN.2006.5"},{"key":"26","doi-asserted-by":"publisher","DOI":"10.1109\/ARES.2009.105"},{"key":"27","doi-asserted-by":"publisher","DOI":"10.1109\/DSN.2012.6263917"},{"key":"28","author":"tooley","year":"1987","journal-title":"Causation A Realist Approach"},{"key":"29","doi-asserted-by":"publisher","DOI":"10.1038\/30918"},{"key":"3","first-page":"227","article-title":"One graph is worth a thousand logs: Uncovering hidden structures in massive system event logs","volume":"5781","author":"aharon","year":"2009","journal-title":"European Conference on Machine Learning and Principles and Practices of Knowledge Discovery in Databases 2009"},{"key":"2","doi-asserted-by":"publisher","DOI":"10.1109\/DSN.2010.5544270"},{"key":"10","doi-asserted-by":"publisher","DOI":"10.1145\/1362622.1362678"},{"key":"1","first-page":"60","article-title":"An overview of the BlueGene\/L supercomputer","author":"adiga","year":"2002","journal-title":"Supercomputing Nov"},{"key":"30","doi-asserted-by":"publisher","DOI":"10.1016\/j.jpdc.2012.09.007"},{"key":"7","doi-asserted-by":"publisher","DOI":"10.1109\/SRDS.2013.20"},{"key":"6","doi-asserted-by":"publisher","DOI":"10.1109\/HIPC.2010.5713159"},{"key":"32","doi-asserted-by":"publisher","DOI":"10.1109\/GRID.2010.5697961"},{"key":"5","first-page":"94","article-title":"Log analytics for dependable enterprise telephony","author":"chen","year":"2012","journal-title":"European Dependable Computing Conference"},{"key":"31","doi-asserted-by":"publisher","DOI":"10.1109\/ICDM.2009.19"},{"key":"4","doi-asserted-by":"publisher","DOI":"10.1109\/IPDPS.2013.74"},{"key":"9","doi-asserted-by":"publisher","DOI":"10.1109\/SRDS.2007.18"},{"key":"8","doi-asserted-by":"publisher","DOI":"10.1109\/DSN.2013.6575356"}],"event":{"name":"2014 IEEE International Conference On Cluster Computing (CLUSTER)","location":"Madrid, Spain","start":{"date-parts":[[2014,9,22]]},"end":{"date-parts":[[2014,9,26]]}},"container-title":["2014 IEEE International Conference on Cluster Computing (CLUSTER)"],"original-title":[],"link":[{"URL":"http:\/\/xplorestaging.ieee.org\/ielx7\/6957006\/6968662\/06968768.pdf?arnumber=6968768","content-type":"unspecified","content-version":"vor","intended-application":"similarity-checking"}],"deposited":{"date-parts":[[2020,10,14]],"date-time":"2020-10-14T14:43:13Z","timestamp":1602686593000},"score":1,"resource":{"primary":{"URL":"https:\/\/ieeexplore.ieee.org\/document\/6968768"}},"subtitle":[],"short-title":[],"issued":{"date-parts":[[2014,9]]},"references-count":37,"URL":"https:\/\/doi.org\/10.1109\/cluster.2014.6968768","relation":{},"subject":[],"published":{"date-parts":[[2014,9]]}}}