{"status":"ok","message-type":"work","message-version":"1.0.0","message":{"indexed":{"date-parts":[[2025,11,18]],"date-time":"2025-11-18T01:32:37Z","timestamp":1763429557078},"reference-count":17,"publisher":"Institute of Electrical and Electronics Engineers (IEEE)","issue":"5","license":[{"start":{"date-parts":[[2018,9,1]],"date-time":"2018-09-01T00:00:00Z","timestamp":1535760000000},"content-version":"vor","delay-in-days":0,"URL":"https:\/\/ieeexplore.ieee.org\/Xplorehelp\/downloads\/license-information\/IEEE.html"}],"content-domain":{"domain":[],"crossmark-restriction":false},"short-container-title":["IEEE Cloud Comput."],"published-print":{"date-parts":[[2018,9]]},"DOI":"10.1109\/mcc.2018.053711662","type":"journal-article","created":{"date-parts":[[2018,10,18]],"date-time":"2018-10-18T19:07:11Z","timestamp":1539889631000},"page":"12-21","source":"Crossref","is-referenced-by-count":42,"title":["Emergent Failures: Rethinking Cloud Reliability at Scale"],"prefix":"10.1109","volume":"5","author":[{"given":"Peter","family":"Garraghan","sequence":"first","affiliation":[]},{"given":"Renyu","family":"Yang","sequence":"additional","affiliation":[]},{"given":"Zhenyu","family":"Wen","sequence":"additional","affiliation":[]},{"given":"Alexander","family":"Romanovsky","sequence":"additional","affiliation":[]},{"given":"Jie","family":"Xu","sequence":"additional","affiliation":[]},{"given":"Rajkumar","family":"Buyya","sequence":"additional","affiliation":[]},{"given":"Rajiv","family":"Ranjan","sequence":"additional","affiliation":[]}],"member":"263","reference":[{"key":"ref10","doi-asserted-by":"publisher","DOI":"10.1145\/2523616.2523633"},{"key":"ref11","doi-asserted-by":"publisher","DOI":"10.14778\/2733004.2733012"},{"key":"ref12","first-page":"285","article-title":"Apollo: Scalable and Coordinated Scheduling for Cloud-Scale Computing","author":"boutin","year":"0","journal-title":"Proc of USENIX Conference on Operating Systems Design and Implementation (OSDI)"},{"key":"ref13","doi-asserted-by":"publisher","DOI":"10.1109\/ICDCS.2018.00096"},{"key":"ref14","author":"sossa","year":"2018","journal-title":"Container-Based Cluster Orchestration Systems A Taxonomy and Future Directions"},{"key":"ref15","doi-asserted-by":"publisher","DOI":"10.1145\/2838344.2839461"},{"key":"ref16","first-page":"5434","article-title":"Straggler Mitigation in Distributed Optimization Through Data Encoding","author":"karakus","year":"2017","journal-title":"Advances in neural information processing systems"},{"key":"ref17","doi-asserted-by":"publisher","DOI":"10.1109\/TSC.2016.2544313"},{"key":"ref4","doi-asserted-by":"publisher","DOI":"10.1145\/2408776.2408794"},{"key":"ref3","article-title":"Straggler Root Cause and Impact Analysis for Massive scale Virtualized Cloud Datacenters","author":"garraghan","year":"2016","journal-title":"IEEE Transactions on Services Computing"},{"key":"ref6","article-title":"Amazon S3 Outage Highlights Resilience Issues with Cloud Infrastructure","author":"thompson","year":"2017","journal-title":"Argonne National Laboratory"},{"key":"ref5","doi-asserted-by":"publisher","DOI":"10.1109\/TDSC.2004.2"},{"key":"ref8","doi-asserted-by":"crossref","first-page":"10","DOI":"10.1145\/2898442.2898444","article-title":"Borg, Omega, and Kubernetes","volume":"14","author":"burns","year":"2016","journal-title":"ACM Queue"},{"key":"ref7","first-page":"18","article-title":"Large-scale cluster management at Google with Borg","author":"verma","year":"0","journal-title":"Proceedings of the Tenth European Conference on Computer Systems (EuroSys'15)"},{"key":"ref2","doi-asserted-by":"publisher","DOI":"10.1109\/TETC.2014.2304500"},{"key":"ref1","doi-asserted-by":"publisher","DOI":"10.1109\/DSN.2006.5"},{"key":"ref9","first-page":"295","article-title":"Mesos: A Platform for Fine-Grained Resource Sharing in the Data Center","author":"hindman","year":"0","journal-title":"Proceedings of the 8th USENIX Conference on Networked Systems Design and Implementation (NSDI '11)"}],"container-title":["IEEE Cloud Computing"],"original-title":[],"link":[{"URL":"http:\/\/xplorestaging.ieee.org\/ielx7\/6509491\/8497001\/08497007.pdf?arnumber=8497007","content-type":"unspecified","content-version":"vor","intended-application":"similarity-checking"}],"deposited":{"date-parts":[[2022,1,26]],"date-time":"2022-01-26T22:01:06Z","timestamp":1643234466000},"score":1,"resource":{"primary":{"URL":"https:\/\/ieeexplore.ieee.org\/document\/8497007\/"}},"subtitle":[],"short-title":[],"issued":{"date-parts":[[2018,9]]},"references-count":17,"journal-issue":{"issue":"5"},"URL":"https:\/\/doi.org\/10.1109\/mcc.2018.053711662","relation":{},"ISSN":["2325-6095","2372-2568"],"issn-type":[{"value":"2325-6095","type":"electronic"},{"value":"2372-2568","type":"electronic"}],"subject":[],"published":{"date-parts":[[2018,9]]}}}