{"status":"ok","message-type":"work","message-version":"1.0.0","message":{"indexed":{"date-parts":[[2026,6,6]],"date-time":"2026-06-06T01:03:37Z","timestamp":1780707817420,"version":"3.54.1"},"publisher-location":"New York, NY, USA","reference-count":60,"publisher":"ACM","license":[{"start":{"date-parts":[[2021,6,1]],"date-time":"2021-06-01T00:00:00Z","timestamp":1622505600000},"content-version":"vor","delay-in-days":0,"URL":"https:\/\/www.acm.org\/publications\/policies\/copyright_policy#Background"}],"funder":[{"name":"NSF","award":["CCF-1816615, CCF-2029049, CNF-1956007"],"award-info":[{"award-number":["CCF-1816615, CCF-2029049, CNF-1956007"]}]}],"content-domain":{"domain":["dl.acm.org"],"crossmark-restriction":true},"short-container-title":[],"published-print":{"date-parts":[[2021,6]]},"DOI":"10.1145\/3458336.3465276","type":"proceedings-article","created":{"date-parts":[[2021,6,4]],"date-time":"2021-06-04T02:03:56Z","timestamp":1622772236000},"page":"213-220","update-policy":"https:\/\/doi.org\/10.1145\/crossmark-policy","source":"Crossref","is-referenced-by-count":5,"title":["Reasoning about modern datacenter infrastructures using partial histories"],"prefix":"10.1145","author":[{"given":"Xudong","family":"Sun","sequence":"first","affiliation":[{"name":"University of Illinois"}],"role":[{"vocabulary":"crossref","role":"author"}]},{"given":"Lalith","family":"Suresh","sequence":"additional","affiliation":[{"name":"VMware"}],"role":[{"vocabulary":"crossref","role":"author"}]},{"given":"Aishwarya","family":"Ganesan","sequence":"additional","affiliation":[{"name":"VMware"}],"role":[{"vocabulary":"crossref","role":"author"}]},{"given":"Ramnatthan","family":"Alagappan","sequence":"additional","affiliation":[{"name":"VMware"}],"role":[{"vocabulary":"crossref","role":"author"}]},{"given":"Michael","family":"Gasch","sequence":"additional","affiliation":[{"name":"VMware"}],"role":[{"vocabulary":"crossref","role":"author"}]},{"given":"Lilia","family":"Tang","sequence":"additional","affiliation":[{"name":"University of Illinois"}],"role":[{"vocabulary":"crossref","role":"author"}]},{"given":"Tianyin","family":"Xu","sequence":"additional","affiliation":[{"name":"University of Illinois"}],"role":[{"vocabulary":"crossref","role":"author"}]}],"member":"320","published-online":{"date-parts":[[2021,6,3]]},"reference":[{"key":"e_1_3_2_1_1_1","volume-title":"https:\/\/github.com\/kubernetes\/community\/blob\/master\/contributors\/design-proposals\/api-machinery\/apiserver-watch.md","year":"2017","unstructured":"apiserver-watch.md. https:\/\/github.com\/kubernetes\/community\/blob\/master\/contributors\/design-proposals\/api-machinery\/apiserver-watch.md , 2017 . apiserver-watch.md. https:\/\/github.com\/kubernetes\/community\/blob\/master\/contributors\/design-proposals\/api-machinery\/apiserver-watch.md, 2017."},{"key":"e_1_3_2_1_2_1","volume-title":"Aug.","author":"Comment","year":"2019","unstructured":"Comment on Kubernetes-59848 : Kubernetes is vulnerable to stale reads, violating critical pod safety guarantees. https:\/\/github.com\/kubernetes\/kubernetes\/issues\/59848#issuecomment-525833106 , Aug. 2019 . Comment on Kubernetes-59848: Kubernetes is vulnerable to stale reads, violating critical pod safety guarantees. https:\/\/github.com\/kubernetes\/kubernetes\/issues\/59848#issuecomment-525833106, Aug. 2019."},{"key":"e_1_3_2_1_3_1","volume-title":"https:\/\/github.com\/frankmcsherry\/differential-dataflow","author":"Differential Dataflow","year":"2019","unstructured":"Differential Dataflow . https:\/\/github.com\/frankmcsherry\/differential-dataflow , 2019 . Differential Dataflow. https:\/\/github.com\/frankmcsherry\/differential-dataflow, 2019."},{"key":"e_1_3_2_1_4_1","volume-title":"https:\/\/jepsen.io\/","author":"Jepsen","year":"2020","unstructured":"Jepsen . https:\/\/jepsen.io\/ , 2020 . Jepsen. https:\/\/jepsen.io\/, 2020."},{"key":"e_1_3_2_1_5_1","volume-title":"Disallow ApiServer HA for Pod Safety. https:\/\/github.com\/microsoft\/pai\/issues\/4120","year":"2020","unstructured":"P0.5 : Disallow ApiServer HA for Pod Safety. https:\/\/github.com\/microsoft\/pai\/issues\/4120 , 2020 . P0.5: Disallow ApiServer HA for Pod Safety. https:\/\/github.com\/microsoft\/pai\/issues\/4120, 2020."},{"key":"e_1_3_2_1_6_1","volume-title":"https:\/\/zookeeper.apache.org\/doc\/r3.3.3\/zookeeperProgrammers.html#ch_zkWatches","author":"ZooKeeper Watches","year":"2020","unstructured":"ZooKeeper Watches . https:\/\/zookeeper.apache.org\/doc\/r3.3.3\/zookeeperProgrammers.html#ch_zkWatches , 2020 . ZooKeeper Watches. https:\/\/zookeeper.apache.org\/doc\/r3.3.3\/zookeeperProgrammers.html#ch_zkWatches, 2020."},{"key":"e_1_3_2_1_7_1","volume-title":"https:\/\/github.com\/kubernetes\/enhancements\/blob\/master\/keps\/sig-api-machinery\/1904-efficient-watch-resumption\/README.md","author":"Efficient","year":"2021","unstructured":"Efficient watch resumption after kube-apiserver reboot. https:\/\/github.com\/kubernetes\/enhancements\/blob\/master\/keps\/sig-api-machinery\/1904-efficient-watch-resumption\/README.md , 2021 . Efficient watch resumption after kube-apiserver reboot. https:\/\/github.com\/kubernetes\/enhancements\/blob\/master\/keps\/sig-api-machinery\/1904-efficient-watch-resumption\/README.md, 2021."},{"key":"e_1_3_2_1_8_1","volume-title":"https:\/\/etcd.io\/","year":"2021","unstructured":"etcd. https:\/\/etcd.io\/ , 2021 . etcd. https:\/\/etcd.io\/, 2021."},{"key":"e_1_3_2_1_9_1","volume-title":"https:\/\/etcd.io\/docs\/v3.4.0\/learning\/api\/","author":"API.","year":"2021","unstructured":"etcd API. https:\/\/etcd.io\/docs\/v3.4.0\/learning\/api\/ , 2021 . etcd API. https:\/\/etcd.io\/docs\/v3.4.0\/learning\/api\/, 2021."},{"key":"e_1_3_2_1_10_1","volume-title":"https:\/\/pkg.go.dev\/k8s.io\/client-go\/tools\/cache","year":"2021","unstructured":"k8s.io\/client-go\/tools\/cache. https:\/\/pkg.go.dev\/k8s.io\/client-go\/tools\/cache , 2021 . k8s.io\/client-go\/tools\/cache. https:\/\/pkg.go.dev\/k8s.io\/client-go\/tools\/cache, 2021."},{"key":"e_1_3_2_1_11_1","volume-title":"https:\/\/kubernetes.io\/docs\/reference\/using-api\/api-concepts","author":"Kubernetes API","year":"2021","unstructured":"Kubernetes API Concepts . https:\/\/kubernetes.io\/docs\/reference\/using-api\/api-concepts , 2021 . Kubernetes API Concepts. https:\/\/kubernetes.io\/docs\/reference\/using-api\/api-concepts, 2021."},{"key":"e_1_3_2_1_12_1","volume-title":"https:\/\/kubernetes.io\/docs\/concepts\/overview\/components\/","author":"Kubernetes Components","year":"2021","unstructured":"Kubernetes Components . https:\/\/kubernetes.io\/docs\/concepts\/overview\/components\/ , 2021 . Kubernetes Components. https:\/\/kubernetes.io\/docs\/concepts\/overview\/components\/, 2021."},{"key":"e_1_3_2_1_13_1","volume-title":"https:\/\/github.com\/instaclustr\/cassandra-operator","author":"Kubernetes Operator","year":"2021","unstructured":"Kubernetes Operator for Cassandra. https:\/\/github.com\/instaclustr\/cassandra-operator , 2021 . Kubernetes Operator for Cassandra. https:\/\/github.com\/instaclustr\/cassandra-operator, 2021."},{"key":"e_1_3_2_1_14_1","doi-asserted-by":"publisher","DOI":"10.5555\/3026877.3026890"},{"key":"e_1_3_2_1_15_1","unstructured":"Brooker M. The Fundamental Mechanism of Scaling. http:\/\/brooker.co.za\/blog\/2021\/01\/22\/cloud-scale.html 2020.  Brooker M. The Fundamental Mechanism of Scaling. http:\/\/brooker.co.za\/blog\/2021\/01\/22\/cloud-scale.html 2020."},{"key":"e_1_3_2_1_16_1","doi-asserted-by":"publisher","DOI":"10.5555\/1267308.1267332"},{"key":"e_1_3_2_1_17_1","volume-title":"Jan.","author":"Cassandra","year":"2021","unstructured":"Cassandra -operator-398. Reconcile() fails to delete the corresponding pvc if missing deletionTimestamp of Cassandra pod. https:\/\/github.com\/instaclustr\/cassandra-operator\/issues\/398 , Jan. 2021 . Cassandra-operator-398. Reconcile() fails to delete the corresponding pvc if missing deletionTimestamp of Cassandra pod. https:\/\/github.com\/instaclustr\/cassandra-operator\/issues\/398, Jan. 2021."},{"key":"e_1_3_2_1_18_1","volume-title":"Jan.","author":"Cassandra 0.","year":"2021","unstructured":"Cassandra -operator-40 0. Cassandra node can be decommissioned wrongly which blocks scale down. https:\/\/github.com\/instaclustr\/cassandra-operator\/issues\/400 , Jan. 2021 . Cassandra-operator-400. Cassandra node can be decommissioned wrongly which blocks scale down. https:\/\/github.com\/instaclustr\/cassandra-operator\/issues\/400, Jan. 2021."},{"key":"e_1_3_2_1_19_1","volume-title":"Jan.","author":"Cassandra","year":"2021","unstructured":"Cassandra -operator-402. PVC can be accidentally deleted when controller reads stale data from apiserver. https:\/\/github.com\/instaclustr\/cassandra-operator\/issues\/402 , Jan. 2021 . Cassandra-operator-402. PVC can be accidentally deleted when controller reads stale data from apiserver. https:\/\/github.com\/instaclustr\/cassandra-operator\/issues\/402, Jan. 2021."},{"key":"e_1_3_2_1_20_1","doi-asserted-by":"publisher","DOI":"10.1145\/3324884.3416548"},{"key":"e_1_3_2_1_21_1","doi-asserted-by":"publisher","DOI":"10.5555\/3129633.3129648"},{"key":"e_1_3_2_1_22_1","doi-asserted-by":"publisher","DOI":"10.1145\/1993806.1993834"},{"key":"e_1_3_2_1_23_1","doi-asserted-by":"publisher","DOI":"10.1145\/74851.74870"},{"key":"e_1_3_2_1_24_1","doi-asserted-by":"publisher","DOI":"10.1145\/2043556.2043582"},{"key":"e_1_3_2_1_25_1","volume-title":"Oct.","year":"2010","unstructured":"HBASE-3136. Stale reads from ZK can break the atomic CAS operations we have in ZKAssign. https:\/\/issues.apache.org\/jira\/browse\/HBASE-3136 , Oct. 2010 . HBASE-3136. Stale reads from ZK can break the atomic CAS operations we have in ZKAssign. https:\/\/issues.apache.org\/jira\/browse\/HBASE-3136, Oct. 2010."},{"key":"e_1_3_2_1_26_1","volume-title":"Oct.","year":"2010","unstructured":"HBASE-3137. Optimize CAS operations in ZKAssign by being optimistic rather than always doing a sync(). https:\/\/issues.apache.org\/jira\/browse\/HBASE-3137 , Oct. 2010 . HBASE-3137. Optimize CAS operations in ZKAssign by being optimistic rather than always doing a sync(). https:\/\/issues.apache.org\/jira\/browse\/HBASE-3137, Oct. 2010."},{"key":"e_1_3_2_1_27_1","volume-title":"Apr.","year":"2012","unstructured":"HBASE-575. Region sever looking for master forever with cached stale data. https:\/\/issues.apache.org\/jira\/browse\/HBASE-5755 , Apr. 2012 . HBASE-575. Region sever looking for master forever with cached stale data. https:\/\/issues.apache.org\/jira\/browse\/HBASE-5755, Apr. 2012."},{"key":"e_1_3_2_1_28_1","volume-title":"Apr.","year":"2017","unstructured":"HDFS-11708. Positional read will fail if replicas moved to different DNs after stream is opened. https:\/\/issues.apache.org\/jira\/browse\/HDFS-11708 , Apr. 2017 . HDFS-11708. Positional read will fail if replicas moved to different DNs after stream is opened. https:\/\/issues.apache.org\/jira\/browse\/HDFS-11708, Apr. 2017."},{"key":"e_1_3_2_1_29_1","volume-title":"Oct.","year":"2013","unstructured":"HDFS-5322. HDFS delegation token not found in cache errors seen on secure HA clusters. https:\/\/issues.apache.org\/jira\/browse\/HDFS-5322 , Oct. 2013 . HDFS-5322. HDFS delegation token not found in cache errors seen on secure HA clusters. https:\/\/issues.apache.org\/jira\/browse\/HDFS-5322, Oct. 2013."},{"key":"e_1_3_2_1_30_1","first-page":"9","volume":"63","author":"Hellerstein J. M.","year":"2020","unstructured":"Hellerstein , J. M. , and Alvaro , P. Keeping CALM: When Distributed Consistency is Easy. Communications of the ACM 63 , 9 ( Sept. 2020 ), 72--81. Hellerstein, J. M., and Alvaro, P. Keeping CALM: When Distributed Consistency is Easy. Communications of the ACM 63, 9 (Sept. 2020), 72--81.","journal-title":"Easy. Communications of the ACM"},{"key":"e_1_3_2_1_31_1","doi-asserted-by":"publisher","DOI":"10.1145\/78969.78972"},{"key":"e_1_3_2_1_32_1","doi-asserted-by":"publisher","DOI":"10.5555\/1972457.1972488"},{"key":"e_1_3_2_1_33_1","doi-asserted-by":"publisher","DOI":"10.5555\/1855840.1855851"},{"key":"e_1_3_2_1_34_1","doi-asserted-by":"publisher","DOI":"10.1145\/1243418.1243426"},{"key":"e_1_3_2_1_35_1","doi-asserted-by":"publisher","DOI":"10.1145\/1273442.1250755"},{"key":"e_1_3_2_1_36_1","volume-title":"Proceedings of the 46th International Conference on Very Large Data Bases (VLDB'20)","author":"Kingsbury K.","year":"2020","unstructured":"Kingsbury , K. , and Alvaro , P . Elle: Inferring Isolation Anomalies from Experimental Observations . In Proceedings of the 46th International Conference on Very Large Data Bases (VLDB'20) ( Aug. 2020 ). Kingsbury, K., and Alvaro, P. Elle: Inferring Isolation Anomalies from Experimental Observations. In Proceedings of the 46th International Conference on Very Large Data Bases (VLDB'20) (Aug. 2020)."},{"key":"e_1_3_2_1_37_1","volume-title":"Aug.","author":"Kubernetes","year":"2016","unstructured":"Kubernetes -30698. Make it possible to write a sound client from a distributed-systems perspective. https:\/\/github.com\/kubernetes\/kubernetes\/issues\/30698 , Aug. 2016 . Kubernetes-30698. Make it possible to write a sound client from a distributed-systems perspective. https:\/\/github.com\/kubernetes\/kubernetes\/issues\/30698, Aug. 2016."},{"key":"e_1_3_2_1_38_1","volume-title":"Nov.","author":"Kubernetes","year":"2017","unstructured":"Kubernetes -56261. Scheduler should delete a node from its cache if it gets \"node not found\" error. https:\/\/github.com\/kubernetes\/kubernetes\/issues\/56261 , Nov. 2017 . Kubernetes-56261. Scheduler should delete a node from its cache if it gets \"node not found\" error. https:\/\/github.com\/kubernetes\/kubernetes\/issues\/56261, Nov. 2017."},{"key":"e_1_3_2_1_39_1","volume-title":"Feb.","author":"Kubernetes","year":"2018","unstructured":"Kubernetes -59848. Kubernetes is vulnerable to stale reads, violating critical pod safety guarantees. https:\/\/github.com\/kubernetes\/kubernetes\/issues\/59848 , Feb. 2018 . Kubernetes-59848. Kubernetes is vulnerable to stale reads, violating critical pod safety guarantees. https:\/\/github.com\/kubernetes\/kubernetes\/issues\/59848, Feb. 2018."},{"key":"e_1_3_2_1_40_1","volume-title":"Jan.","author":"Kubernetes","year":"2021","unstructured":"Kubernetes -website-26064. Clarify \"resource-Version unset\" semantics in Watch. https:\/\/github.com\/kubernetes\/website\/issues\/26064 , Jan. 2021 . Kubernetes-website-26064. Clarify \"resource-Version unset\" semantics in Watch. https:\/\/github.com\/kubernetes\/website\/issues\/26064, Jan. 2021."},{"key":"e_1_3_2_1_41_1","doi-asserted-by":"publisher","DOI":"10.5555\/2685048.2685080"},{"key":"e_1_3_2_1_42_1","doi-asserted-by":"publisher","DOI":"10.1145\/3341301.3359638"},{"key":"e_1_3_2_1_43_1","doi-asserted-by":"publisher","DOI":"10.1145\/3093337.3037735"},{"key":"e_1_3_2_1_44_1","doi-asserted-by":"publisher","DOI":"10.1145\/3296957.3177161"},{"key":"e_1_3_2_1_45_1","doi-asserted-by":"publisher","DOI":"10.1145\/3341301.3359645"},{"key":"e_1_3_2_1_46_1","doi-asserted-by":"publisher","DOI":"10.1145\/3158134"},{"key":"e_1_3_2_1_47_1","doi-asserted-by":"publisher","DOI":"10.5555\/2643634.2643666"},{"key":"e_1_3_2_1_48_1","doi-asserted-by":"publisher","DOI":"10.1145\/3276530"},{"key":"e_1_3_2_1_49_1","doi-asserted-by":"publisher","DOI":"10.5555\/2685048.2685082"},{"key":"e_1_3_2_1_50_1","doi-asserted-by":"publisher","DOI":"10.1145\/2465351.2465386"},{"key":"e_1_3_2_1_51_1","volume-title":"Proceedings of the 14th USENIX Symposium on Operating Systems Design and Implementation (OSDI'20)","author":"Sun X.","year":"2020","unstructured":"Sun , X. , Cheng , R. , Chen , J. , Ang , E. , Legunsen , O. , and Xu , T . Testing Configuration Changes in Context to Prevent Production Failures . In Proceedings of the 14th USENIX Symposium on Operating Systems Design and Implementation (OSDI'20) ( Nov. 2020 ). Sun, X., Cheng, R., Chen, J., Ang, E., Legunsen, O., and Xu, T. Testing Configuration Changes in Context to Prevent Production Failures. In Proceedings of the 14th USENIX Symposium on Operating Systems Design and Implementation (OSDI'20) (Nov. 2020)."},{"key":"e_1_3_2_1_52_1","volume-title":"Proceedings of the 14th USENIX Symposium on Operating Systems Design and Implementation (OSDI'20)","author":"Tan C.","year":"2020","unstructured":"Tan , C. , Zhao , C. , Mu , S. , and Walfish , M . Cobra: Making Transactional Key-Value Stores Verifiably Serializable . In Proceedings of the 14th USENIX Symposium on Operating Systems Design and Implementation (OSDI'20) ( Nov. 2020 ). Tan, C., Zhao, C., Mu, S., and Walfish, M. Cobra: Making Transactional Key-Value Stores Verifiably Serializable. In Proceedings of the 14th USENIX Symposium on Operating Systems Design and Implementation (OSDI'20) (Nov. 2020)."},{"key":"e_1_3_2_1_53_1","doi-asserted-by":"publisher","DOI":"10.1145\/2815400.2815401"},{"key":"e_1_3_2_1_54_1","volume-title":"Proceedings of the 14th USENIX Conference on Operating Systems Design and Implementation (OSDI'20)","author":"Tang C.","year":"2020","unstructured":"Tang , C. , Yu , K. , Veeraraghavan , K. , Kaldor , J. , Michelson , S. , Kooburat , T. , Anbudurai , A. , Clark , M. , Gogia , K. , Cheng , L. , Christensen , B. , Gartrell , A. , Khutornenko , M. , Kulkarni , S. , Pawlowski , M. , Pelkonen , T. , Rodrigues , A. , Tibrewal , R. , Venkatesan , V. , and Zhang , P . Twine: A Unified Cluster Management System for Shared Infrastructure . In Proceedings of the 14th USENIX Conference on Operating Systems Design and Implementation (OSDI'20) ( Nov. 2020 ). Tang, C., Yu, K., Veeraraghavan, K., Kaldor, J., Michelson, S., Kooburat, T., Anbudurai, A., Clark, M., Gogia, K., Cheng, L., Christensen, B., Gartrell, A., Khutornenko, M., Kulkarni, S., Pawlowski, M., Pelkonen, T., Rodrigues, A., Tibrewal, R., Venkatesan, V., and Zhang, P. Twine: A Unified Cluster Management System for Shared Infrastructure. In Proceedings of the 14th USENIX Conference on Operating Systems Design and Implementation (OSDI'20) (Nov. 2020)."},{"key":"e_1_3_2_1_55_1","doi-asserted-by":"publisher","DOI":"10.1145\/2492007.2492022"},{"key":"e_1_3_2_1_56_1","doi-asserted-by":"publisher","DOI":"10.1145\/2741948.2741964"},{"key":"e_1_3_2_1_57_1","doi-asserted-by":"publisher","DOI":"10.5555\/1558977.1558993"},{"key":"e_1_3_2_1_58_1","doi-asserted-by":"publisher","DOI":"10.5555\/1558977.1558992"},{"key":"e_1_3_2_1_59_1","doi-asserted-by":"publisher","DOI":"10.5555\/1267308.1267318"},{"key":"e_1_3_2_1_60_1","doi-asserted-by":"publisher","DOI":"10.1145\/3373376.3378484"}],"event":{"name":"HotOS '21: Workshop on Hot Topics in Operating Systems","location":"Ann Arbor Michigan","acronym":"HotOS '21","sponsor":["SIGOPS ACM Special Interest Group on Operating Systems"]},"container-title":["Proceedings of the Workshop on Hot Topics in Operating Systems"],"original-title":[],"link":[{"URL":"https:\/\/dl.acm.org\/doi\/10.1145\/3458336.3465276","content-type":"unspecified","content-version":"vor","intended-application":"text-mining"},{"URL":"https:\/\/dl.acm.org\/doi\/pdf\/10.1145\/3458336.3465276","content-type":"application\/pdf","content-version":"vor","intended-application":"syndication"},{"URL":"https:\/\/dl.acm.org\/doi\/pdf\/10.1145\/3458336.3465276","content-type":"unspecified","content-version":"vor","intended-application":"similarity-checking"}],"deposited":{"date-parts":[[2025,6,17]],"date-time":"2025-06-17T21:28:19Z","timestamp":1750195699000},"score":1,"resource":{"primary":{"URL":"https:\/\/dl.acm.org\/doi\/10.1145\/3458336.3465276"}},"subtitle":[],"short-title":[],"issued":{"date-parts":[[2021,6]]},"references-count":60,"alternative-id":["10.1145\/3458336.3465276","10.1145\/3458336"],"URL":"https:\/\/doi.org\/10.1145\/3458336.3465276","relation":{},"subject":[],"published":{"date-parts":[[2021,6]]},"assertion":[{"value":"2021-06-03","order":2,"name":"published","label":"Published","group":{"name":"publication_history","label":"Publication History"}}]}}