{"status":"ok","message-type":"work","message-version":"1.0.0","message":{"indexed":{"date-parts":[[2025,11,18]],"date-time":"2025-11-18T01:34:26Z","timestamp":1763429666589,"version":"3.28.0"},"reference-count":40,"publisher":"IEEE","license":[{"start":{"date-parts":[[2020,7,1]],"date-time":"2020-07-01T00:00:00Z","timestamp":1593561600000},"content-version":"vor","delay-in-days":0,"URL":"https:\/\/ieeexplore.ieee.org\/Xplorehelp\/downloads\/license-information\/IEEE.html"},{"start":{"date-parts":[[2020,7,1]],"date-time":"2020-07-01T00:00:00Z","timestamp":1593561600000},"content-version":"stm-asf","delay-in-days":0,"URL":"https:\/\/doi.org\/10.15223\/policy-029"},{"start":{"date-parts":[[2020,7,1]],"date-time":"2020-07-01T00:00:00Z","timestamp":1593561600000},"content-version":"stm-asf","delay-in-days":0,"URL":"https:\/\/doi.org\/10.15223\/policy-037"}],"content-domain":{"domain":[],"crossmark-restriction":false},"short-container-title":[],"published-print":{"date-parts":[[2020,7]]},"DOI":"10.1109\/infocom41043.2020.9155448","type":"proceedings-article","created":{"date-parts":[[2020,8,4]],"date-time":"2020-08-04T18:29:35Z","timestamp":1596565775000},"page":"139-148","source":"Crossref","is-referenced-by-count":15,"title":["Machine Learning on Volatile Instances"],"prefix":"10.1109","author":[{"given":"Xiaoxi","family":"Zhang","sequence":"first","affiliation":[],"role":[{"role":"author","vocabulary":"crossref"}]},{"given":"Jianyu","family":"Wang","sequence":"additional","affiliation":[],"role":[{"role":"author","vocabulary":"crossref"}]},{"given":"Gauri","family":"Joshi","sequence":"additional","affiliation":[],"role":[{"role":"author","vocabulary":"crossref"}]},{"given":"Carlee","family":"Joe-Wong","sequence":"additional","affiliation":[],"role":[{"role":"author","vocabulary":"crossref"}]}],"member":"263","reference":[{"key":"ref39","article-title":"Linear convergence of gradient and proximal-gradient methods under the polyak-ojasiewicz condition","author":"karimi","year":"2016","journal-title":"Proc of ECML PKDD"},{"key":"ref38","article-title":"Tensorflow: A system for large-scale machine learning","author":"abadi","year":"2016","journal-title":"Proceedings of USENIX OSDI"},{"key":"ref33","article-title":"Revisiting distributed synchronous sgd","author":"chen","year":"2016","journal-title":"ICLR Workshop Track"},{"key":"ref32","doi-asserted-by":"publisher","DOI":"10.14778\/2732967.2732973"},{"article-title":"Adaptive communication strategies to achieve the best error-runtime trade-off in local-update SGD","year":"0","author":"wang","key":"ref31"},{"year":"0","key":"ref30","article-title":"How spot instances work"},{"key":"ref37","article-title":"Ray: A distributed framework for emerging ai applications","author":"moritz","year":"2018","journal-title":"Proceedings of USENIX OSDI"},{"key":"ref36","article-title":"Imagenet classification with deep convolutional neural networks","author":"alex krizhevsky","year":"2012","journal-title":"Proceedings of NIPS"},{"article-title":"Deep residual learning for image recognition","year":"2015","author":"he","key":"ref35"},{"key":"ref34","article-title":"On the computation and communication complexity of parallel sgd with dynamic batch sizes for stochastic non-convex optimization","author":"yu","year":"2019","journal-title":"Proc of ICML"},{"key":"ref10","article-title":"Federated learning: Strategies for improving communication efficiency","author":"kone?ny","year":"2016","journal-title":"arXiv preprint arXiv 1610 05492"},{"key":"ref40","doi-asserted-by":"publisher","DOI":"10.1080\/01621459.1972.10482404"},{"key":"ref11","article-title":"esgd: Communication efficient distributed deep learning on the edge","author":"tao","year":"2018","journal-title":"Proceedings of USENIX Workshop on Hot Topics in Edge Computing (HotEdge 18)"},{"key":"ref12","doi-asserted-by":"publisher","DOI":"10.1145\/2785956.2787473"},{"article-title":"The cifar-10 dataset","year":"0","author":"krizhevsky","key":"ref13"},{"key":"ref14","article-title":"How not to bid the cloud","author":"sharma","year":"2016","journal-title":"USENIX Conference on Hot Topics in Cloud Computing (HotCloud)"},{"key":"ref15","first-page":"165","article-title":"Optimal distributed online prediction using mini-batches","volume":"13","author":"ofer dekel","year":"2012","journal-title":"Journal of Machine Learning Research"},{"key":"ref16","first-page":"1000","article-title":"Communication-efficient distributed optimization using an approximate newton-type method","author":"shamir","year":"2014","journal-title":"International Conference on Machine Learning"},{"key":"ref17","article-title":"Efficient decentralized deep learning by dynamic model averaging","author":"kamp","year":"2018","journal-title":"arXiv preprint arXiv 1807 03210"},{"article-title":"Communication-efficient learning of deep networks from decentralized data","year":"0","author":"mcmahan","key":"ref18"},{"key":"ref19","article-title":"Slow and stale gradients can win the race: Error-runtime trade-offs in distributed sgd","author":"dutta","year":"2018","journal-title":"Proceedings of AISTATS"},{"journal-title":"Probability Density Functions","year":"0","key":"ref28"},{"year":"2019","key":"ref4","article-title":"Amazon ec2 spot instances"},{"key":"ref27","doi-asserted-by":"publisher","DOI":"10.1145\/2408776.2408794"},{"key":"ref3","first-page":"1223","article-title":"Large scale distributed deep networks","volume":"1","author":"d","year":"2012","journal-title":"International Conference on Neural Information Processing Systems (NIPS)"},{"year":"2018","key":"ref6","article-title":"Announcing low-priority vms on scale sets now in public preview"},{"journal-title":"Cumulative distribution function","year":"0","key":"ref29"},{"year":"2019","key":"ref5","article-title":"Preemptible virtual machines"},{"key":"ref8","doi-asserted-by":"publisher","DOI":"10.1109\/IPDPS.2016.96"},{"year":"2019","key":"ref7","article-title":"Spot price overrides"},{"key":"ref2","doi-asserted-by":"publisher","DOI":"10.1007\/978-3-7908-2604-3_16"},{"key":"ref9","article-title":"Characterizing curtailed and uneconomic renewable power in the mid-continent independent system operator","author":"chien","year":"2016","journal-title":"arXiv preprint arXiv 1702 05464"},{"key":"ref1","doi-asserted-by":"publisher","DOI":"10.1214\/aoms\/1177729586"},{"key":"ref20","doi-asserted-by":"publisher","DOI":"10.1137\/16M1080173"},{"key":"ref22","doi-asserted-by":"publisher","DOI":"10.1109\/CLOUD.2012.59"},{"key":"ref21","doi-asserted-by":"publisher","DOI":"10.1145\/3310336"},{"key":"ref24","doi-asserted-by":"publisher","DOI":"10.1109\/CLOUD.2017.21"},{"key":"ref23","doi-asserted-by":"publisher","DOI":"10.1145\/3064176.3064182"},{"journal-title":"Convex optimization","year":"2014","author":"boyd","key":"ref26"},{"key":"ref25","doi-asserted-by":"publisher","DOI":"10.1145\/2987550.2987576"}],"event":{"name":"IEEE INFOCOM 2020 - IEEE Conference on Computer Communications","start":{"date-parts":[[2020,7,6]]},"location":"Toronto, ON, Canada","end":{"date-parts":[[2020,7,9]]}},"container-title":["IEEE INFOCOM 2020 - IEEE Conference on Computer Communications"],"original-title":[],"link":[{"URL":"http:\/\/xplorestaging.ieee.org\/ielx7\/9146503\/9155217\/09155448.pdf?arnumber=9155448","content-type":"unspecified","content-version":"vor","intended-application":"similarity-checking"}],"deposited":{"date-parts":[[2022,6,28]],"date-time":"2022-06-28T17:55:40Z","timestamp":1656438940000},"score":1,"resource":{"primary":{"URL":"https:\/\/ieeexplore.ieee.org\/document\/9155448\/"}},"subtitle":[],"short-title":[],"issued":{"date-parts":[[2020,7]]},"references-count":40,"URL":"https:\/\/doi.org\/10.1109\/infocom41043.2020.9155448","relation":{},"subject":[],"published":{"date-parts":[[2020,7]]}}}