{"status":"ok","message-type":"work","message-version":"1.0.0","message":{"indexed":{"date-parts":[[2026,4,1]],"date-time":"2026-04-01T18:56:25Z","timestamp":1775069785954,"version":"3.50.1"},"reference-count":51,"publisher":"Institute of Electrical and Electronics Engineers (IEEE)","issue":"10","license":[{"start":{"date-parts":[[2023,10,1]],"date-time":"2023-10-01T00:00:00Z","timestamp":1696118400000},"content-version":"vor","delay-in-days":0,"URL":"https:\/\/ieeexplore.ieee.org\/Xplorehelp\/downloads\/license-information\/IEEE.html"},{"start":{"date-parts":[[2023,10,1]],"date-time":"2023-10-01T00:00:00Z","timestamp":1696118400000},"content-version":"am","delay-in-days":0,"URL":"https:\/\/ieeexplore.ieee.org\/Xplorehelp\/downloads\/license-information\/IEEE.html"},{"start":{"date-parts":[[2023,10,1]],"date-time":"2023-10-01T00:00:00Z","timestamp":1696118400000},"content-version":"stm-asf","delay-in-days":0,"URL":"https:\/\/doi.org\/10.15223\/policy-029"},{"start":{"date-parts":[[2023,10,1]],"date-time":"2023-10-01T00:00:00Z","timestamp":1696118400000},"content-version":"stm-asf","delay-in-days":0,"URL":"https:\/\/doi.org\/10.15223\/policy-037"}],"funder":[{"DOI":"10.13039\/100000001","name":"NSF","doi-asserted-by":"publisher","award":["2139304"],"award-info":[{"award-number":["2139304"]}],"id":[{"id":"10.13039\/100000001","id-type":"DOI","asserted-by":"publisher"}]},{"DOI":"10.13039\/100000001","name":"NSF","doi-asserted-by":"publisher","award":["2007714"],"award-info":[{"award-number":["2007714"]}],"id":[{"id":"10.13039\/100000001","id-type":"DOI","asserted-by":"publisher"}]},{"DOI":"10.13039\/100006754","name":"Army Research Laboratory","doi-asserted-by":"publisher","award":["W911NF-17-2-0196"],"award-info":[{"award-number":["W911NF-17-2-0196"]}],"id":[{"id":"10.13039\/100006754","id-type":"DOI","asserted-by":"publisher"}]}],"content-domain":{"domain":[],"crossmark-restriction":false},"short-container-title":["IEEE Trans. Inform. Theory"],"published-print":{"date-parts":[[2023,10]]},"DOI":"10.1109\/tit.2023.3284427","type":"journal-article","created":{"date-parts":[[2023,6,9]],"date-time":"2023-06-09T17:23:52Z","timestamp":1686331432000},"page":"6639-6670","source":"Crossref","is-referenced-by-count":12,"title":["Byzantine-Resilient High-Dimensional Federated Learning"],"prefix":"10.1109","volume":"69","author":[{"ORCID":"https:\/\/orcid.org\/0000-0003-3544-8414","authenticated-orcid":false,"given":"Deepesh","family":"Data","sequence":"first","affiliation":[{"name":"Department of Electrical and Computer Engineering, University of California at Los Angeles (UCLA), Los Angeles, CA, USA"}]},{"ORCID":"https:\/\/orcid.org\/0000-0001-7313-9861","authenticated-orcid":false,"given":"Suhas N.","family":"Diggavi","sequence":"additional","affiliation":[{"name":"Department of Electrical and Computer Engineering, University of California at Los Angeles (UCLA), Los Angeles, CA, USA"}]}],"member":"263","reference":[{"key":"ref13","article-title":"On the convergence of FedAvg on non-IID data","author":"li","year":"2020","journal-title":"Proc Int Conf Learn Represent (ICLR)"},{"key":"ref12","first-page":"4519","article-title":"Tighter theory for local SGD on identical and heterogeneous data","author":"khaled","year":"2020","journal-title":"Proc Int Conf Artif Intell Statist (AISTATS)"},{"key":"ref15","doi-asserted-by":"publisher","DOI":"10.1609\/aaai.v33i01.33015693"},{"key":"ref14","article-title":"Federated optimization in heterogeneous networks","author":"sahu","year":"2020","journal-title":"Proc Conf Mach Learn Syst (MLSys)"},{"key":"ref11","first-page":"5132","article-title":"SCAFFOLD: Stochastic controlled averaging for federated learning","author":"karimireddy","year":"2020","journal-title":"Proc Int Conf Mach Learn (ICML)"},{"key":"ref10","article-title":"On the convergence of local descent methods in federated learning","author":"haddadpour","year":"2019","journal-title":"arXiv 1910 14425"},{"key":"ref17","doi-asserted-by":"publisher","DOI":"10.1145\/3154503"},{"key":"ref16","first-page":"14668","article-title":"Qsparse-local-SGD: Distributed SGD with quantization, sparsification and local computations","author":"basu","year":"2019","journal-title":"Proc NeurIPS"},{"key":"ref19","first-page":"4618","article-title":"Byzantine stochastic gradient descent","author":"alistarh","year":"2018","journal-title":"Proc Neural Inf Process Syst (NeurIPS)"},{"key":"ref18","first-page":"5636","article-title":"Byzantine-robust distributed learning: Towards optimal statistical rates","author":"yin","year":"2018","journal-title":"Proc ICML"},{"key":"ref51","doi-asserted-by":"publisher","DOI":"10.1109\/ISIT45174.2021.9518248"},{"key":"ref50","first-page":"2478","article-title":"Byzantine-resilient high-dimensional SGD with local iterations on heterogeneous data","volume":"139","author":"data","year":"2021","journal-title":"Proc Int Conf Mach Learn (ICML)"},{"key":"ref46","first-page":"8632","article-title":"A little is enough: Circumventing defenses for distributed learning","author":"baruch","year":"2019","journal-title":"Proc Neural Inf Process Syst (NeurIPS)"},{"key":"ref45","doi-asserted-by":"publisher","DOI":"10.1145\/3055399.3055491"},{"key":"ref48","doi-asserted-by":"publisher","DOI":"10.1137\/090772873"},{"key":"ref47","first-page":"3518","article-title":"The hidden vulnerability of distributed learning in Byzantium","author":"mhamdi","year":"2018","journal-title":"Proc Int Conf Mach Learn (ICML)"},{"key":"ref42","article-title":"Communication efficient decentralized training with multiple local updates","author":"li","year":"2019","journal-title":"arXiv 1910 091265"},{"key":"ref41","first-page":"7184","article-title":"On the linear speedup analysis of communication efficient momentum SGD for distributed non-convex optimization","author":"yu","year":"2019","journal-title":"Proc ICML"},{"key":"ref44","first-page":"6065","article-title":"Quantum entropy scoring for fast robust mean estimation and improved outlier detection","author":"dong","year":"2019","journal-title":"Proc Neural Inf Process Syst (NeurIPS)"},{"key":"ref43","author":"li","year":"2019","journal-title":"Robustness in Machine Learning (CSE 599-M) Lecture 5-Efficient Filtering From Spectral Signatures"},{"key":"ref49","article-title":"Introduction to the non-asymptotic analysis of random matrices","author":"vershynin","year":"2010","journal-title":"arXiv 1011 3027"},{"key":"ref8","first-page":"119","article-title":"Machine learning with adversaries: Byzantine tolerant gradient descent","author":"blanchard","year":"2017","journal-title":"Proc NIPS"},{"key":"ref7","doi-asserted-by":"publisher","DOI":"10.1007\/978-3-7908-2604-3_16"},{"key":"ref9","first-page":"11080","article-title":"Local SGD with periodic averaging: Tighter analysis and adaptive synchronization","author":"haddadpour","year":"2019","journal-title":"Proc Neural Inf Process Syst (NeurIPS)"},{"key":"ref4","first-page":"4615","article-title":"Agnostic federated learning","author":"mohri","year":"2019","journal-title":"Proc Int Conf Mach Learn (ICML)"},{"key":"ref3","first-page":"1273","article-title":"Communication-efficient learning of deep networks from decentralized data","author":"mcmahan","year":"2017","journal-title":"Proc Int Conf Artif Intell Statist (AISTATS)"},{"key":"ref6","article-title":"Advances and open problems in federated learning","author":"kairouz","year":"2019","journal-title":"arXiv 1912 04977"},{"key":"ref5","first-page":"1232","article-title":"Large scale distributed deep networks","author":"dean","year":"2012","journal-title":"Proc Neural Inf Process Syst (NIPS)"},{"key":"ref40","article-title":"Recent advances in algorithmic high-dimensional robust statistics","author":"diakonikolas","year":"2019","journal-title":"arXiv 1911 05911"},{"key":"ref35","article-title":"Byzantine-robust learning on heterogeneous datasets via bucketing","author":"karimireddy","year":"2022","journal-title":"Proc Int Conf Learn Represent (ICLR)"},{"key":"ref34","article-title":"Byzantine-resilient non-convex stochastic gradient descent","author":"allen-zhu","year":"2021","journal-title":"Proc Int Conf Learn Represent (ICLR)"},{"key":"ref37","doi-asserted-by":"publisher","DOI":"10.1109\/FOCS.2016.76"},{"key":"ref36","first-page":"213","article-title":"SLSGD: Secure and efficient distributed on-device machine learning","author":"xie","year":"2019","journal-title":"Proc Eur Conf Mach Learn Knowl Discovery Databases"},{"key":"ref31","first-page":"5311","article-title":"Learning from history for Byzantine robust optimization","volume":"139","author":"karimireddy","year":"2021","journal-title":"Proc Int Conf Mach Learn (ICML)"},{"key":"ref30","article-title":"Robust federated learning in a heterogeneous environment","author":"ghosh","year":"2019","journal-title":"arXiv 1906 06629"},{"key":"ref33","first-page":"6246","article-title":"Byzantine machine learning made easy by resilient averaging of momentums","volume":"162","author":"farhadkhani","year":"2022","journal-title":"Proc Int Conf Mach Learn (ICML)"},{"key":"ref32","article-title":"Distributed momentum for Byzantine-resilient stochastic gradient descent","author":"mhamdi","year":"2021","journal-title":"Proc Int Conf Learn Represent (ICLR)"},{"key":"ref2","article-title":"Federated optimization: Distributed machine learning for on-device intelligence","author":"konecn\u00fd","year":"2016","journal-title":"arXiv 1610 02527"},{"key":"ref1","article-title":"Stochastic, distributed and federated optimization for machine learning","author":"konecn\u00fd","year":"2017","journal-title":"arXiv 1707 01155"},{"key":"ref39","doi-asserted-by":"publisher","DOI":"10.1137\/17M1126680"},{"key":"ref38","first-page":"45:1","article-title":"Resilience: A criterion for learning in the presence of arbitrary outliers","author":"steinhardt","year":"2018","journal-title":"Proc ITC"},{"key":"ref24","first-page":"902","article-title":"DRACO: Byzantine-resilient distributed training via redundant gradients","author":"chen","year":"2018","journal-title":"Proc Int Conf Mach Learn (ICML)"},{"key":"ref23","doi-asserted-by":"publisher","DOI":"10.1109\/ISIT44484.2020.9174363"},{"key":"ref26","doi-asserted-by":"publisher","DOI":"10.1109\/ISIT.2019.8849857"},{"key":"ref25","first-page":"10320","article-title":"DETOX: A redundancy-based framework for faster and more robust gradient aggregation","author":"rajput","year":"2019","journal-title":"Proc NeurIPS"},{"key":"ref20","doi-asserted-by":"publisher","DOI":"10.1145\/3322205.3311083"},{"key":"ref22","first-page":"7074","article-title":"Defending against saddle point attack in Byzantine-robust distributed learning","author":"yin","year":"2019","journal-title":"Proc ICML"},{"key":"ref21","first-page":"6893","article-title":"Zeno: Distributed stochastic gradient descent with suspicion-based fault-tolerance","author":"xie","year":"2019","journal-title":"Proc Int Conf Mach Learn (ICML)"},{"key":"ref28","doi-asserted-by":"publisher","DOI":"10.1109\/TIT.2020.3035868"},{"key":"ref27","doi-asserted-by":"publisher","DOI":"10.1109\/ISIT.2019.8849217"},{"key":"ref29","doi-asserted-by":"publisher","DOI":"10.1609\/aaai.v33i01.33011544"}],"container-title":["IEEE Transactions on Information Theory"],"original-title":[],"link":[{"URL":"https:\/\/ieeexplore.ieee.org\/ielam\/18\/10253618\/10147260-aam.pdf","content-type":"application\/pdf","content-version":"am","intended-application":"syndication"},{"URL":"http:\/\/xplorestaging.ieee.org\/ielx7\/18\/10253618\/10147260.pdf?arnumber=10147260","content-type":"unspecified","content-version":"vor","intended-application":"similarity-checking"}],"deposited":{"date-parts":[[2023,10,2]],"date-time":"2023-10-02T17:50:30Z","timestamp":1696269030000},"score":1,"resource":{"primary":{"URL":"https:\/\/ieeexplore.ieee.org\/document\/10147260\/"}},"subtitle":[],"short-title":[],"issued":{"date-parts":[[2023,10]]},"references-count":51,"journal-issue":{"issue":"10"},"URL":"https:\/\/doi.org\/10.1109\/tit.2023.3284427","relation":{},"ISSN":["0018-9448","1557-9654"],"issn-type":[{"value":"0018-9448","type":"print"},{"value":"1557-9654","type":"electronic"}],"subject":[],"published":{"date-parts":[[2023,10]]}}}