{"status":"ok","message-type":"work","message-version":"1.0.0","message":{"indexed":{"date-parts":[[2026,1,17]],"date-time":"2026-01-17T22:23:37Z","timestamp":1768688617008,"version":"3.49.0"},"reference-count":106,"publisher":"IEEE","license":[{"start":{"date-parts":[[2024,6,29]],"date-time":"2024-06-29T00:00:00Z","timestamp":1719619200000},"content-version":"stm-asf","delay-in-days":0,"URL":"https:\/\/doi.org\/10.15223\/policy-029"},{"start":{"date-parts":[[2024,6,29]],"date-time":"2024-06-29T00:00:00Z","timestamp":1719619200000},"content-version":"stm-asf","delay-in-days":0,"URL":"https:\/\/doi.org\/10.15223\/policy-037"}],"funder":[{"DOI":"10.13039\/100006190","name":"Research and Development","doi-asserted-by":"publisher","id":[{"id":"10.13039\/100006190","id-type":"DOI","asserted-by":"publisher"}]},{"DOI":"10.13039\/501100001809","name":"National Natural Science Foundation of China","doi-asserted-by":"publisher","id":[{"id":"10.13039\/501100001809","id-type":"DOI","asserted-by":"publisher"}]},{"DOI":"10.13039\/501100012226","name":"Fundamental Research Funds for the Central Universities","doi-asserted-by":"publisher","id":[{"id":"10.13039\/501100012226","id-type":"DOI","asserted-by":"publisher"}]},{"DOI":"10.13039\/501100001809","name":"National Natural Science Foundation of China","doi-asserted-by":"publisher","id":[{"id":"10.13039\/501100001809","id-type":"DOI","asserted-by":"publisher"}]},{"DOI":"10.13039\/501100001809","name":"National Natural Science Foundation of China","doi-asserted-by":"publisher","id":[{"id":"10.13039\/501100001809","id-type":"DOI","asserted-by":"publisher"}]},{"DOI":"10.13039\/501100002367","name":"Chinese Academy of Sciences","doi-asserted-by":"publisher","id":[{"id":"10.13039\/501100002367","id-type":"DOI","asserted-by":"publisher"}]},{"DOI":"10.13039\/100004358","name":"Samsung","doi-asserted-by":"publisher","id":[{"id":"10.13039\/100004358","id-type":"DOI","asserted-by":"publisher"}]}],"content-domain":{"domain":[],"crossmark-restriction":false},"short-container-title":[],"published-print":{"date-parts":[[2024,6,29]]},"DOI":"10.1109\/isca59077.2024.00071","type":"proceedings-article","created":{"date-parts":[[2024,8,1]],"date-time":"2024-08-01T17:38:44Z","timestamp":1722533924000},"page":"915-930","source":"Crossref","is-referenced-by-count":6,"title":["Flagger: Cooperative Acceleration for Large-Scale Cross-Silo Federated Learning Aggregation"],"prefix":"10.1109","author":[{"given":"Xiurui","family":"Pan","sequence":"first","affiliation":[{"name":"Peking University,Computer Hardware and System Evolution Laboratory"}]},{"given":"Yuda","family":"An","sequence":"additional","affiliation":[{"name":"Peking University,Computer Hardware and System Evolution Laboratory"}]},{"given":"Shengwen","family":"Liang","sequence":"additional","affiliation":[{"name":"Institute of Computing Technology,Chinese Academy of Sciences"}]},{"given":"Bo","family":"Mao","sequence":"additional","affiliation":[{"name":"Xiamen University"}]},{"given":"Mingzhe","family":"Zhang","sequence":"additional","affiliation":[{"name":"Institute of Information Engineering,Chinese Academy of Sciences"}]},{"given":"Qiao","family":"Li","sequence":"additional","affiliation":[{"name":"Xiamen University"}]},{"given":"Myoungsoo","family":"Jung","sequence":"additional","affiliation":[{"name":"KAIST and Panmnesia"}]},{"given":"Jie","family":"Zhang","sequence":"additional","affiliation":[{"name":"Peking University,Computer Hardware and System Evolution Laboratory"}]}],"member":"263","reference":[{"key":"ref1","article-title":"Shakespere dataset"},{"key":"ref2","article-title":"Regulation (eu) 2016\/679 of the european parliament and of the council of 27 april 2016 on the protection of natural persons with regard to the processing of personal data and on the free movement of such data, and repealing directive 95\/46\/ec (general data protection regulation)","year":"2016"},{"key":"ref3","article-title":"Cybersecurity law of the people\u2019s republic of china","year":"2017"},{"key":"ref4","article-title":"California consumer privacy act (ccpa)","year":"2018"},{"key":"ref5","article-title":"Greedy-ftl","year":"2019"},{"key":"ref6","article-title":"Nvm express nvm command set specification 1.0c","year":"2022"},{"key":"ref7","article-title":"FATE (federated ai technology enabler)","year":"2023"},{"key":"ref8","article-title":"The openssd project","year":"2023"},{"key":"ref9","doi-asserted-by":"publisher","DOI":"10.2139\/ssrn.2779266"},{"key":"ref10","doi-asserted-by":"publisher","DOI":"10.1109\/DSD.2016.70"},{"key":"ref11","doi-asserted-by":"publisher","DOI":"10.1109\/TIFS.2017.2787987"},{"key":"ref12","first-page":"387","article-title":"{FlashNeuron}:{SSD-Enabled}{Large-Batch} training of very deep neural networks","volume-title":"19th USENIX Conference on File and Storage Technologies (FAST 21)","author":"Bae"},{"key":"ref13","doi-asserted-by":"publisher","DOI":"10.1109\/MM.2014.55"},{"key":"ref14","doi-asserted-by":"publisher","DOI":"10.1145\/3474366.3486926"},{"key":"ref15","doi-asserted-by":"publisher","DOI":"10.1109\/SBAC-PAD55451.2022.00036"},{"key":"ref16","article-title":"Hyperion: A case for unified, self-hosting, zero-cpu data-processing units (dpus)","author":"Brunella","year":"2022","journal-title":"arXiv preprint arXiv:2205.08882"},{"key":"ref17","doi-asserted-by":"publisher","DOI":"10.1109\/HCS52781.2021.9567066"},{"key":"ref18","doi-asserted-by":"publisher","DOI":"10.1109\/ICT-DM52643.2021.9664035"},{"key":"ref19","doi-asserted-by":"publisher","DOI":"10.1145\/2492101.1555371"},{"key":"ref20","doi-asserted-by":"publisher","DOI":"10.1109\/TWC.2022.3168538"},{"key":"ref21","article-title":"Haflo: Gpu-based acceleration for federated logistic regression","author":"Cheng","year":"2021","journal-title":"arXiv preprint arXiv:2107.13797"},{"key":"ref22","doi-asserted-by":"publisher","DOI":"10.1145\/3543622.3578888"},{"key":"ref23","doi-asserted-by":"publisher","DOI":"10.1016\/j.compag.2021.106648"},{"key":"ref24","doi-asserted-by":"publisher","DOI":"10.1109\/ACCESS.2022.3151670"},{"key":"ref25","doi-asserted-by":"publisher","DOI":"10.1109\/12.277287"},{"key":"ref26","doi-asserted-by":"publisher","DOI":"10.1145\/3472456.3472469"},{"key":"ref27","doi-asserted-by":"publisher","DOI":"10.1145\/3007787.3001154"},{"key":"ref28","doi-asserted-by":"publisher","DOI":"10.1016\/j.patcog.2017.10.013"},{"key":"ref29","doi-asserted-by":"publisher","DOI":"10.7906\/indecs.20.2.8"},{"key":"ref30","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR.2016.90"},{"key":"ref31","doi-asserted-by":"publisher","DOI":"10.1109\/FPL53798.2021.00040"},{"key":"ref32","article-title":"Cross-silo federated learning: Challenges and opportunities","author":"Huang","year":"2022","journal-title":"arXiv preprint arXiv:2206.12949"},{"key":"ref33","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR.2017.243"},{"key":"ref34","article-title":"Intel paillier cryptosystem library","year":"2022"},{"key":"ref35","article-title":"Data plane development kit","year":"2023"},{"key":"ref36","first-page":"9","article-title":"Lambda fl: Serverless aggregation for federated learning","volume-title":"International Workshop on Trustable, Verifiable and Auditable Federated Learning","author":"Jayaram"},{"key":"ref37","article-title":"Flashe: Additively symmetric homomorphic encryption for cross-silo federated learning","author":"Jiang","year":"2021","journal-title":"arXiv preprint arXiv:2109.00675"},{"key":"ref38","first-page":"649","article-title":"{OpenExpress}: Fully hardware automated open research framework for future fast {NVMe} devices","volume-title":"2020 USENIX Annual Technical Conference (USENIX ATC 20)","author":"Jung"},{"key":"ref39","doi-asserted-by":"publisher","DOI":"10.1561\/2200000083"},{"key":"ref40","first-page":"241","article-title":"Designing a true {Direct-Access} file system with {DevFS}","volume-title":"16th USENIX Conference on File and Storage Technologies (FAST 18)","author":"Kannan"},{"key":"ref41","article-title":"A distributed and elastic aggregation service for scalable federated learning systems","author":"Khan","year":"2022","journal-title":"arXiv preprint arXiv:2204.07767"},{"key":"ref42","first-page":"275","article-title":"Rearchitecting the {TCP} stack for {I\/O-Offloaded} content delivery","volume-title":"20th USENIX Symposium on Networked Systems Design and Implementation (NSDI 23)","author":"Kim"},{"key":"ref43","first-page":"219","article-title":"Summarizer: trading communication with computing near storage","volume-title":"Proceedings of the 50th Annual IEEE\/ACM International Symposium on Microarchitecture","author":"Koo"},{"key":"ref44","article-title":"Learning multiple layers of features from tiny images","author":"Krizhevsky","year":"2009"},{"key":"ref45","first-page":"367","article-title":"Mage: Nearly zero-cost virtual memory for secure computation","author":"Kumar","year":"2021","journal-title":"OSDI"},{"key":"ref46","doi-asserted-by":"publisher","DOI":"10.1145\/3385073"},{"key":"ref47","first-page":"147","article-title":"{Hardware\/Software} {Co-Programmable} framework for computational {SSDs} to accelerate deep learning service on {Large-Scale} graphs","volume-title":"20th USENIX Conference on File and Storage Technologies (FAST 22)","author":"Kwon"},{"key":"ref48","first-page":"741","article-title":"{ATP}: In-network aggregation for multi-tenant learning","volume-title":"18th USENIX Symposium on Networked Systems Design and Implementation (NSDI 21)","author":"Lao"},{"key":"ref49","doi-asserted-by":"publisher","DOI":"10.1109\/LCA.2020.3009347"},{"key":"ref50","doi-asserted-by":"publisher","DOI":"10.1145\/3470496.3527391"},{"key":"ref51","doi-asserted-by":"publisher","DOI":"10.3390\/electronics11223767"},{"key":"ref52","doi-asserted-by":"publisher","DOI":"10.1145\/3470496.3527433"},{"key":"ref53","doi-asserted-by":"publisher","DOI":"10.2172\/1783736"},{"key":"ref54","doi-asserted-by":"publisher","DOI":"10.1109\/TBDATA.2022.3190835"},{"key":"ref55","doi-asserted-by":"publisher","DOI":"10.1145\/3450288"},{"key":"ref56","doi-asserted-by":"publisher","DOI":"10.1016\/j.jss.2022.111357"},{"key":"ref57","doi-asserted-by":"publisher","DOI":"10.1109\/TMC.2022.3219485"},{"key":"ref58","doi-asserted-by":"publisher","DOI":"10.1145\/3503222.3507702"},{"key":"ref59","first-page":"19478","article-title":"Throughput-optimal topology design for cross-silo federated learning","volume":"33","author":"Marfoq","year":"2020","journal-title":"Advances in Neural Information Processing Systems"},{"key":"ref60","doi-asserted-by":"publisher","DOI":"10.1145\/3544216.3544238"},{"key":"ref61","article-title":"Unvme - a user space nvme driver project","year":"2015"},{"key":"ref62","first-page":"77","article-title":"{AccelTCP}: Accelerating network applications with stateful {TCP} offloading","volume-title":"17th USENIX Symposium on Networked Systems Design and Implementation (NSDI 20)","author":"Moon"},{"key":"ref63","doi-asserted-by":"publisher","DOI":"10.1049\/iet-cdt.2015.0055"},{"key":"ref64","doi-asserted-by":"publisher","DOI":"10.1109\/FPGA.2002.1106687"},{"key":"ref65","doi-asserted-by":"publisher","DOI":"10.1007\/3-540-48910-X_16"},{"key":"ref66","doi-asserted-by":"publisher","DOI":"10.1109\/ICTC55196.2022.9952531"},{"key":"ref67","article-title":"Effect of homomorphic encryption on the performance of training federated learning generative adversarial networks","author":"Pejic","year":"2022","journal-title":"arXiv preprint arXiv:2207.00263"},{"key":"ref68","doi-asserted-by":"publisher","DOI":"10.17487\/rfc0879"},{"key":"ref69","first-page":"379","article-title":"{INSIDER}: Designing {In-Storage} computing system for emerging {High-Performance} drive","volume-title":"2019 USENIX Annual Technical Conference (USENIX ATC 19","author":"Ruan"},{"key":"ref70","doi-asserted-by":"publisher","DOI":"10.1145\/3466752.3480070"},{"key":"ref71","article-title":"Insights into privacy-preserving federated machine learning from the perspective of a national statistical office","author":"Santos","year":"2023"},{"key":"ref72","first-page":"10533","article-title":"Dres-fl: Dropout-resilient secure federated learning for non-iid clients via secret data sharing","volume":"35","author":"Shao","year":"2022","journal-title":"Advances in Neural Information Processing Systems"},{"key":"ref73","first-page":"87","article-title":"{FlexTOE}: Flexible {TCP} offload with {Fine-Grained} parallelism","volume-title":"19th USENIX Symposium on Networked Systems Design and Implementation (NSDI 22)","author":"Shashidhara"},{"key":"ref74","doi-asserted-by":"publisher","DOI":"10.1109\/HCS59251.2023.10254692"},{"key":"ref75","doi-asserted-by":"publisher","DOI":"10.1109\/ISSCC42615.2023.10067522"},{"key":"ref76","article-title":"A case for offloading federated learning server on smart nic","author":"Shibahara","year":"2023","journal-title":"arXiv preprint arXiv:2307.06561"},{"key":"ref77","doi-asserted-by":"publisher","DOI":"10.1109\/FPL.2016.7577319"},{"key":"ref78","article-title":"Very deep convolutional networks for large-scale image recognition","author":"Simonyan","year":"2014","journal-title":"arXiv preprint arXiv:1409.1556"},{"key":"ref79","doi-asserted-by":"publisher","DOI":"10.1109\/MSE.2007.44"},{"key":"ref80","first-page":"6105","article-title":"Efficientnet: Rethinking model scaling for convolutional neural networks","volume-title":"International conference on machine learning","author":"Tan"},{"key":"ref81","article-title":"Daisyplus pcie nvme storage accelerator","author":"Technology","year":"2021"},{"key":"ref82","doi-asserted-by":"publisher","DOI":"10.1145\/3510033"},{"key":"ref83","doi-asserted-by":"publisher","DOI":"10.1145\/3373376.3378528"},{"key":"ref84","doi-asserted-by":"publisher","DOI":"10.1016\/j.future.2019.09.010"},{"key":"ref85","first-page":"967","article-title":"{FpgaNIC} An {FPGA-based} versatile 100gb {SmartNIC} for {GPUs}","volume-title":"2022 USENIX Annual Technical Conference (USENIX ATC 22)","author":"Wang"},{"key":"ref86","doi-asserted-by":"publisher","DOI":"10.1109\/INFOCOM42981.2021.9488756"},{"key":"ref87","doi-asserted-by":"publisher","DOI":"10.1109\/ACCESS.2022.3206785"},{"key":"ref88","doi-asserted-by":"publisher","DOI":"10.1109\/TIFS.2020.2988575"},{"key":"ref89","doi-asserted-by":"publisher","DOI":"10.1145\/3445814.3446763"},{"key":"ref90","doi-asserted-by":"publisher","DOI":"10.1016\/j.sysarc.2013.12.002"},{"key":"ref91","article-title":"Fashion-mnist: a novel image dataset for benchmarking machine learning algorithms","author":"Xiao","year":"2017","journal-title":"arXiv preprint arXiv:1708.07747"},{"key":"ref92","article-title":"Alveo u55c high performance compute card","year":"2021"},{"key":"ref93","article-title":"Vitis software platform release notes","year":"2021"},{"key":"ref94","article-title":"Ultrascale+ integrated 100g ethernet subsystem","year":"2023"},{"key":"ref95","article-title":"Xilinx runtime library (xrt)","year":"2023"},{"key":"ref96","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR52688.2022.02020"},{"key":"ref97","article-title":"Fpga-based hardware accelerator of homomorphic encryption for efficient federated learning","author":"Yang","year":"2020","journal-title":"arXiv preprint arXiv:2007.10560"},{"key":"ref98","first-page":"347","article-title":"\u03bb-IO: A unified {IO} stack for computational storage","volume-title":"21st USENIX Conference on File and Storage Technologies (FAST 23)","author":"Yang"},{"key":"ref99","doi-asserted-by":"publisher","DOI":"10.1162\/neco_a_01199"},{"key":"ref100","article-title":"A smartnic-based secure aggregation scheme for federated learning","author":"Zang","year":"2022"},{"key":"ref101","article-title":"Batchcrypt: Efficient homomorphic encryption for cross-silo federated learning","volume-title":"Proceedings of the 2020 USENIX Annual Technical Conference (USENIX ATC 2020)","author":"Zhang"},{"key":"ref102","doi-asserted-by":"publisher","DOI":"10.1109\/ISCA45697.2020.00090"},{"key":"ref103","first-page":"1057","article-title":"{FLASH}: Towards a high-performance hardware acceleration architecture for cross-silo federated learning","volume-title":"20th USENIX Symposium on Networked Systems Design and Implementation (NSDI 23)","author":"Zhang"},{"key":"ref104","doi-asserted-by":"publisher","DOI":"10.1016\/j.neucom.2017.01.026"},{"key":"ref105","doi-asserted-by":"publisher","DOI":"10.1145\/2741948.2741949"},{"key":"ref106","doi-asserted-by":"publisher","DOI":"10.1186\/s12911-019-0913-x"}],"event":{"name":"2024 ACM\/IEEE 51st Annual International Symposium on Computer Architecture (ISCA)","location":"Buenos Aires, Argentina","start":{"date-parts":[[2024,6,29]]},"end":{"date-parts":[[2024,7,3]]}},"container-title":["2024 ACM\/IEEE 51st Annual International Symposium on Computer Architecture (ISCA)"],"original-title":[],"link":[{"URL":"http:\/\/xplorestaging.ieee.org\/ielx8\/10609566\/10609567\/10609633.pdf?arnumber=10609633","content-type":"unspecified","content-version":"vor","intended-application":"similarity-checking"}],"deposited":{"date-parts":[[2024,8,3]],"date-time":"2024-08-03T05:25:55Z","timestamp":1722662755000},"score":1,"resource":{"primary":{"URL":"https:\/\/ieeexplore.ieee.org\/document\/10609633\/"}},"subtitle":[],"short-title":[],"issued":{"date-parts":[[2024,6,29]]},"references-count":106,"URL":"https:\/\/doi.org\/10.1109\/isca59077.2024.00071","relation":{},"subject":[],"published":{"date-parts":[[2024,6,29]]}}}