{"status":"ok","message-type":"work","message-version":"1.0.0","message":{"indexed":{"date-parts":[[2025,10,14]],"date-time":"2025-10-14T05:44:02Z","timestamp":1760420642150,"version":"build-2065373602"},"reference-count":23,"publisher":"IEEE","license":[{"start":{"date-parts":[[2025,5,23]],"date-time":"2025-05-23T00:00:00Z","timestamp":1747958400000},"content-version":"stm-asf","delay-in-days":0,"URL":"https:\/\/doi.org\/10.15223\/policy-029"},{"start":{"date-parts":[[2025,5,23]],"date-time":"2025-05-23T00:00:00Z","timestamp":1747958400000},"content-version":"stm-asf","delay-in-days":0,"URL":"https:\/\/doi.org\/10.15223\/policy-037"}],"funder":[{"DOI":"10.13039\/100006190","name":"Research and Development","doi-asserted-by":"publisher","id":[{"id":"10.13039\/100006190","id-type":"DOI","asserted-by":"publisher"}]}],"content-domain":{"domain":[],"crossmark-restriction":false},"short-container-title":[],"published-print":{"date-parts":[[2025,5,23]]},"DOI":"10.1109\/icmlt65785.2025.11193392","type":"proceedings-article","created":{"date-parts":[[2025,10,13]],"date-time":"2025-10-13T17:39:05Z","timestamp":1760377145000},"page":"373-382","source":"Crossref","is-referenced-by-count":0,"title":["AD-KFAC: Asynchronous Decentralized Distributed K-FAC with Dynamic Load Balancing and Fault Tolerance"],"prefix":"10.1109","author":[{"given":"Mingzhe","family":"Yu","sequence":"first","affiliation":[{"name":"University of Tsukuba,Graduate School of Science and Technology,Tsukuba,Japan"}]},{"given":"Osamu","family":"Tatebe","sequence":"additional","affiliation":[{"name":"University of Tsukuba,Center for Computational Sciences,Tsukuba,Japan"}]}],"member":"263","reference":[{"key":"ref1","first-page":"2408","article-title":"Optimizing neural networks with kronecker-factored approximate curvature","volume-title":"Proceedings of the 32nd International Conference on Machine Learning, ICML 2015, Lille, France, 6-11 July 2015","volume":"37","author":"Martens"},{"key":"ref2","first-page":"573","article-title":"A kronecker-factored approximate fisher matrix for convolution layers","volume-title":"Proceedings of the 33nd International Conference on Machine Learning, ICML 2016, New York City, NY, USA, June 19-24, 2016","volume":"48","author":"Grosse"},{"article-title":"Kronecker-factored curvature approximations for recurrent neural networks","volume-title":"6th International Conference on Learning Representations, ICLR 2018, Vancouver, BC, Canada, April 30 - May 3, 2018, Conference Track Proceedings","author":"Martens","key":"ref3"},{"key":"ref4","doi-asserted-by":"publisher","DOI":"10.1145\/3394486.3403265"},{"key":"ref5","article-title":"Second-order optimization method for large mini-batch: Training resnet-50 on imagenet in 35 epochs","volume-title":"CoRR","volume":"abs\/1811.12019","author":"Osawa","year":"2018"},{"key":"ref6","first-page":"12 359","article-title":"Large-scale distributed second-order optimization using kronecker-factored approximate curvature for deep convolutional neural networks","volume-title":"IEEE Conference on Computer Vision and Pattern Recognition, CVPR 2019, Long Beach, CA, USA, June 16-20, 2019.","author":"Osawa"},{"key":"ref7","doi-asserted-by":"publisher","DOI":"10.1109\/sc41405.2020.00098"},{"key":"ref8","doi-asserted-by":"publisher","DOI":"10.1109\/infocom53939.2023.10228871"},{"key":"ref9","article-title":"Pipefisher: Efficient training of large language models using pipelining and fisher information matrices","volume-title":"CoRR","volume":"abs\/2211.14133","author":"Osawa","year":"2022"},{"key":"ref10","first-page":"3049","article-title":"Asynchronous decentralized parallel stochastic gradient descent","volume-title":"Proceedings of the 35th International Conference on Machine Learning, ICML 2018, Stockholmsm\u00e4ssan, Stockholm, Sweden, July 10-15, 2018","volume":"80","author":"Lian"},{"article-title":"SWIFT: rapid decentralized federated learning via wait-free model communication","volume-title":"The Eleventh International Conference on Learning Representations, ICLR 2023, Kigali, Rwanda, May 1-5, 2023","author":"Bornstein","key":"ref11"},{"article-title":"Distributed second-order optimization using kronecker-factored approximations","volume-title":"5th International Conference on Learning Representations, ICLR 2017, Toulon, France, April 24-26, 2017, Conference Track Proceedings","author":"Ba","key":"ref12"},{"key":"ref13","doi-asserted-by":"publisher","DOI":"10.1145\/3458817.3476152"},{"key":"ref14","first-page":"64","article-title":"Asynchronous SGD on graphs: a unified framework for asynchronous decentralized and federated optimization","volume-title":"International Conference on Artificial Intelligence and Statistics, 2-4 May 2024, Palau de Congressos, Valencia, Spain","volume":"238","author":"Even"},{"key":"ref15","doi-asserted-by":"publisher","DOI":"10.1137\/1.9781611978032.95"},{"key":"ref16","first-page":"13 975","article-title":"Exponential graph is provably efficient for decentralized deep training","volume-title":"Advances in Neural Information Processing Systems 34: Annual Conference on Neural Information Processing Systems 2021, NeurIPS 2021, December 6-14, 2021, virtual","author":"Ying"},{"key":"ref17","first-page":"7202","article-title":"Distributed learning over unreliable networks","volume-title":"Proceedings of the 36th International Conference on Machine Learning, ICML 2019, 9-15 June 2019, Long Beach, California, USA","volume":"97","author":"Yu"},{"key":"ref18","doi-asserted-by":"publisher","DOI":"10.1016\/j.comcom.2023.02.025"},{"key":"ref19","doi-asserted-by":"publisher","DOI":"10.1109\/tcc.2022.3205918"},{"key":"ref20","first-page":"305","article-title":"In search of an understandable consensus algorithm","volume-title":"Proceedings of the 2014 USENIX Annual Technical Conference, USENIX ATC 2014, Philadelphia, PA, USA, June 19-20, 2014","author":"Ongaro"},{"issue":"12","key":"ref21","first-page":"3005","article-title":"Pytorch distributed: Experiences on accelerating data parallel training","volume-title":"Proc. VLDB Endow","volume":"13","author":"Li"},{"key":"ref22","doi-asserted-by":"publisher","DOI":"10.1109\/cvpr.2016.90"},{"article-title":"Fedavg with fine tuning: Local updates lead to representation learning","volume-title":"Advances in Neural Information Processing Systems 35: Annual Conference on Neural Information Processing Systems 2022, NeurIPS 2022, New Orleans, LA, USA, November 28 - December 9, 2022","author":"Collins","key":"ref23"}],"event":{"name":"2025 10th International Conference on Machine Learning Technologies (ICMLT)","start":{"date-parts":[[2025,5,23]]},"location":"Helsinki, Finland","end":{"date-parts":[[2025,5,25]]}},"container-title":["2025 10th International Conference on Machine Learning Technologies (ICMLT)"],"original-title":[],"link":[{"URL":"http:\/\/xplorestaging.ieee.org\/ielx8\/11192828\/11192850\/11193392.pdf?arnumber=11193392","content-type":"unspecified","content-version":"vor","intended-application":"similarity-checking"}],"deposited":{"date-parts":[[2025,10,14]],"date-time":"2025-10-14T05:09:16Z","timestamp":1760418556000},"score":1,"resource":{"primary":{"URL":"https:\/\/ieeexplore.ieee.org\/document\/11193392\/"}},"subtitle":[],"short-title":[],"issued":{"date-parts":[[2025,5,23]]},"references-count":23,"URL":"https:\/\/doi.org\/10.1109\/icmlt65785.2025.11193392","relation":{},"subject":[],"published":{"date-parts":[[2025,5,23]]}}}