{"status":"ok","message-type":"work","message-version":"1.0.0","message":{"indexed":{"date-parts":[[2026,1,25]],"date-time":"2026-01-25T16:05:45Z","timestamp":1769357145894,"version":"3.49.0"},"reference-count":47,"publisher":"Institute of Electrical and Electronics Engineers (IEEE)","issue":"11","license":[{"start":{"date-parts":[[2022,11,1]],"date-time":"2022-11-01T00:00:00Z","timestamp":1667260800000},"content-version":"vor","delay-in-days":0,"URL":"https:\/\/ieeexplore.ieee.org\/Xplorehelp\/downloads\/license-information\/IEEE.html"},{"start":{"date-parts":[[2022,11,1]],"date-time":"2022-11-01T00:00:00Z","timestamp":1667260800000},"content-version":"stm-asf","delay-in-days":0,"URL":"https:\/\/doi.org\/10.15223\/policy-029"},{"start":{"date-parts":[[2022,11,1]],"date-time":"2022-11-01T00:00:00Z","timestamp":1667260800000},"content-version":"stm-asf","delay-in-days":0,"URL":"https:\/\/doi.org\/10.15223\/policy-037"}],"funder":[{"name":"National Key Research and Development Program of China","award":["2016YFB1000403"],"award-info":[{"award-number":["2016YFB1000403"]}]}],"content-domain":{"domain":[],"crossmark-restriction":false},"short-container-title":["IEEE Trans. Parallel Distrib. Syst."],"published-print":{"date-parts":[[2022,11,1]]},"DOI":"10.1109\/tpds.2022.3145163","type":"journal-article","created":{"date-parts":[[2022,1,25]],"date-time":"2022-01-25T20:28:30Z","timestamp":1643142510000},"page":"2846-2859","source":"Crossref","is-referenced-by-count":21,"title":["Bridging the Gap between Deep Learning and Frustrated Quantum Spin System for Extreme-Scale Simulations on New Generation of Sunway Supercomputer"],"prefix":"10.1109","volume":"33","author":[{"ORCID":"https:\/\/orcid.org\/0000-0002-1079-3126","authenticated-orcid":false,"given":"Mingfan","family":"Li","sequence":"first","affiliation":[{"name":"School of Computer Science and Technology, University of Science and Technology of China, Hefei, Anhui, China"}],"role":[{"role":"author","vocabulary":"crossref"}]},{"ORCID":"https:\/\/orcid.org\/0000-0002-6487-3658","authenticated-orcid":false,"given":"Junshi","family":"Chen","sequence":"additional","affiliation":[{"name":"School of Computer Science and Technology, University of Science and Technology of China, Hefei, Anhui, China"}],"role":[{"role":"author","vocabulary":"crossref"}]},{"given":"Qian","family":"Xiao","sequence":"additional","affiliation":[{"name":"School of Computer Science and Technology, University of Science and Technology of China, Hefei, Anhui, China"}],"role":[{"role":"author","vocabulary":"crossref"}]},{"given":"Fei","family":"Wang","sequence":"additional","affiliation":[{"name":"Department of Computer Science and Technology, Tsinghua University, Beijing, China"}],"role":[{"role":"author","vocabulary":"crossref"}]},{"given":"Qingcai","family":"Jiang","sequence":"additional","affiliation":[{"name":"School of Computer Science and Technology, University of Science and Technology of China, Hefei, Anhui, China"}],"role":[{"role":"author","vocabulary":"crossref"}]},{"given":"Xuncheng","family":"Zhao","sequence":"additional","affiliation":[{"name":"School of Computer Science and Technology, University of Science and Technology of China, Hefei, Anhui, China"}],"role":[{"role":"author","vocabulary":"crossref"}]},{"given":"Rongfen","family":"Lin","sequence":"additional","affiliation":[{"name":"Department of Computer Science and Technology, Tsinghua University, Beijing, China"}],"role":[{"role":"author","vocabulary":"crossref"}]},{"ORCID":"https:\/\/orcid.org\/0000-0002-3900-3722","authenticated-orcid":false,"given":"Hong","family":"An","sequence":"additional","affiliation":[{"name":"School of Computer Science and Technology, University of Science and Technology of China, Hefei, Anhui, China"}],"role":[{"role":"author","vocabulary":"crossref"}]},{"ORCID":"https:\/\/orcid.org\/0000-0002-7882-3571","authenticated-orcid":false,"given":"Xiao","family":"Liang","sequence":"additional","affiliation":[{"name":"CAS Key Lab of Quantum Information, University of Science and Technology of China, Hefei, Anhui, China"}],"role":[{"role":"author","vocabulary":"crossref"}]},{"ORCID":"https:\/\/orcid.org\/0000-0003-2050-134X","authenticated-orcid":false,"given":"Lixin","family":"He","sequence":"additional","affiliation":[{"name":"CAS Key Lab of Quantum Information, University of Science and Technology of China, Hefei, Anhui, China"}],"role":[{"role":"author","vocabulary":"crossref"}]}],"member":"263","reference":[{"key":"ref39","doi-asserted-by":"publisher","DOI":"10.1145\/3458817.3476174"},{"key":"ref38","doi-asserted-by":"publisher","DOI":"10.1145\/3458817.3476161"},{"key":"ref33","doi-asserted-by":"publisher","DOI":"10.1103\/PhysRevLett.95.100201"},{"key":"ref32","doi-asserted-by":"publisher","DOI":"10.1109\/SC41405.2020.00018"},{"key":"ref31","doi-asserted-by":"publisher","DOI":"10.1109\/TPDS.2018.2848618"},{"key":"ref30","doi-asserted-by":"publisher","DOI":"10.1109\/SC.2018.00068"},{"key":"ref37","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR.2019.01264"},{"key":"ref36","article-title":"Scalable second order optimization for deep learning","author":"anil","year":"2020"},{"key":"ref35","first-page":"2408","article-title":"Optimizing neural networks with kronecker-factored approximate curvature","author":"martens","year":"2015","journal-title":"Proc IEEE Intern Conf on Machine Learning"},{"key":"ref34","first-page":"1842","article-title":"Shampoo: Preconditioned stochastic tensor optimization","author":"gupta","year":"2018","journal-title":"Proc Int Conf Mach Learn"},{"key":"ref10","doi-asserted-by":"publisher","DOI":"10.1080\/00107514.2019.1579866"},{"key":"ref40","doi-asserted-by":"publisher","DOI":"10.1145\/3458817.3476158"},{"key":"ref11","doi-asserted-by":"publisher","DOI":"10.1103\/PhysRevB.98.104426"},{"key":"ref12","doi-asserted-by":"publisher","DOI":"10.1103\/PhysRevB.103.035138"},{"key":"ref13","doi-asserted-by":"publisher","DOI":"10.1103\/PhysRevX.11.031034"},{"key":"ref14","doi-asserted-by":"publisher","DOI":"10.1109\/FMPC.1992.234898"},{"key":"ref15","doi-asserted-by":"publisher","DOI":"10.12693\/APhysPolA.97.979"},{"key":"ref16","doi-asserted-by":"publisher","DOI":"10.1103\/PhysRevResearch.2.033075"},{"key":"ref17","doi-asserted-by":"publisher","DOI":"10.1007\/s11432-016-5588-7"},{"key":"ref18","doi-asserted-by":"publisher","DOI":"10.1093\/nsr\/nww044"},{"key":"ref19","doi-asserted-by":"publisher","DOI":"10.1109\/TPDS.2021.3091408"},{"key":"ref28","doi-asserted-by":"publisher","DOI":"10.1109\/SC41405.2020.00009"},{"key":"ref4","doi-asserted-by":"publisher","DOI":"10.1126\/science.aag2302"},{"key":"ref27","doi-asserted-by":"publisher","DOI":"10.1145\/3295500.3356147"},{"key":"ref3","doi-asserted-by":"publisher","DOI":"10.1145\/2063384.2063386"},{"key":"ref6","doi-asserted-by":"publisher","DOI":"10.1145\/3225058.3225069"},{"key":"ref29","doi-asserted-by":"publisher","DOI":"10.1109\/SC.2018.00054"},{"key":"ref5","article-title":"Scaling SGD batch size to 32K for ImageNet training","author":"you","year":"0"},{"key":"ref8","doi-asserted-by":"publisher","DOI":"10.1103\/PhysRevB.85.045103"},{"key":"ref7","doi-asserted-by":"publisher","DOI":"10.1145\/3295500.3356137"},{"key":"ref2","first-page":"45-es","article-title":"Large-scale electronic structure calculations of high-Z metals on the bluegene\/L platform","author":"gygi","year":"2006","journal-title":"Proc ACM\/IEEE Conf Supercomput"},{"key":"ref9","doi-asserted-by":"publisher","DOI":"10.1103\/PhysRevLett.80.4558"},{"key":"ref1","doi-asserted-by":"publisher","DOI":"10.1103\/RevModPhys.71.1253"},{"key":"ref46","doi-asserted-by":"publisher","DOI":"10.1103\/PhysRevB.100.125124"},{"key":"ref20","doi-asserted-by":"publisher","DOI":"10.1214\/ss\/1177011137"},{"key":"ref45","doi-asserted-by":"publisher","DOI":"10.1063\/1.2746035"},{"key":"ref22","doi-asserted-by":"publisher","DOI":"10.1103\/PhysRevB.78.180410"},{"key":"ref47","doi-asserted-by":"publisher","DOI":"10.1038\/s41467-020-15402-w"},{"key":"ref21","doi-asserted-by":"publisher","DOI":"10.1016\/j.ins.2020.12.079"},{"key":"ref42","doi-asserted-by":"publisher","DOI":"10.26599\/TST.2018.9010112"},{"key":"ref24","doi-asserted-by":"publisher","DOI":"10.1145\/3178487.3178495"},{"key":"ref41","doi-asserted-by":"publisher","DOI":"10.1145\/3458817.3476137"},{"key":"ref23","doi-asserted-by":"publisher","DOI":"10.1109\/IPDPS.2017.20"},{"key":"ref44","doi-asserted-by":"publisher","DOI":"10.1109\/HPCC\/SmartCity\/DSS.2019.00345"},{"key":"ref26","doi-asserted-by":"publisher","DOI":"10.1145\/2491956.2462181"},{"key":"ref43","doi-asserted-by":"publisher","DOI":"10.26599\/TST.2019.9010074"},{"key":"ref25","doi-asserted-by":"publisher","DOI":"10.1145\/3293883.3295716"}],"container-title":["IEEE Transactions on Parallel and Distributed Systems"],"original-title":[],"link":[{"URL":"http:\/\/xplorestaging.ieee.org\/ielx7\/71\/9782123\/09693260.pdf?arnumber=9693260","content-type":"unspecified","content-version":"vor","intended-application":"similarity-checking"}],"deposited":{"date-parts":[[2022,6,27]],"date-time":"2022-06-27T20:23:45Z","timestamp":1656361425000},"score":1,"resource":{"primary":{"URL":"https:\/\/ieeexplore.ieee.org\/document\/9693260\/"}},"subtitle":[],"short-title":[],"issued":{"date-parts":[[2022,11,1]]},"references-count":47,"journal-issue":{"issue":"11"},"URL":"https:\/\/doi.org\/10.1109\/tpds.2022.3145163","relation":{},"ISSN":["1045-9219","1558-2183","2161-9883"],"issn-type":[{"value":"1045-9219","type":"print"},{"value":"1558-2183","type":"electronic"},{"value":"2161-9883","type":"electronic"}],"subject":[],"published":{"date-parts":[[2022,11,1]]}}}