{"status":"ok","message-type":"work","message-version":"1.0.0","message":{"indexed":{"date-parts":[[2025,7,4]],"date-time":"2025-07-04T05:17:27Z","timestamp":1751606247465,"version":"3.28.0"},"reference-count":27,"publisher":"IEEE","license":[{"start":{"date-parts":[[2020,9,22]],"date-time":"2020-09-22T00:00:00Z","timestamp":1600732800000},"content-version":"vor","delay-in-days":0,"URL":"https:\/\/ieeexplore.ieee.org\/Xplorehelp\/downloads\/license-information\/IEEE.html"},{"start":{"date-parts":[[2020,9,22]],"date-time":"2020-09-22T00:00:00Z","timestamp":1600732800000},"content-version":"stm-asf","delay-in-days":0,"URL":"https:\/\/doi.org\/10.15223\/policy-029"},{"start":{"date-parts":[[2020,9,22]],"date-time":"2020-09-22T00:00:00Z","timestamp":1600732800000},"content-version":"stm-asf","delay-in-days":0,"URL":"https:\/\/doi.org\/10.15223\/policy-037"}],"content-domain":{"domain":[],"crossmark-restriction":false},"short-container-title":[],"published-print":{"date-parts":[[2020,9,22]]},"DOI":"10.1109\/hpec43674.2020.9286180","type":"proceedings-article","created":{"date-parts":[[2020,12,22]],"date-time":"2020-12-22T21:07:15Z","timestamp":1608671235000},"page":"1-7","source":"Crossref","is-referenced-by-count":7,"title":["Layer-Parallel Training with GPU Concurrency of Deep Residual Neural Networks via Nonlinear Multigrid"],"prefix":"10.1109","author":[{"given":"Andrew","family":"Kirby","sequence":"first","affiliation":[]},{"given":"Siddharth","family":"Samsi","sequence":"additional","affiliation":[]},{"given":"Michael","family":"Jones","sequence":"additional","affiliation":[]},{"given":"Albert","family":"Reuther","sequence":"additional","affiliation":[]},{"given":"Jeremy","family":"Kepner","sequence":"additional","affiliation":[]},{"given":"Vijay","family":"Gadepally","sequence":"additional","affiliation":[]}],"member":"263","reference":[{"key":"ref10","first-page":"6571","article-title":"Neural ordinary differential equations","author":"chen","year":"2018","journal-title":"Advances in neural information processing systems"},{"key":"ref11","doi-asserted-by":"publisher","DOI":"10.2514\/3.25233"},{"key":"ref12","first-page":"129","article-title":"Multigrid Techniques for Unstructured Mesh","volume":"5","author":"mavriplis","year":"1995","journal-title":"Numerical Methods for Fluid Dynamics"},{"journal-title":"Multilevel Minimization for Deep Residual Networks","year":"2020","author":"gaedke-merzhauser","key":"ref13"},{"key":"ref14","doi-asserted-by":"publisher","DOI":"10.1137\/19M1247620"},{"key":"ref15","doi-asserted-by":"publisher","DOI":"10.1145\/1365490.1365500"},{"journal-title":"cuDNN Efficient Primitives for Deep Learning","year":"2014","author":"chetlur","key":"ref16"},{"key":"ref17","doi-asserted-by":"publisher","DOI":"10.1137\/130944230"},{"key":"ref18","doi-asserted-by":"publisher","DOI":"10.1137\/16M1074096"},{"key":"ref19","doi-asserted-by":"publisher","DOI":"10.1137\/130944230"},{"key":"ref4","doi-asserted-by":"publisher","DOI":"10.1007\/s11263-015-0816-y"},{"key":"ref3","doi-asserted-by":"publisher","DOI":"10.1126\/science.aam9744"},{"key":"ref27","doi-asserted-by":"publisher","DOI":"10.1109\/MCSE.2017.57"},{"key":"ref6","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR.2016.90"},{"journal-title":"AI and Compute","year":"2018","author":"amodei","key":"ref5"},{"key":"ref8","doi-asserted-by":"publisher","DOI":"10.1109\/HPEC.2019.8916416"},{"journal-title":"Ai enabling technologies A survey","year":"2019","author":"gadepally","key":"ref7"},{"key":"ref2","doi-asserted-by":"publisher","DOI":"10.1109\/HPEC.2019.8916327"},{"journal-title":"Beyond finite layer neural networks Bridging deep architectures and numerical differential equations","year":"2017","author":"lu","key":"ref9"},{"key":"ref1","doi-asserted-by":"publisher","DOI":"10.1145\/3320060"},{"key":"ref20","doi-asserted-by":"publisher","DOI":"10.1007\/s00791-017-0283-9"},{"key":"ref22","doi-asserted-by":"publisher","DOI":"10.7551\/mitpress\/7056.001.0001"},{"key":"ref21","doi-asserted-by":"publisher","DOI":"10.1080\/10556788.2018.1504050"},{"key":"ref24","doi-asserted-by":"publisher","DOI":"10.1109\/5.726791"},{"key":"ref23","doi-asserted-by":"publisher","DOI":"10.1109\/HPEC.2018.8547629"},{"journal-title":"Megatron-lm Training multi-billion parameter language models using gpu model parallelism","year":"2019","author":"shoeybi","key":"ref26"},{"key":"ref25","doi-asserted-by":"publisher","DOI":"10.1007\/978-3-319-05083-6_5"}],"event":{"name":"2020 IEEE High Performance Extreme Computing Conference (HPEC)","start":{"date-parts":[[2020,9,22]]},"location":"Waltham, MA, USA","end":{"date-parts":[[2020,9,24]]}},"container-title":["2020 IEEE High Performance Extreme Computing Conference (HPEC)"],"original-title":[],"link":[{"URL":"http:\/\/xplorestaging.ieee.org\/ielx7\/9285977\/9286137\/09286180.pdf?arnumber=9286180","content-type":"unspecified","content-version":"vor","intended-application":"similarity-checking"}],"deposited":{"date-parts":[[2022,6,27]],"date-time":"2022-06-27T15:54:01Z","timestamp":1656345241000},"score":1,"resource":{"primary":{"URL":"https:\/\/ieeexplore.ieee.org\/document\/9286180\/"}},"subtitle":[],"short-title":[],"issued":{"date-parts":[[2020,9,22]]},"references-count":27,"URL":"https:\/\/doi.org\/10.1109\/hpec43674.2020.9286180","relation":{},"subject":[],"published":{"date-parts":[[2020,9,22]]}}}