{"status":"ok","message-type":"work","message-version":"1.0.0","message":{"indexed":{"date-parts":[[2025,10,18]],"date-time":"2025-10-18T00:10:04Z","timestamp":1760746204474,"version":"build-2065373602"},"reference-count":33,"publisher":"IEEE","license":[{"start":{"date-parts":[[2025,9,15]],"date-time":"2025-09-15T00:00:00Z","timestamp":1757894400000},"content-version":"stm-asf","delay-in-days":0,"URL":"https:\/\/doi.org\/10.15223\/policy-029"},{"start":{"date-parts":[[2025,9,15]],"date-time":"2025-09-15T00:00:00Z","timestamp":1757894400000},"content-version":"stm-asf","delay-in-days":0,"URL":"https:\/\/doi.org\/10.15223\/policy-037"}],"content-domain":{"domain":[],"crossmark-restriction":false},"short-container-title":[],"published-print":{"date-parts":[[2025,9,15]]},"DOI":"10.1109\/hpec67600.2025.11196476","type":"proceedings-article","created":{"date-parts":[[2025,10,16]],"date-time":"2025-10-16T17:35:37Z","timestamp":1760636137000},"page":"1-8","source":"Crossref","is-referenced-by-count":0,"title":["Accelerating Sparse Deep Learning via Multi-Layer Tensor Reordering and Partitioning"],"prefix":"10.1109","author":[{"given":"Gunduz Vehbi","family":"Demirci","sequence":"first","affiliation":[{"name":"Wayve,London,UK"}]},{"given":"Cagatay","family":"Dikici","sequence":"additional","affiliation":[{"name":"Wayve,London,UK"}]},{"given":"Tim","family":"Atherton","sequence":"additional","affiliation":[{"name":"Imagination Technologies,London,UK"}]}],"member":"263","reference":[{"key":"ref1","first-page":"129","article-title":"What is the state of neural network pruning?","volume-title":"Proceedings of machine learning and systems","volume":"2","author":"Blalock"},{"article-title":"The state of sparsity in deep neural networks","year":"2019","author":"Gale","key":"ref2"},{"key":"ref3","doi-asserted-by":"publisher","DOI":"10.1109\/HPEC.2019.8916336"},{"key":"ref4","doi-asserted-by":"publisher","DOI":"10.1016\/j.neucom.2021.07.045"},{"key":"ref5","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR.2015.7298681"},{"key":"ref6","first-page":"17283","article-title":"Big bird: Transformers for longer sequences","volume":"33","author":"Zaheer","year":"2020","journal-title":"Advances in neural information processing systems"},{"article-title":"Efficient language modeling with sparse all-mlp","year":"2022","author":"Yu","key":"ref7"},{"key":"ref8","doi-asserted-by":"publisher","DOI":"10.1145\/3020078.3021745"},{"key":"ref9","article-title":"Accelerating inference with sparsity using the nvidia ampere architecture and nvidia tensorrt","volume-title":"NVIDIA Developer Technical Blog","author":"Pool","year":"2021"},{"article-title":"Accelerating sparse deep neural networks","year":"2021","author":"Mishra","key":"ref10"},{"key":"ref11","first-page":"5533","article-title":"Inducing and exploiting activation sparsity for fast inference on deep neural networks","volume-title":"International Conference on Machine Learning","author":"Kurtz"},{"key":"ref12","first-page":"578","article-title":"{TVM}: An automated {End-to-End} optimizing compiler for deep learning","volume-title":"13th USENIX Symposium on Operating Systems Design and Implementation (OSDI 18)","author":"Chen"},{"key":"ref13","doi-asserted-by":"publisher","DOI":"10.1007\/978-3-319-16808-1_33"},{"key":"ref14","doi-asserted-by":"publisher","DOI":"10.1016\/S0025-5610(97)00009-9"},{"key":"ref15","article-title":"Hypergraph models for sparse matrix partitioning and reordering","volume-title":"Ph.D. dissertation","author":"\u00c7ataly\u00fcrek","year":"1999"},{"article-title":"Metis: A software package for partitioning unstructured graphs, partitioning meshes, and computing fill-reducing orderings of sparse matrices","year":"1997","author":"Karypis","key":"ref16"},{"key":"ref17","doi-asserted-by":"publisher","DOI":"10.1145\/3329872"},{"article-title":"Selective brain damage: Measuring the disparate impact of model pruning","year":"2019","author":"Hooker","key":"ref18"},{"key":"ref19","first-page":"744","article-title":"Efficient gpu kernels for n:msparse weights in deep learning","volume-title":"Proceedings of Machine Learning and Systems (MLSys)","volume":"5","author":"Zheng"},{"key":"ref20","doi-asserted-by":"publisher","DOI":"10.1109\/IPDPSW.2019.00051"},{"article-title":"Sparsednn: Fast sparse deep learning inference on cpus","year":"2021","author":"Wang","key":"ref21"},{"key":"ref22","doi-asserted-by":"publisher","DOI":"10.1145\/3447818.3460372"},{"key":"ref23","doi-asserted-by":"publisher","DOI":"10.1109\/HPEC49654.2021.9622791"},{"key":"ref24","doi-asserted-by":"publisher","DOI":"10.1109\/HPEC43674.2020.9286206"},{"key":"ref25","doi-asserted-by":"publisher","DOI":"10.1109\/HPEC43674.2020.9286154"},{"key":"ref26","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR.2018.00961"},{"key":"ref27","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR.2019.00319"},{"key":"ref28","first-page":"302","article-title":"Torchsparse: Efficient point cloud inference engine","volume-title":"Proceedings of Machine Learning and Systems","volume":"4","author":"Tang"},{"key":"ref29","doi-asserted-by":"publisher","DOI":"10.3390\/s18103337"},{"article-title":"Pytorch pruning example","year":"2020","author":"Mao","key":"ref30"},{"year":"2025","key":"ref31","article-title":"SparseZoo model repository"},{"key":"ref32","doi-asserted-by":"publisher","DOI":"10.1145\/3529090"},{"year":"2023","key":"ref33","article-title":"IMG Series4 Neural Network Accelerator (NNA)"}],"event":{"name":"2025 IEEE High Performance Extreme Computing Conference (HPEC)","start":{"date-parts":[[2025,9,15]]},"location":"Wakefield, MA, USA","end":{"date-parts":[[2025,9,19]]}},"container-title":["2025 IEEE High Performance Extreme Computing Conference (HPEC)"],"original-title":[],"link":[{"URL":"http:\/\/xplorestaging.ieee.org\/ielx8\/11196085\/11196088\/11196476.pdf?arnumber=11196476","content-type":"unspecified","content-version":"vor","intended-application":"similarity-checking"}],"deposited":{"date-parts":[[2025,10,17]],"date-time":"2025-10-17T04:47:25Z","timestamp":1760676445000},"score":1,"resource":{"primary":{"URL":"https:\/\/ieeexplore.ieee.org\/document\/11196476\/"}},"subtitle":[],"short-title":[],"issued":{"date-parts":[[2025,9,15]]},"references-count":33,"URL":"https:\/\/doi.org\/10.1109\/hpec67600.2025.11196476","relation":{},"subject":[],"published":{"date-parts":[[2025,9,15]]}}}