{"status":"ok","message-type":"work","message-version":"1.0.0","message":{"indexed":{"date-parts":[[2025,11,21]],"date-time":"2025-11-21T05:56:24Z","timestamp":1763704584285,"version":"3.45.0"},"reference-count":30,"publisher":"IEEE","license":[{"start":{"date-parts":[[2025,10,26]],"date-time":"2025-10-26T00:00:00Z","timestamp":1761436800000},"content-version":"stm-asf","delay-in-days":0,"URL":"https:\/\/doi.org\/10.15223\/policy-029"},{"start":{"date-parts":[[2025,10,26]],"date-time":"2025-10-26T00:00:00Z","timestamp":1761436800000},"content-version":"stm-asf","delay-in-days":0,"URL":"https:\/\/doi.org\/10.15223\/policy-037"}],"funder":[{"DOI":"10.13039\/100000001","name":"National Science Foundation","doi-asserted-by":"publisher","id":[{"id":"10.13039\/100000001","id-type":"DOI","asserted-by":"publisher"}]}],"content-domain":{"domain":[],"crossmark-restriction":false},"short-container-title":[],"published-print":{"date-parts":[[2025,10,26]]},"DOI":"10.1109\/iccad66269.2025.11240876","type":"proceedings-article","created":{"date-parts":[[2025,11,20]],"date-time":"2025-11-20T18:39:34Z","timestamp":1763663974000},"page":"1-9","source":"Crossref","is-referenced-by-count":0,"title":["3D Acceleration for Mixture-of-Experts and Multi-Head Attention Spiking Transformers with Dynamic Head Pruning"],"prefix":"10.1109","author":[{"given":"Boxun","family":"Xu","sequence":"first","affiliation":[{"name":"University of California,Department of Electrical and Computer Engineering,Santa Barbara,CA,USA"}]},{"given":"Junyoung","family":"Hwang","sequence":"additional","affiliation":[{"name":"Georgia Institute of Technology,Department of Electrical and Computer Engineering,GA,USA"}]},{"given":"Pruek","family":"Vanna-Iampikul","sequence":"additional","affiliation":[{"name":"Georgia Institute of Technology,Department of Electrical and Computer Engineering,GA,USA"}]},{"given":"Yuxuan","family":"Yin","sequence":"additional","affiliation":[{"name":"University of California,Department of Electrical and Computer Engineering,Santa Barbara,CA,USA"}]},{"given":"Sung Kyu","family":"Lim","sequence":"additional","affiliation":[{"name":"Georgia Institute of Technology,Department of Electrical and Computer Engineering,GA,USA"}]},{"given":"Peng","family":"Li","sequence":"additional","affiliation":[{"name":"University of California,Department of Electrical and Computer Engineering,Santa Barbara,CA,USA"}]}],"member":"263","reference":[{"article-title":"An image is worth 16x16 words: Transformers for image recognition at scale","volume-title":"International Conference on Learning Representations","author":"Dosovitskiy","key":"ref1"},{"key":"ref2","first-page":"8821","article-title":"Zero-shot text-to-image generation","volume-title":"Proceedings of the 38th International Conference on Machine Learning","volume":"139","author":"Ramesh"},{"article-title":"Mistral 7b","year":"2023","author":"Jiang","key":"ref3"},{"key":"ref4","first-page":"4057","article-title":"Unified scaling laws for routed language models","volume-title":"International Conference on machine learning","author":"Clark"},{"key":"ref5","first-page":"8583","article-title":"Scaling vision with sparse mixture of experts","volume-title":"Advances in Neural Information Processing Systems","volume":"34","author":"Riquelme"},{"key":"ref6","first-page":"28 441","article-title":"M3vit: Mixture-of-experts vision transformer for efficient multitask learning with model-accelerator co-design","volume-title":"Advances in Neural Information Processing Systems","volume":"35","author":"Fan"},{"issue":"9","key":"ref7","first-page":"1659","article-title":"Networks of spiking neurons: The third generation of neural network models","volume-title":"Neural Networks","volume":"10","author":"Maass","year":"1997"},{"key":"ref8","doi-asserted-by":"publisher","DOI":"10.1109\/TCAD.2015.2474396"},{"key":"ref9","doi-asserted-by":"publisher","DOI":"10.1109\/MM.2018.112130359"},{"key":"ref10","doi-asserted-by":"publisher","DOI":"10.1109\/HPCA53966.2022.00031"},{"article-title":"Spikformer: When spiking neural network meets transformer","volume-title":"The Eleventh International Conference on Learning Representations","author":"Zhou","key":"ref11"},{"key":"ref12","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR52688.2022.00860"},{"article-title":"Dista: Denoising spiking transformer with intrinsic plasticity and spatiotemporal attention","year":"2023","author":"Xu","key":"ref13"},{"article-title":"Spike-driven transformer","year":"2023","author":"Yao","key":"ref14"},{"key":"ref15","doi-asserted-by":"publisher","DOI":"10.1109\/ICCD50377.2020.00027"},{"key":"ref16","doi-asserted-by":"publisher","DOI":"10.1109\/HPCA53966.2022.00031"},{"key":"ref17","doi-asserted-by":"publisher","DOI":"10.1109\/isca45697.2020.00038"},{"article-title":"Spikex: Exploring accelerator architecture and network-hardware co-optimization for sparse spiking neural networks","year":"2025","author":"Xu","key":"ref18"},{"key":"ref19","doi-asserted-by":"publisher","DOI":"10.1145\/3695053.3731063"},{"key":"ref20","doi-asserted-by":"publisher","DOI":"10.1145\/3676536.3676826"},{"key":"ref21","doi-asserted-by":"publisher","DOI":"10.1109\/asap65064.2025.00016"},{"issue":"120","key":"ref22","first-page":"1","article-title":"Switch transformers: Scaling to trillion parameter models with simple and efficient sparsity","volume":"23","author":"Fedus","year":"2022","journal-title":"Journal of Machine Learning Research"},{"key":"ref23","doi-asserted-by":"publisher","DOI":"10.1145\/3649329.3658482"},{"key":"ref24","doi-asserted-by":"publisher","DOI":"10.1109\/ISCA45697.2020.00039"},{"key":"ref25","doi-asserted-by":"publisher","DOI":"10.1109\/ISSCC49657.2024.10454472"},{"key":"ref26","doi-asserted-by":"publisher","DOI":"10.1145\/3195970.3196024"},{"key":"ref27","doi-asserted-by":"publisher","DOI":"10.1145\/3240765.3264695"},{"key":"ref28","first-page":"22 137","article-title":"Deja vu: Contextual sparsity for efficient llms at inference time","volume-title":"International Conference on Machine Learning","author":"Liu"},{"article-title":"The cifar-10 dataset","year":"2014","author":"Krizhevsky","key":"ref29"},{"key":"ref30","doi-asserted-by":"publisher","DOI":"10.1145\/3400302.3415720"}],"event":{"name":"2025 IEEE\/ACM International Conference On Computer Aided Design (ICCAD)","start":{"date-parts":[[2025,10,26]]},"location":"Munich, Germany","end":{"date-parts":[[2025,10,30]]}},"container-title":["2025 IEEE\/ACM International Conference On Computer Aided Design (ICCAD)"],"original-title":[],"link":[{"URL":"http:\/\/xplorestaging.ieee.org\/ielx8\/11240608\/11240621\/11240876.pdf?arnumber=11240876","content-type":"unspecified","content-version":"vor","intended-application":"similarity-checking"}],"deposited":{"date-parts":[[2025,11,21]],"date-time":"2025-11-21T05:45:40Z","timestamp":1763703940000},"score":1,"resource":{"primary":{"URL":"https:\/\/ieeexplore.ieee.org\/document\/11240876\/"}},"subtitle":[],"short-title":[],"issued":{"date-parts":[[2025,10,26]]},"references-count":30,"URL":"https:\/\/doi.org\/10.1109\/iccad66269.2025.11240876","relation":{},"subject":[],"published":{"date-parts":[[2025,10,26]]}}}