{"status":"ok","message-type":"work","message-version":"1.0.0","message":{"indexed":{"date-parts":[[2026,2,12]],"date-time":"2026-02-12T21:35:37Z","timestamp":1770932137396,"version":"3.50.1"},"reference-count":43,"publisher":"Institute of Electrical and Electronics Engineers (IEEE)","issue":"3","license":[{"start":{"date-parts":[[2026,3,1]],"date-time":"2026-03-01T00:00:00Z","timestamp":1772323200000},"content-version":"vor","delay-in-days":0,"URL":"https:\/\/ieeexplore.ieee.org\/Xplorehelp\/downloads\/license-information\/IEEE.html"},{"start":{"date-parts":[[2026,3,1]],"date-time":"2026-03-01T00:00:00Z","timestamp":1772323200000},"content-version":"stm-asf","delay-in-days":0,"URL":"https:\/\/doi.org\/10.15223\/policy-029"},{"start":{"date-parts":[[2026,3,1]],"date-time":"2026-03-01T00:00:00Z","timestamp":1772323200000},"content-version":"stm-asf","delay-in-days":0,"URL":"https:\/\/doi.org\/10.15223\/policy-037"}],"funder":[{"DOI":"10.13039\/501100018537","name":"National Science and Technology Major Project","doi-asserted-by":"publisher","award":["2022ZD0115200"],"award-info":[{"award-number":["2022ZD0115200"]}],"id":[{"id":"10.13039\/501100018537","id-type":"DOI","asserted-by":"publisher"}]},{"DOI":"10.13039\/501100001809","name":"National Natural Science Foundation of China","doi-asserted-by":"publisher","award":["62125403"],"award-info":[{"award-number":["62125403"]}],"id":[{"id":"10.13039\/501100001809","id-type":"DOI","asserted-by":"publisher"}]},{"DOI":"10.13039\/501100001809","name":"National Natural Science Foundation of China","doi-asserted-by":"publisher","award":["U24A20234"],"award-info":[{"award-number":["U24A20234"]}],"id":[{"id":"10.13039\/501100001809","id-type":"DOI","asserted-by":"publisher"}]},{"DOI":"10.13039\/501100001809","name":"National Natural Science Foundation of China","doi-asserted-by":"publisher","award":["92464302"],"award-info":[{"award-number":["92464302"]}],"id":[{"id":"10.13039\/501100001809","id-type":"DOI","asserted-by":"publisher"}]},{"DOI":"10.13039\/501100001809","name":"National Natural Science Foundation of China","doi-asserted-by":"publisher","award":["U24B20164"],"award-info":[{"award-number":["U24B20164"]}],"id":[{"id":"10.13039\/501100001809","id-type":"DOI","asserted-by":"publisher"}]},{"name":"Beijing S&#x0026;T","award":["Z251100008425010"],"award-info":[{"award-number":["Z251100008425010"]}]},{"name":"Shanghai Municipal Science and Technology Major Project"},{"name":"Natural Science Foundation of Jiangsu Province Basic Research Program","award":["BK20243042"],"award-info":[{"award-number":["BK20243042"]}]},{"DOI":"10.13039\/501100017582","name":"Beijing National Research Center for Information Science and Technology","doi-asserted-by":"publisher","id":[{"id":"10.13039\/501100017582","id-type":"DOI","asserted-by":"publisher"}]},{"name":"Northern IC Technology Innovation Center (Beijing) Company, Ltd.","award":["QYJS20232801B"],"award-info":[{"award-number":["QYJS20232801B"]}]},{"name":"Beijing Advanced Innovation Center for Integrated Circuits"}],"content-domain":{"domain":[],"crossmark-restriction":false},"short-container-title":["IEEE Trans. Comput."],"published-print":{"date-parts":[[2026,3]]},"DOI":"10.1109\/tc.2025.3648055","type":"journal-article","created":{"date-parts":[[2025,12,24]],"date-time":"2025-12-24T18:45:05Z","timestamp":1766601905000},"page":"1125-1140","source":"Crossref","is-referenced-by-count":0,"title":["Designing Spatial Architectures for Sparse Attention: STAR Accelerator via Cross-Stage Tiling"],"prefix":"10.1109","volume":"75","author":[{"ORCID":"https:\/\/orcid.org\/0000-0002-9763-8208","authenticated-orcid":false,"given":"Huizheng","family":"Wang","sequence":"first","affiliation":[{"name":"School of Integrated Circuits, Tsinghua University, Beijing, China"}],"role":[{"role":"author","vocabulary":"crossref"}]},{"ORCID":"https:\/\/orcid.org\/0009-0005-3501-3148","authenticated-orcid":false,"given":"Taiquan","family":"Wei","sequence":"additional","affiliation":[{"name":"School of Integrated Circuits, Tsinghua University, Beijing, China"}],"role":[{"role":"author","vocabulary":"crossref"}]},{"ORCID":"https:\/\/orcid.org\/0009-0003-2383-8084","authenticated-orcid":false,"given":"Hongbin","family":"Wang","sequence":"additional","affiliation":[{"name":"School of Integrated Circuits, Tsinghua University, Beijing, China"}],"role":[{"role":"author","vocabulary":"crossref"}]},{"ORCID":"https:\/\/orcid.org\/0009-0001-7114-0647","authenticated-orcid":false,"given":"Zichuan","family":"Wang","sequence":"additional","affiliation":[{"name":"School of Integrated Circuits, Tsinghua University, Beijing, China"}],"role":[{"role":"author","vocabulary":"crossref"}]},{"ORCID":"https:\/\/orcid.org\/0009-0004-6038-3709","authenticated-orcid":false,"given":"Xinru","family":"Tang","sequence":"additional","affiliation":[{"name":"School of Integrated Circuits, Tsinghua University, Beijing, China"}],"role":[{"role":"author","vocabulary":"crossref"}]},{"ORCID":"https:\/\/orcid.org\/0000-0003-4084-3478","authenticated-orcid":false,"given":"Zhiheng","family":"Yue","sequence":"additional","affiliation":[{"name":"School of Integrated Circuits, Tsinghua University, Beijing, China"}],"role":[{"role":"author","vocabulary":"crossref"}]},{"ORCID":"https:\/\/orcid.org\/0000-0001-5117-7920","authenticated-orcid":false,"given":"Shaojun","family":"Wei","sequence":"additional","affiliation":[{"name":"School of Integrated Circuits, Tsinghua University, Beijing, China"}],"role":[{"role":"author","vocabulary":"crossref"}]},{"ORCID":"https:\/\/orcid.org\/0000-0001-6942-4395","authenticated-orcid":false,"given":"Yang","family":"Hu","sequence":"additional","affiliation":[{"name":"School of Integrated Circuits, Tsinghua University, Beijing, China"}],"role":[{"role":"author","vocabulary":"crossref"}]},{"ORCID":"https:\/\/orcid.org\/0000-0003-2309-572X","authenticated-orcid":false,"given":"Shouyi","family":"Yin","sequence":"additional","affiliation":[{"name":"School of Integrated Circuits, Tsinghua University, Beijing, China"}],"role":[{"role":"author","vocabulary":"crossref"}]}],"member":"263","reference":[{"issue":"8","key":"ref1","first-page":"9","article-title":"Language models are unsupervised multitask learners","volume":"1","author":"Radford","year":"2019","journal-title":"OpenAI Blog"},{"key":"ref2","article-title":"GPT-4 technical report","author":"Achiam","year":"2023"},{"key":"ref3","article-title":"BERT: Pre-training of deep bidirectional transformers for language understanding","author":"Devlin","year":"2018"},{"key":"ref4","article-title":"The LLaMA 4 herd: The beginning of a new era of natively multimodal AI innovation","author":"Ai","year":"2025"},{"key":"ref5","doi-asserted-by":"publisher","DOI":"10.1109\/HPCA47549.2020.00035"},{"key":"ref6","doi-asserted-by":"publisher","DOI":"10.1109\/ISCA52012.2021.00060"},{"key":"ref7","doi-asserted-by":"publisher","DOI":"10.1145\/3466752.3480125"},{"key":"ref8","doi-asserted-by":"publisher","DOI":"10.1145\/3503222.3507738"},{"key":"ref9","doi-asserted-by":"publisher","DOI":"10.1145\/3579371.3589057"},{"key":"ref10","doi-asserted-by":"publisher","DOI":"10.1109\/HPCA51647.2021.00018"},{"key":"ref11","doi-asserted-by":"publisher","DOI":"10.1109\/TCAD.2022.3170848"},{"key":"ref12","first-page":"16344","article-title":"FlashAttention: Fast and memory-efficient exact attention with IO-awareness","volume":"35","author":"Dao","year":"2022","journal-title":"Adv. Neural Inf. Process. Syst."},{"key":"ref13","doi-asserted-by":"publisher","DOI":"10.1145\/1498765.1498785"},{"key":"ref14","article-title":"FlashAttention-2: Faster attention with better parallelism and work partitioning","author":"Dao","year":"2023"},{"key":"ref15","doi-asserted-by":"publisher","DOI":"10.1017\/cbo9780511921698"},{"key":"ref16","article-title":"Scaling laws for neural language models","author":"Kaplan","year":"2020"},{"key":"ref17","doi-asserted-by":"publisher","DOI":"10.1109\/MCAS.2024.3349669"},{"key":"ref18","article-title":"WATOS: Efficient LLM training strategies and architecture co-exploration for wafer-scale chip","author":"Wang","year":"2025"},{"key":"ref19","article-title":"TEMP: A memory efficient physical-aware tensor partition-mapping framework on wafer-scale chips","author":"Wang","year":"2025"},{"key":"ref20","doi-asserted-by":"publisher","DOI":"10.1109\/IPDPSW.2010.5470853"},{"key":"ref21","doi-asserted-by":"publisher","DOI":"10.1109\/HCS55958.2022.9895534"},{"key":"ref22","doi-asserted-by":"publisher","DOI":"10.1109\/ICCV48922.2021.00061"},{"key":"ref23","article-title":"BLOOM: A 176B-parameter open-access multilingual language model","author":"Scao","year":"2022"},{"key":"ref24","article-title":"LLaMa: Open and efficient foundation language models","author":"Touvron","year":"2023"},{"key":"ref25","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR.2018.00286"},{"key":"ref26","doi-asserted-by":"publisher","DOI":"10.1109\/LCA.2015.2414456"},{"key":"ref27","doi-asserted-by":"publisher","DOI":"10.1109\/MICRO61859.2024.00093"},{"key":"ref28","doi-asserted-by":"publisher","DOI":"10.1109\/ispass57527.2023.00035"},{"key":"ref29","doi-asserted-by":"publisher","DOI":"10.1109\/TCSI.2022.3229690"},{"key":"ref30","article-title":"Ring attention with blockwise transformers for near-infinite context","author":"Liu","year":"2023"},{"key":"ref31","doi-asserted-by":"publisher","DOI":"10.1145\/3352460.3358302"},{"key":"ref32","doi-asserted-by":"publisher","DOI":"10.1109\/HPCA56546.2023.10071027"},{"key":"ref33","doi-asserted-by":"publisher","DOI":"10.1145\/3370748.3406567"},{"key":"ref34","first-page":"571","article-title":"SALO: An efficient spatial accelerator enabling hybrid sparse attention mechanisms for long sequences","volume-title":"Proc. ACM\/IEEE Des. Autom. Conf.","author":"Shen","year":"2022"},{"key":"ref35","article-title":"PADE: A predictor-free sparse attention accelerator via unified execution and stage fusion","author":"Wang","year":"2025"},{"key":"ref36","doi-asserted-by":"publisher","DOI":"10.1109\/TCAD.2024.3373592"},{"key":"ref37","doi-asserted-by":"publisher","DOI":"10.1109\/TCSII.2025.3596228"},{"key":"ref38","doi-asserted-by":"publisher","DOI":"10.1109\/HPCA51647.2021.00017"},{"key":"ref39","doi-asserted-by":"publisher","DOI":"10.1109\/HPCA47549.2020.00029"},{"key":"ref40","doi-asserted-by":"publisher","DOI":"10.1109\/ICDSP.2018.8631556"},{"key":"ref41","doi-asserted-by":"publisher","DOI":"10.1145\/3725843.3756037"},{"key":"ref42","doi-asserted-by":"publisher","DOI":"10.1109\/ISCA52012.2021.00011"},{"key":"ref43","first-page":"1106","article-title":"HighLight: Efficient and flexible DNN acceleration with hierarchical structured sparsity","volume-title":"Proc. IEEE Int. Symp. Microarchit.","author":"Wu","year":"2023"}],"container-title":["IEEE Transactions on Computers"],"original-title":[],"link":[{"URL":"http:\/\/xplorestaging.ieee.org\/ielx8\/12\/11392777\/11313790.pdf?arnumber=11313790","content-type":"unspecified","content-version":"vor","intended-application":"similarity-checking"}],"deposited":{"date-parts":[[2026,2,12]],"date-time":"2026-02-12T20:58:59Z","timestamp":1770929939000},"score":1,"resource":{"primary":{"URL":"https:\/\/ieeexplore.ieee.org\/document\/11313790\/"}},"subtitle":[],"short-title":[],"issued":{"date-parts":[[2026,3]]},"references-count":43,"journal-issue":{"issue":"3"},"URL":"https:\/\/doi.org\/10.1109\/tc.2025.3648055","relation":{},"ISSN":["0018-9340","1557-9956","2326-3814"],"issn-type":[{"value":"0018-9340","type":"print"},{"value":"1557-9956","type":"electronic"},{"value":"2326-3814","type":"electronic"}],"subject":[],"published":{"date-parts":[[2026,3]]}}}