{"status":"ok","message-type":"work","message-version":"1.0.0","message":{"indexed":{"date-parts":[[2026,5,4]],"date-time":"2026-05-04T09:48:33Z","timestamp":1777888113156,"version":"3.51.4"},"reference-count":11,"publisher":"Institute of Electrical and Electronics Engineers (IEEE)","issue":"1","license":[{"start":{"date-parts":[[2026,1,1]],"date-time":"2026-01-01T00:00:00Z","timestamp":1767225600000},"content-version":"vor","delay-in-days":0,"URL":"https:\/\/ieeexplore.ieee.org\/Xplorehelp\/downloads\/license-information\/IEEE.html"},{"start":{"date-parts":[[2026,1,1]],"date-time":"2026-01-01T00:00:00Z","timestamp":1767225600000},"content-version":"stm-asf","delay-in-days":0,"URL":"https:\/\/doi.org\/10.15223\/policy-029"},{"start":{"date-parts":[[2026,1,1]],"date-time":"2026-01-01T00:00:00Z","timestamp":1767225600000},"content-version":"stm-asf","delay-in-days":0,"URL":"https:\/\/doi.org\/10.15223\/policy-037"}],"funder":[{"name":"Institute of Information &#x0026; Communications Technology Planning"},{"name":"Ministry of Science and ICT, Korea","award":["IITP-2026-RS-2021-II211817 40"],"award-info":[{"award-number":["IITP-2026-RS-2021-II211817 40"]}]},{"name":"Ministry of Science and ICT, Korea","award":["RS-2023-00216370"],"award-info":[{"award-number":["RS-2023-00216370"]}]},{"DOI":"10.13039\/501100003725","name":"National Research Foundation of Korea","doi-asserted-by":"publisher","award":["NRF RS-2024-00347114"],"award-info":[{"award-number":["NRF RS-2024-00347114"]}],"id":[{"id":"10.13039\/501100003725","id-type":"DOI","asserted-by":"publisher"}]},{"name":"Samsung Advanced Institute of Technology and Samsung Electronics Company","award":["MEM240728_0001"],"award-info":[{"award-number":["MEM240728_0001"]}]}],"content-domain":{"domain":[],"crossmark-restriction":false},"short-container-title":["IEEE Comput. Arch. Lett."],"published-print":{"date-parts":[[2026,1]]},"DOI":"10.1109\/lca.2026.3684216","type":"journal-article","created":{"date-parts":[[2026,4,16]],"date-time":"2026-04-16T19:51:58Z","timestamp":1776369118000},"page":"158-161","source":"Crossref","is-referenced-by-count":0,"title":["An Operand Divergence-Aware All-Bank PIM Architecture for Sparse Attention"],"prefix":"10.1109","volume":"25","author":[{"ORCID":"https:\/\/orcid.org\/0009-0005-0886-6794","authenticated-orcid":false,"given":"Soojin","family":"Hwang","sequence":"first","affiliation":[{"name":"ETRI, Daejeon, South Korea"}],"role":[{"role":"author","vocabulary":"crossref"}]},{"given":"Sanghyeon","family":"Lee","sequence":"additional","affiliation":[{"name":"KAIST, Daejeon, South Korea"}],"role":[{"role":"author","vocabulary":"crossref"}]},{"ORCID":"https:\/\/orcid.org\/0009-0004-1267-2813","authenticated-orcid":false,"given":"Juhyun","family":"Lee","sequence":"additional","affiliation":[{"name":"KAIST, Daejeon, South Korea"}],"role":[{"role":"author","vocabulary":"crossref"}]},{"ORCID":"https:\/\/orcid.org\/0000-0002-1742-047X","authenticated-orcid":false,"given":"Jaehyuk","family":"Huh","sequence":"additional","affiliation":[{"name":"KAIST, Daejeon, South Korea"}],"role":[{"role":"author","vocabulary":"crossref"}]}],"member":"263","reference":[{"key":"ref1","doi-asserted-by":"publisher","DOI":"10.1109\/ISCA52012.2021.00013"},{"key":"ref2","doi-asserted-by":"publisher","DOI":"10.1109\/HCS55958.2022.9895629"},{"key":"ref3","doi-asserted-by":"publisher","DOI":"10.1109\/ISCA59077.2024.00034"},{"key":"ref4","first-page":"47901","article-title":"Quest: Query-aware sparsity for efficient long-context LLM inference","volume-title":"Proc. 41st Int. Conf. Mach. Learn.","author":"Tang"},{"key":"ref5","doi-asserted-by":"publisher","DOI":"10.1145\/3603113"},{"key":"ref6","doi-asserted-by":"publisher","DOI":"10.1145\/3620666.3651380"},{"key":"ref7","doi-asserted-by":"publisher","DOI":"10.1145\/3695053.3731008"},{"key":"ref8","doi-asserted-by":"publisher","DOI":"10.1145\/3676641.3716267"},{"key":"ref9","doi-asserted-by":"publisher","DOI":"10.1109\/LCA.2020.2973991"},{"key":"ref10","article-title":"Cloud TPU","year":"2018"},{"key":"ref11","article-title":"Introducing LLAMA 3.1","volume-title":"Meta AI Blog","year":"2024"}],"container-title":["IEEE Computer Architecture Letters"],"original-title":[],"link":[{"URL":"http:\/\/xplorestaging.ieee.org\/ielx8\/10208\/11321093\/11481778.pdf?arnumber=11481778","content-type":"unspecified","content-version":"vor","intended-application":"similarity-checking"}],"deposited":{"date-parts":[[2026,5,1]],"date-time":"2026-05-01T04:35:48Z","timestamp":1777610148000},"score":1,"resource":{"primary":{"URL":"https:\/\/ieeexplore.ieee.org\/document\/11481778\/"}},"subtitle":[],"short-title":[],"issued":{"date-parts":[[2026,1]]},"references-count":11,"journal-issue":{"issue":"1"},"URL":"https:\/\/doi.org\/10.1109\/lca.2026.3684216","relation":{},"ISSN":["1556-6056","1556-6064","2473-2575"],"issn-type":[{"value":"1556-6056","type":"print"},{"value":"1556-6064","type":"electronic"},{"value":"2473-2575","type":"electronic"}],"subject":[],"published":{"date-parts":[[2026,1]]}}}