{"status":"ok","message-type":"work","message-version":"1.0.0","message":{"indexed":{"date-parts":[[2026,3,30]],"date-time":"2026-03-30T21:03:20Z","timestamp":1774904600806,"version":"3.50.1"},"reference-count":33,"publisher":"Institute of Electrical and Electronics Engineers (IEEE)","issue":"4","license":[{"start":{"date-parts":[[2026,4,1]],"date-time":"2026-04-01T00:00:00Z","timestamp":1775001600000},"content-version":"vor","delay-in-days":0,"URL":"https:\/\/ieeexplore.ieee.org\/Xplorehelp\/downloads\/license-information\/IEEE.html"},{"start":{"date-parts":[[2026,4,1]],"date-time":"2026-04-01T00:00:00Z","timestamp":1775001600000},"content-version":"stm-asf","delay-in-days":0,"URL":"https:\/\/doi.org\/10.15223\/policy-029"},{"start":{"date-parts":[[2026,4,1]],"date-time":"2026-04-01T00:00:00Z","timestamp":1775001600000},"content-version":"stm-asf","delay-in-days":0,"URL":"https:\/\/doi.org\/10.15223\/policy-037"}],"funder":[{"name":"Institute for Information and communications Technology Promotion (IITP) grant funded by the Korea government","award":["RS-2025-02264029"],"award-info":[{"award-number":["RS-2025-02264029"]}]},{"name":"Integration and Validation of an AI Semiconductor-Based Data Center Training and Inference System"}],"content-domain":{"domain":[],"crossmark-restriction":false},"short-container-title":["IEEE J. Solid-State Circuits"],"published-print":{"date-parts":[[2026,4]]},"DOI":"10.1109\/jssc.2026.3663603","type":"journal-article","created":{"date-parts":[[2026,3,6]],"date-time":"2026-03-06T21:01:02Z","timestamp":1772830862000},"page":"1513-1525","source":"Crossref","is-referenced-by-count":0,"title":["Adelia: A 4-nm LLM Processing Unit With Streamlined Dataflow and Dual-Mode Parallelism for Maximizing Hardware Efficiency"],"prefix":"10.1109","volume":"61","author":[{"ORCID":"https:\/\/orcid.org\/0000-0001-5743-4852","authenticated-orcid":false,"given":"Sukbin","family":"Lim","sequence":"first","affiliation":[{"name":"HyperAccel, Seoul, South Korea"}],"role":[{"role":"author","vocabulary":"crossref"}]},{"ORCID":"https:\/\/orcid.org\/0000-0003-4702-6489","authenticated-orcid":false,"given":"Jung-Hoon","family":"Kim","sequence":"additional","affiliation":[{"name":"KAIST, Daejeon, South Korea"}],"role":[{"role":"author","vocabulary":"crossref"}]},{"ORCID":"https:\/\/orcid.org\/0009-0002-5924-7000","authenticated-orcid":false,"given":"Seungjae","family":"Moon","sequence":"additional","affiliation":[{"name":"HyperAccel, Seoul, South Korea"}],"role":[{"role":"author","vocabulary":"crossref"}]},{"given":"Junseo","family":"Cha","sequence":"additional","affiliation":[{"name":"HyperAccel, Seoul, South Korea"}],"role":[{"role":"author","vocabulary":"crossref"}]},{"given":"Dongjin","family":"Seo","sequence":"additional","affiliation":[{"name":"HyperAccel, Seoul, South Korea"}],"role":[{"role":"author","vocabulary":"crossref"}]},{"given":"Jongho","family":"Kim","sequence":"additional","affiliation":[{"name":"HyperAccel, Seoul, South Korea"}],"role":[{"role":"author","vocabulary":"crossref"}]},{"given":"Hunjong","family":"Lee","sequence":"additional","affiliation":[{"name":"HyperAccel, Seoul, South Korea"}],"role":[{"role":"author","vocabulary":"crossref"}]},{"given":"Jinwon","family":"Lee","sequence":"additional","affiliation":[{"name":"HyperAccel, Seoul, South Korea"}],"role":[{"role":"author","vocabulary":"crossref"}]},{"given":"Joo-Young","family":"Kim","sequence":"additional","affiliation":[{"name":"HyperAccel, Seoul, South Korea"}],"role":[{"role":"author","vocabulary":"crossref"}]}],"member":"263","reference":[{"key":"ref1","doi-asserted-by":"publisher","DOI":"10.48550\/ARXIV.1706.03762"},{"key":"ref2","doi-asserted-by":"publisher","DOI":"10.48550\/arXiv.1810.04805"},{"key":"ref3","article-title":"GPT-4 technical report","volume-title":"arXiv:2303.08774","author":"Achiam","year":"2023"},{"key":"ref4","article-title":"Qwen technical report","volume-title":"arXiv:2309.16609","author":"Bai","year":"2023"},{"key":"ref5","doi-asserted-by":"publisher","DOI":"10.48550\/arXiv.2010.11929"},{"key":"ref6","article-title":"Latte: Latent diffusion transformer for video generation","author":"Ma","year":"2024","journal-title":"arXiv:2401.03048"},{"key":"ref7","doi-asserted-by":"publisher","DOI":"10.15607\/rss.2025.xxi.010"},{"key":"ref8","article-title":"Scaling laws for neural language models","author":"Kaplan","year":"2020","journal-title":"arXiv:2001.08361"},{"key":"ref9","article-title":"Scaling LLM test-time compute optimally can be more effective than scaling model parameters","author":"Snell","year":"2024","journal-title":"arXiv:2408.03314"},{"key":"ref10","doi-asserted-by":"publisher","DOI":"10.52202\/068431-1800"},{"key":"ref11","article-title":"DeepSeek-R1: Incentivizing reasoning capability in LLMs via reinforcement learning","author":"DeepSeek-AI","year":"2025","journal-title":"arXiv:2501.12948"},{"key":"ref12","article-title":"Self-consistency improves chain of thought reasoning in language models","author":"Wang","year":"2022","journal-title":"arXiv:2203.11171"},{"key":"ref13","doi-asserted-by":"publisher","DOI":"10.1109\/MICRO56248.2022.00051"},{"key":"ref14","doi-asserted-by":"publisher","DOI":"10.1145\/3600006.3613165"},{"key":"ref15","doi-asserted-by":"publisher","DOI":"10.23919\/VLSITechnologyandCir65189.2025.11075108"},{"key":"ref16","doi-asserted-by":"publisher","DOI":"10.52202\/068431-1189"},{"key":"ref17","doi-asserted-by":"publisher","DOI":"10.1109\/DAC18074.2021.9586134"},{"key":"ref18","doi-asserted-by":"publisher","DOI":"10.1109\/MM.2024.3420728"},{"key":"ref19","doi-asserted-by":"publisher","DOI":"10.1109\/ISCA59077.2024.00077"},{"key":"ref20","doi-asserted-by":"publisher","DOI":"10.1109\/HPCA61900.2025.00111"},{"key":"ref21","doi-asserted-by":"publisher","DOI":"10.1145\/3695053.3731019"},{"key":"ref22","doi-asserted-by":"publisher","DOI":"10.1109\/VLSITechnologyandCir46783.2024.10631397"},{"key":"ref23","doi-asserted-by":"publisher","DOI":"10.1109\/ISCA59077.2024.00019"},{"key":"ref24","doi-asserted-by":"publisher","DOI":"10.1145\/3695053.3731051"},{"key":"ref25","first-page":"117","article-title":"Taming throughput-latency tradeoff in LLM inference with Sarathi-serve","volume-title":"Proc. 18th USENIX Symp. Operating Syst. Design Implement. (OSDI)","author":"Agrawal"},{"key":"ref26","doi-asserted-by":"publisher","DOI":"10.1145\/3642970.3655835"},{"key":"ref27","article-title":"Optimizing LLM inference throughput via memory-aware and SLA-constrained dynamic batching","author":"Pang","year":"2025","journal-title":"arXiv:2503.05248"},{"key":"ref28","first-page":"521","article-title":"Orca: A distributed serving system for transformer-based generative models","volume-title":"Proc. 16th USENIX Symp. Operating Syst. Design Implement. (OSDI)","author":"Yu"},{"key":"ref29","doi-asserted-by":"publisher","DOI":"10.18653\/v1\/P16-1144"},{"key":"ref30","doi-asserted-by":"publisher","DOI":"10.1109\/VLSITechnologyandCir46769.2022.9830277"},{"key":"ref31","first-page":"342","article-title":"22.9 a 12 nm 18.1TFLOPs\/W sparse transformer processor with entropy-based early exit, mixed-precision predication and fine-grained power management","volume-title":"IEEE Int. Solid-State Circuits Conf. (ISSCC) Dig. Tech. Papers","author":"Tambe"},{"key":"ref32","doi-asserted-by":"publisher","DOI":"10.23919\/vlsitechnologyandcir57934.2023.10185403"},{"key":"ref33","doi-asserted-by":"publisher","DOI":"10.1109\/ISSCC49657.2024.10454330"}],"container-title":["IEEE Journal of Solid-State Circuits"],"original-title":[],"link":[{"URL":"http:\/\/xplorestaging.ieee.org\/ielx8\/4\/11457062\/11423855.pdf?arnumber=11423855","content-type":"unspecified","content-version":"vor","intended-application":"similarity-checking"}],"deposited":{"date-parts":[[2026,3,30]],"date-time":"2026-03-30T20:06:57Z","timestamp":1774901217000},"score":1,"resource":{"primary":{"URL":"https:\/\/ieeexplore.ieee.org\/document\/11423855\/"}},"subtitle":[],"short-title":[],"issued":{"date-parts":[[2026,4]]},"references-count":33,"journal-issue":{"issue":"4"},"URL":"https:\/\/doi.org\/10.1109\/jssc.2026.3663603","relation":{},"ISSN":["0018-9200","1558-173X"],"issn-type":[{"value":"0018-9200","type":"print"},{"value":"1558-173X","type":"electronic"}],"subject":[],"published":{"date-parts":[[2026,4]]}}}