{"status":"ok","message-type":"work","message-version":"1.0.0","message":{"indexed":{"date-parts":[[2025,10,1]],"date-time":"2025-10-01T15:38:13Z","timestamp":1759333093459,"version":"3.28.0"},"reference-count":15,"publisher":"IEEE","license":[{"start":{"date-parts":[[2024,4,22]],"date-time":"2024-04-22T00:00:00Z","timestamp":1713744000000},"content-version":"stm-asf","delay-in-days":0,"URL":"https:\/\/doi.org\/10.15223\/policy-029"},{"start":{"date-parts":[[2024,4,22]],"date-time":"2024-04-22T00:00:00Z","timestamp":1713744000000},"content-version":"stm-asf","delay-in-days":0,"URL":"https:\/\/doi.org\/10.15223\/policy-037"}],"funder":[{"DOI":"10.13039\/100006180","name":"Technology Development","doi-asserted-by":"publisher","id":[{"id":"10.13039\/100006180","id-type":"DOI","asserted-by":"publisher"}]}],"content-domain":{"domain":[],"crossmark-restriction":false},"short-container-title":[],"published-print":{"date-parts":[[2024,4,22]]},"DOI":"10.1109\/aicas59952.2024.10595857","type":"proceedings-article","created":{"date-parts":[[2024,7,19]],"date-time":"2024-07-19T17:30:48Z","timestamp":1721410248000},"page":"307-311","source":"Crossref","is-referenced-by-count":2,"title":["A Low-Latency and Scalable Vector Engine with Operation Fusion for Transformers"],"prefix":"10.1109","author":[{"given":"Mincheol","family":"Cha","sequence":"first","affiliation":[{"name":"Seoul National University,Inter-University Semiconductor Research Center (ISRC),Department of Electrical and Computer Engineering,Seoul,Korea"}],"role":[{"role":"author","vocabulary":"crossref"}]},{"given":"Keehyuk","family":"Lee","sequence":"additional","affiliation":[{"name":"Seoul National University,Inter-University Semiconductor Research Center (ISRC),Department of Electrical and Computer Engineering,Seoul,Korea"}],"role":[{"role":"author","vocabulary":"crossref"}]},{"given":"Xuan Truong","family":"Nguyen","sequence":"additional","affiliation":[{"name":"Seoul National University,Inter-University Semiconductor Research Center (ISRC),Department of Electrical and Computer Engineering,Seoul,Korea"}],"role":[{"role":"author","vocabulary":"crossref"}]},{"given":"Hyuk-Jae","family":"Lee","sequence":"additional","affiliation":[{"name":"Seoul National University,Inter-University Semiconductor Research Center (ISRC),Department of Electrical and Computer Engineering,Seoul,Korea"}],"role":[{"role":"author","vocabulary":"crossref"}]}],"member":"263","reference":[{"article-title":"Efficient kernel fusion techniques for massive video data analysis on gpgpus","year":"2015","author":"Adnan","key":"ref1"},{"article-title":"Layer normalization","year":"2016","author":"Ba","key":"ref2"},{"key":"ref3","first-page":"16344","article-title":"Flashattention: Fast and memory-efficient exact attention with io-awareness","volume":"35","author":"Dao","year":"2022","journal-title":"Advances in Neural Information Processing Systems"},{"article-title":"An image is worth 16x16 words: Transformers for image recognition at scale","year":"2020","author":"Dosovitskiy","key":"ref4"},{"key":"ref5","doi-asserted-by":"publisher","DOI":"10.1109\/MICRO56248.2022.00051"},{"key":"ref6","doi-asserted-by":"publisher","DOI":"10.1145\/3564606"},{"key":"ref7","doi-asserted-by":"publisher","DOI":"10.1109\/ICCE-Asia59966.2023.10326397"},{"key":"ref8","doi-asserted-by":"publisher","DOI":"10.1145\/3505244"},{"key":"ref9","doi-asserted-by":"publisher","DOI":"10.1145\/3370748.3406567"},{"key":"ref10","doi-asserted-by":"publisher","DOI":"10.1109\/ICESS.2019.8782524"},{"issue":"8","key":"ref11","first-page":"9","article-title":"Language models are unsupervised multitask learners","volume":"1","author":"Radford","year":"2019","journal-title":"OpenAI blog"},{"key":"ref12","doi-asserted-by":"publisher","DOI":"10.24963\/ijcai.2023\/149"},{"key":"ref13","doi-asserted-by":"publisher","DOI":"10.48550\/ARXIV.1706.03762"},{"key":"ref14","doi-asserted-by":"publisher","DOI":"10.1109\/GreenCom-CPSCom.2010.102"},{"key":"ref15","article-title":"Understanding and improving layer normalization","volume":"32","author":"Xu","year":"2019","journal-title":"Advances in Neural Information Processing Systems"}],"event":{"name":"2024 IEEE 6th International Conference on AI Circuits and Systems (AICAS)","start":{"date-parts":[[2024,4,22]]},"location":"Abu Dhabi, United Arab Emirates","end":{"date-parts":[[2024,4,25]]}},"container-title":["2024 IEEE 6th International Conference on AI Circuits and Systems (AICAS)"],"original-title":[],"link":[{"URL":"http:\/\/xplorestaging.ieee.org\/ielx8\/10595550\/10595552\/10595857.pdf?arnumber=10595857","content-type":"unspecified","content-version":"vor","intended-application":"similarity-checking"}],"deposited":{"date-parts":[[2024,7,20]],"date-time":"2024-07-20T05:04:53Z","timestamp":1721451893000},"score":1,"resource":{"primary":{"URL":"https:\/\/ieeexplore.ieee.org\/document\/10595857\/"}},"subtitle":[],"short-title":[],"issued":{"date-parts":[[2024,4,22]]},"references-count":15,"URL":"https:\/\/doi.org\/10.1109\/aicas59952.2024.10595857","relation":{},"subject":[],"published":{"date-parts":[[2024,4,22]]}}}