{"status":"ok","message-type":"work","message-version":"1.0.0","message":{"indexed":{"date-parts":[[2025,3,12]],"date-time":"2025-03-12T04:18:35Z","timestamp":1741753115317,"version":"3.38.0"},"reference-count":25,"publisher":"IEEE","license":[{"start":{"date-parts":[[2024,11,3]],"date-time":"2024-11-03T00:00:00Z","timestamp":1730592000000},"content-version":"stm-asf","delay-in-days":0,"URL":"https:\/\/doi.org\/10.15223\/policy-029"},{"start":{"date-parts":[[2024,11,3]],"date-time":"2024-11-03T00:00:00Z","timestamp":1730592000000},"content-version":"stm-asf","delay-in-days":0,"URL":"https:\/\/doi.org\/10.15223\/policy-037"}],"funder":[{"DOI":"10.13039\/501100001809","name":"National Natural Science Foundation of China","doi-asserted-by":"publisher","id":[{"id":"10.13039\/501100001809","id-type":"DOI","asserted-by":"publisher"}]}],"content-domain":{"domain":[],"crossmark-restriction":false},"short-container-title":[],"published-print":{"date-parts":[[2024,11,3]]},"DOI":"10.1109\/iecon55916.2024.10905965","type":"proceedings-article","created":{"date-parts":[[2025,3,10]],"date-time":"2025-03-10T17:32:07Z","timestamp":1741627927000},"page":"1-7","source":"Crossref","is-referenced-by-count":0,"title":["A 77.79 GOPs\/W Retentive Network FPGA Inference Accelerator with Optimized Workload"],"prefix":"10.1109","author":[{"given":"Cheng","family":"Nian","sequence":"first","affiliation":[{"name":"Research Institute of Tsinghua University in Shenzhen,Greater Bay Area National Center of Technology Innovation,China"}],"role":[{"role":"author","vocabulary":"crossref"}]},{"given":"Weiyi","family":"Zhang","sequence":"additional","affiliation":[{"name":"Tsinghua University,School of Integrated Circuits,China"}],"role":[{"role":"author","vocabulary":"crossref"}]},{"given":"Fasih Ud","family":"Din Farrukh","sequence":"additional","affiliation":[{"name":"Tsinghua University,School of Integrated Circuits,China"}],"role":[{"role":"author","vocabulary":"crossref"}]},{"given":"Liting","family":"Niu","sequence":"additional","affiliation":[{"name":"Tsinghua University,School of Integrated Circuits,China"}],"role":[{"role":"author","vocabulary":"crossref"}]},{"given":"Dapeng","family":"Jiang","sequence":"additional","affiliation":[{"name":"Tsinghua University,Xingjian College,China"}],"role":[{"role":"author","vocabulary":"crossref"}]},{"given":"Fei","family":"Chen","sequence":"additional","affiliation":[{"name":"Research Institute of Tsinghua University in Shenzhen,Greater Bay Area National Center of Technology Innovation,China"}],"role":[{"role":"author","vocabulary":"crossref"}]},{"given":"Chun","family":"Zhang","sequence":"additional","affiliation":[{"name":"Research Institute of Tsinghua University in Shenzhen,Greater Bay Area National Center of Technology Innovation,China"}],"role":[{"role":"author","vocabulary":"crossref"}]}],"member":"263","reference":[{"key":"ref1","doi-asserted-by":"publisher","DOI":"10.4324\/9781410605337-29"},{"key":"ref2","article-title":"Sequence to sequence learning with neural networks","volume-title":"Advances in neural information processing systems","volume":"27","author":"Sutskever"},{"key":"ref3","doi-asserted-by":"publisher","DOI":"10.1109\/MSP.2012.2205597"},{"key":"ref4","doi-asserted-by":"publisher","DOI":"10.1126\/science.aar6404"},{"key":"ref5","doi-asserted-by":"publisher","DOI":"10.48550\/ARXIV.1706.03762"},{"key":"ref6","first-page":"16344","article-title":"Flashattention: Fast and memory-efficient exact attention with io-awareness","volume-title":"Advances in Neural Information Processing Systems","volume":"35","author":"Dao"},{"article-title":"Retentive network: A successor to transformer for large language models","year":"2023","author":"Sun","key":"ref7"},{"article-title":"Vir: Vision retention networks","year":"2023","author":"Hatamizadeh","key":"ref8"},{"key":"ref9","doi-asserted-by":"publisher","DOI":"10.1109\/JSSC.2016.2616357"},{"key":"ref10","doi-asserted-by":"publisher","DOI":"10.1109\/JSSC.2019.2960488"},{"key":"ref11","doi-asserted-by":"publisher","DOI":"10.1109\/JSSC.2022.3205713"},{"key":"ref12","doi-asserted-by":"publisher","DOI":"10.1109\/ISSCC42614.2022.9731686"},{"key":"ref13","doi-asserted-by":"publisher","DOI":"10.1109\/JSSC.2023.3234893"},{"key":"ref14","doi-asserted-by":"publisher","DOI":"10.1109\/TCSII.2022.3196055"},{"key":"ref15","doi-asserted-by":"publisher","DOI":"10.1109\/ISCAS48785.2022.9937659"},{"key":"ref16","doi-asserted-by":"publisher","DOI":"10.1109\/SOCC49529.2020.9524802"},{"issue":"1","key":"ref17","first-page":"5","article-title":"Swish: a self-gated activation function","volume":"7","author":"Ramachandran","year":"2017"},{"article-title":"Bert: Pre-training of deep bidirectional transformers for language understanding","year":"2018","author":"Devlin","key":"ref18"},{"key":"ref19","doi-asserted-by":"publisher","DOI":"10.18653\/v1\/N18-2074"},{"key":"ref20","doi-asserted-by":"publisher","DOI":"10.1016\/j.neucom.2023.127063"},{"article-title":"Llama: Open and efficient foundation language models","year":"2023","author":"Touvron","key":"ref21"},{"key":"ref22","doi-asserted-by":"publisher","DOI":"10.18653\/v1\/2022.acl-long.26"},{"key":"ref23","doi-asserted-by":"publisher","DOI":"10.18653\/v1\/2023.acl-long.816"},{"key":"ref24","doi-asserted-by":"publisher","DOI":"10.3115\/1073083.1073135"},{"key":"ref25","doi-asserted-by":"publisher","DOI":"10.18653\/v1\/W16-3210"}],"event":{"name":"IECON 2024 - 50th Annual Conference of the IEEE Industrial Electronics Society","start":{"date-parts":[[2024,11,3]]},"location":"Chicago, IL, USA","end":{"date-parts":[[2024,11,6]]}},"container-title":["IECON 2024 - 50th Annual Conference of the IEEE Industrial Electronics Society"],"original-title":[],"link":[{"URL":"http:\/\/xplorestaging.ieee.org\/ielx8\/10904979\/10905066\/10905965.pdf?arnumber=10905965","content-type":"unspecified","content-version":"vor","intended-application":"similarity-checking"}],"deposited":{"date-parts":[[2025,3,11]],"date-time":"2025-03-11T05:22:24Z","timestamp":1741670544000},"score":1,"resource":{"primary":{"URL":"https:\/\/ieeexplore.ieee.org\/document\/10905965\/"}},"subtitle":[],"short-title":[],"issued":{"date-parts":[[2024,11,3]]},"references-count":25,"URL":"https:\/\/doi.org\/10.1109\/iecon55916.2024.10905965","relation":{},"subject":[],"published":{"date-parts":[[2024,11,3]]}}}