{"status":"ok","message-type":"work","message-version":"1.0.0","message":{"indexed":{"date-parts":[[2025,9,17]],"date-time":"2025-09-17T06:12:26Z","timestamp":1758089546731,"version":"3.44.0"},"reference-count":43,"publisher":"IEEE","license":[{"start":{"date-parts":[[2025,6,22]],"date-time":"2025-06-22T00:00:00Z","timestamp":1750550400000},"content-version":"stm-asf","delay-in-days":0,"URL":"https:\/\/doi.org\/10.15223\/policy-029"},{"start":{"date-parts":[[2025,6,22]],"date-time":"2025-06-22T00:00:00Z","timestamp":1750550400000},"content-version":"stm-asf","delay-in-days":0,"URL":"https:\/\/doi.org\/10.15223\/policy-037"}],"content-domain":{"domain":[],"crossmark-restriction":false},"short-container-title":[],"published-print":{"date-parts":[[2025,6,22]]},"DOI":"10.1109\/dac63849.2025.11132895","type":"proceedings-article","created":{"date-parts":[[2025,9,15]],"date-time":"2025-09-15T17:35:41Z","timestamp":1757957741000},"page":"1-7","source":"Crossref","is-referenced-by-count":0,"title":["MambaOPU: An FPGA Overlay Processor for State-space-duality-based Mamba Models"],"prefix":"10.1109","author":[{"given":"Shaoqiang","family":"Lu","sequence":"first","affiliation":[{"name":"Ningbo Institute of Digital Twin, Eastern Institute of Technology,Ningbo,China"}]},{"given":"Xuliang","family":"Yu","sequence":"additional","affiliation":[{"name":"Zhejiang University,Hangzhou,China"}]},{"given":"Tiandong","family":"Zhao","sequence":"additional","affiliation":[{"name":"University of California,Los Angeles,USA"}]},{"given":"Siyuan","family":"Miao","sequence":"additional","affiliation":[{"name":"University of California,Los Angeles,USA"}]},{"given":"Xinsong","family":"Sheng","sequence":"additional","affiliation":[{"name":"Zhejiang University,Hangzhou,China"}]},{"given":"Chen","family":"Wu","sequence":"additional","affiliation":[{"name":"Ningbo Institute of Digital Twin, Eastern Institute of Technology,Ningbo,China"}]},{"given":"Liang","family":"Zhao","sequence":"additional","affiliation":[{"name":"Zhejiang University,Hangzhou,China"}]},{"given":"Ting-Jung","family":"Lin","sequence":"additional","affiliation":[{"name":"Ningbo Institute of Digital Twin, Eastern Institute of Technology,Ningbo,China"}]},{"given":"Lei","family":"He","sequence":"additional","affiliation":[{"name":"Ningbo Institute of Digital Twin, Eastern Institute of Technology,Ningbo,China"}]}],"member":"263","reference":[{"key":"ref1","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR52729.2023.00037"},{"key":"ref2","article-title":"REFINE: A Fine-Grained medication recommendation system using deep learning and personalized drug interaction modeling","volume-title":"Advances in Neural Information Processing Systems (NeurIPS)","author":"Bhoi","year":"2023"},{"key":"ref3","article-title":"Attention is all you need","author":"Vaswani","year":"2017","journal-title":"Advances in Neural Information Processing Systems (NeurIPS)"},{"article-title":"An image is worth 16x16 words: Transformers for image recognition at scale","volume-title":"International Conference on Learning Representations (ICLR)","author":"Dosovitskiy","key":"ref4"},{"article-title":"Learning transferable visual models from natural language supervision","volume-title":"International Conference on Machine Learning (ICML)","author":"Radford","key":"ref5"},{"key":"ref6","article-title":"Mamba: Linear-time sequence modeling with selective state spaces","volume-title":"arXiv preprint arXiv:2312.00752","author":"Gu","year":"2024"},{"key":"ref7","doi-asserted-by":"publisher","DOI":"10.1109\/HPCA47549.2020.00035"},{"key":"ref8","doi-asserted-by":"publisher","DOI":"10.1109\/HPCA51647.2021.00018"},{"key":"ref9","doi-asserted-by":"publisher","DOI":"10.1145\/3466752.3480095"},{"key":"ref10","doi-asserted-by":"publisher","DOI":"10.1109\/HPCA56546.2023.10071047"},{"key":"ref11","doi-asserted-by":"crossref","DOI":"10.1145\/3676536.3676660","article-title":"AESHA: Accelerating eigen-decomposition-based sparse transformer with hybrid RRAM-SRAM architecture","volume-title":"International Conference on Computer Aided Design (ICCAD)","author":"Yu"},{"key":"ref12","doi-asserted-by":"crossref","DOI":"10.1145\/3676536.3676761","article-title":"ChatOPU: An FPGA-based overlay processor for large language models with unstructured sparsity","volume-title":"International Conference on Computer-Aided Design (ICCAD)","author":"Zhao"},{"key":"ref13","doi-asserted-by":"publisher","DOI":"10.1145\/3626202.3637562"},{"key":"ref14","doi-asserted-by":"publisher","DOI":"10.1109\/TVLSI.2020.2995741"},{"key":"ref15","doi-asserted-by":"publisher","DOI":"10.1109\/FPL57034.2022.00073"},{"key":"ref16","doi-asserted-by":"publisher","DOI":"10.1145\/3373087.3375311"},{"key":"ref17","doi-asserted-by":"publisher","DOI":"10.1145\/3503222.3507738"},{"key":"ref18","doi-asserted-by":"publisher","DOI":"10.1109\/HPCA56546.2023.10071081"},{"key":"ref19","doi-asserted-by":"publisher","DOI":"10.1109\/ISCA52012.2021.00060"},{"key":"ref20","doi-asserted-by":"publisher","DOI":"10.1145\/3579371.3589057"},{"key":"ref21","doi-asserted-by":"publisher","DOI":"10.1109\/FPL60245.2023.00015"},{"key":"ref22","doi-asserted-by":"publisher","DOI":"10.1109\/TCAD.2022.3197489"},{"key":"ref23","doi-asserted-by":"publisher","DOI":"10.1145\/3307650.3322214"},{"key":"ref24","doi-asserted-by":"publisher","DOI":"10.1109\/ICCAD51958.2021.9643487"},{"key":"ref25","doi-asserted-by":"publisher","DOI":"10.1109\/MICRO56248.2022.00051"},{"key":"ref26","doi-asserted-by":"publisher","DOI":"10.1109\/TVLSI.2019.2939726"},{"key":"ref27","doi-asserted-by":"publisher","DOI":"10.1145\/3474597"},{"key":"ref28","doi-asserted-by":"publisher","DOI":"10.1109\/FPL53798.2021.00014"},{"key":"ref29","article-title":"Combining recurrent, convolutional, and continuous-time models with linear state space layers","author":"Gu","year":"2021","journal-title":"Advances in neural information processing systems (NeurIPS)"},{"key":"ref30","doi-asserted-by":"publisher","DOI":"10.1145\/3676536.3676798"},{"article-title":"Transformers are SSMs: Generalized models and efficient algorithms through structured state space duality","volume-title":"International Conference on Machine Learning (ICML)","author":"Dao","key":"ref31"},{"key":"ref32","doi-asserted-by":"publisher","DOI":"10.1109\/MM.2021.3061394"},{"key":"ref33","doi-asserted-by":"publisher","DOI":"10.1145\/3079856.3080246"},{"key":"ref34","article-title":"Structured state space models for in-context reinforcement learning","author":"Lu","year":"2023","journal-title":"Advances in Neural Information Processing Systems (NeurIPS)"},{"article-title":"Efficiently modeling long sequences with structured state spaces","volume-title":"International Conference on Learning Representations (ICLR)","author":"Gu","key":"ref35"},{"article-title":"Effectively modeling time series with simple discrete state spaces","volume-title":"International Conference on Learning Representations (ICLR)","author":"Michael","key":"ref36"},{"key":"ref37","doi-asserted-by":"publisher","DOI":"10.1145\/3431920.3439477"},{"key":"ref38","article-title":"Root mean square layer normalization","author":"Zhang","year":"2019","journal-title":"Advances in Neural Information Processing Systems (NeurIPS)"},{"key":"ref39","doi-asserted-by":"publisher","DOI":"10.1109\/ISEDA62518.2024.10617729"},{"key":"ref40","article-title":"Quamba: A post-training quantization recipe for selective state space models","author":"Chiang","year":"2024","journal-title":"arXiv preprint arXiv:2410.13229"},{"key":"ref41","article-title":"Mamba statespace models can be strong downstream learners","author":"Halloran","year":"2024","journal-title":"arXiv preprint arXiv:2406.00209"},{"year":"2022","key":"ref42","article-title":"Vitis unified software platform documentation: Application acceleration development (ug1393)"},{"year":"2020","key":"ref43","article-title":"Nvidia ampere architecture whitepaper"}],"event":{"name":"2025 62nd ACM\/IEEE Design Automation Conference (DAC)","start":{"date-parts":[[2025,6,22]]},"location":"San Francisco, CA, USA","end":{"date-parts":[[2025,6,25]]}},"container-title":["2025 62nd ACM\/IEEE Design Automation Conference (DAC)"],"original-title":[],"link":[{"URL":"http:\/\/xplorestaging.ieee.org\/ielx8\/11132383\/11132091\/11132895.pdf?arnumber=11132895","content-type":"unspecified","content-version":"vor","intended-application":"similarity-checking"}],"deposited":{"date-parts":[[2025,9,16]],"date-time":"2025-09-16T05:24:44Z","timestamp":1758000284000},"score":1,"resource":{"primary":{"URL":"https:\/\/ieeexplore.ieee.org\/document\/11132895\/"}},"subtitle":[],"short-title":[],"issued":{"date-parts":[[2025,6,22]]},"references-count":43,"URL":"https:\/\/doi.org\/10.1109\/dac63849.2025.11132895","relation":{},"subject":[],"published":{"date-parts":[[2025,6,22]]}}}