{"status":"ok","message-type":"work","message-version":"1.0.0","message":{"indexed":{"date-parts":[[2026,2,10]],"date-time":"2026-02-10T13:07:25Z","timestamp":1770728845583,"version":"3.49.0"},"publisher-location":"New York, NY, USA","reference-count":4,"publisher":"ACM","funder":[{"name":"Advanced Micro Devices &#x28;AMD&#x29;","award":["FA&#x5c;&#x2f;OTHER-24-0001"],"award-info":[{"award-number":["FA&#x5c;&#x2f;OTHER-24-0001"]}]}],"content-domain":{"domain":["dl.acm.org"],"crossmark-restriction":true},"short-container-title":[],"published-print":{"date-parts":[[2026,2,22]]},"DOI":"10.1145\/3748173.3779572","type":"proceedings-article","created":{"date-parts":[[2026,2,5]],"date-time":"2026-02-05T21:17:35Z","timestamp":1770326255000},"page":"179-179","update-policy":"https:\/\/doi.org\/10.1145\/crossmark-policy","source":"Crossref","is-referenced-by-count":0,"title":["FARE: A\n                    <u>F<\/u>\n                    ine-gr\n                    <u>a<\/u>\n                    ined Pipelined\n                    <u>Re<\/u>\n                    configurable FlashAttention Kernel"],"prefix":"10.1145","author":[{"ORCID":"https:\/\/orcid.org\/0009-0006-5016-112X","authenticated-orcid":false,"given":"Kaushikkumar S.","family":"Rathva","sequence":"first","affiliation":[{"name":"Indian Institute of Science (IISc), Bengaluru, Karnataka, India"}]},{"ORCID":"https:\/\/orcid.org\/0009-0005-6906-6993","authenticated-orcid":false,"given":"Aakarsh","family":"Alam","sequence":"additional","affiliation":[{"name":"Indian Institute of Technology (IIT), Kharagpur, Kharagpur, West Bengal, India"}]},{"ORCID":"https:\/\/orcid.org\/0009-0003-8171-5891","authenticated-orcid":false,"given":"Srini","family":"Srinivasan","sequence":"additional","affiliation":[{"name":"Advanced Micro Devices, Inc. (AMD), Santa Clara, California, USA"}]},{"ORCID":"https:\/\/orcid.org\/0000-0002-9294-1603","authenticated-orcid":false,"given":"Sumit K.","family":"Mandal","sequence":"additional","affiliation":[{"name":"Indian Institute of Science (IISc), Bengaluru, Karnataka, India"}]}],"member":"320","published-online":{"date-parts":[[2026,2,21]]},"reference":[{"key":"e_1_3_2_1_1_1","volume-title":"Flashattention: Fast and memory-efficient exact attention with io-awareness. Advances in neural information processing systems 35","author":"Dao Tri","year":"2022","unstructured":"Tri Dao, Dan Fu, Stefano Ermon, Atri Rudra, and Christopher R\u00e9. 2022. Flashattention: Fast and memory-efficient exact attention with io-awareness. Advances in neural information processing systems 35 (2022), 16344-16359."},{"key":"e_1_3_2_1_2_1","volume-title":"Sujitha Ravichandran, K Adarsh, H Bharath Bhat, Biresh Kumar Joardar, and Sumit K Mandal.","author":"Jaiswal Abhi","year":"2024","unstructured":"Abhi Jaiswal, KC Sharin Shahana, Sujitha Ravichandran, K Adarsh, H Bharath Bhat, Biresh Kumar Joardar, and Sumit K Mandal. 2024. HALO: Communicationaware Heterogeneous 2.5 D System for Energy-efficient LLM Execution at Edge. IEEE Journal on Emerging and Selected Topics in Circuits and Systems (2024)."},{"key":"e_1_3_2_1_3_1","volume-title":"Attention is all you need. Advances in neural information processing systems 30","author":"Vaswani Ashish","year":"2017","unstructured":"Ashish Vaswani, Noam Shazeer, Niki Parmar, Jakob Uszkoreit, Llion Jones, Aidan N Gomez, ?ukasz Kaiser, and Illia Polosukhin. 2017. Attention is all you need. Advances in neural information processing systems 30 (2017)."},{"key":"e_1_3_2_1_4_1","volume-title":"Efficient Implementation of Transformer Inference via a Tiled-Based Architecture on an FPGA. ([n.d.]). accessed","author":"Yang Ling-Chi","year":"2025","unstructured":"Ling-Chi Yang, Chi-Jui Chen, Trung Le, Bo-Cheng Lai, Scott Hauck, and Shih-Chieh Hsu. [n.d.]. Efficient Implementation of Transformer Inference via a Tiled-Based Architecture on an FPGA. ([n.d.]). accessed 19 August 2025."}],"event":{"name":"FPGA '26:The 2026 ACM\/SIGDA International Symposium on Field Programmable Gate Arrays","location":"Seaside CA USA","sponsor":["SIGDA ACM Special Interest Group on Design Automation"]},"container-title":["Proceedings of the 2026 ACM\/SIGDA International Symposium on Field Programmable Gate Arrays"],"original-title":[],"deposited":{"date-parts":[[2026,2,9]],"date-time":"2026-02-09T16:17:09Z","timestamp":1770653829000},"score":1,"resource":{"primary":{"URL":"https:\/\/dl.acm.org\/doi\/10.1145\/3748173.3779572"}},"subtitle":[],"short-title":[],"issued":{"date-parts":[[2026,2,21]]},"references-count":4,"alternative-id":["10.1145\/3748173.3779572","10.1145\/3748173"],"URL":"https:\/\/doi.org\/10.1145\/3748173.3779572","relation":{},"subject":[],"published":{"date-parts":[[2026,2,21]]},"assertion":[{"value":"2026-02-21","order":3,"name":"published","label":"Published","group":{"name":"publication_history","label":"Publication History"}}]}}