{"status":"ok","message-type":"work","message-version":"1.0.0","message":{"indexed":{"date-parts":[[2025,12,19]],"date-time":"2025-12-19T15:49:23Z","timestamp":1766159363458,"version":"3.28.0"},"reference-count":62,"publisher":"IEEE","license":[{"start":{"date-parts":[[2024,3,2]],"date-time":"2024-03-02T00:00:00Z","timestamp":1709337600000},"content-version":"stm-asf","delay-in-days":0,"URL":"https:\/\/doi.org\/10.15223\/policy-029"},{"start":{"date-parts":[[2024,3,2]],"date-time":"2024-03-02T00:00:00Z","timestamp":1709337600000},"content-version":"stm-asf","delay-in-days":0,"URL":"https:\/\/doi.org\/10.15223\/policy-037"}],"funder":[{"DOI":"10.13039\/100011661","name":"Pacific Northwest National Laboratory","doi-asserted-by":"publisher","id":[{"id":"10.13039\/100011661","id-type":"DOI","asserted-by":"publisher"}]},{"DOI":"10.13039\/501100000266","name":"Engineering and Physical Sciences Research Council","doi-asserted-by":"publisher","award":["EP\/R513222\/1"],"award-info":[{"award-number":["EP\/R513222\/1"]}],"id":[{"id":"10.13039\/501100000266","id-type":"DOI","asserted-by":"publisher"}]}],"content-domain":{"domain":[],"crossmark-restriction":false},"short-container-title":[],"published-print":{"date-parts":[[2024,3,2]]},"DOI":"10.1109\/cgo57630.2024.10444801","type":"proceedings-article","created":{"date-parts":[[2024,2,28]],"date-time":"2024-02-28T18:47:35Z","timestamp":1709146055000},"page":"143-157","source":"Crossref","is-referenced-by-count":3,"title":["AXI4MLIR: User-Driven Automatic Host Code Generation for Custom AXI-Based Accelerators"],"prefix":"10.1109","author":[{"given":"Nicolas Bohm","family":"Agostini","sequence":"first","affiliation":[{"name":"Northeastern University,Boston,MA,USA"}]},{"given":"Jude","family":"Haris","sequence":"additional","affiliation":[{"name":"University of Glasgow,Glasgow,Scotland,UK"}]},{"given":"Perry","family":"Gibson","sequence":"additional","affiliation":[{"name":"University of Glasgow,Glasgow,Scotland,UK"}]},{"given":"Malith","family":"Jayaweera","sequence":"additional","affiliation":[{"name":"Northeastern University,Boston,MA,USA"}]},{"given":"Norm","family":"Rubin","sequence":"additional","affiliation":[{"name":"Northeastern University,Boston,MA,USA"}]},{"given":"Antonino","family":"Tumeo","sequence":"additional","affiliation":[{"name":"Pacific Northwest National Laboratory,Richland,WA,USA"}]},{"given":"Jos\u00e9 L.","family":"Abell\u00e1n","sequence":"additional","affiliation":[{"name":"University of Murcia,Murcia,Spain"}]},{"given":"Jos\u00e9","family":"Cano","sequence":"additional","affiliation":[{"name":"University of Glasgow,Glasgow,Scotland,UK"}]},{"given":"David","family":"Kaeli","sequence":"additional","affiliation":[{"name":"Northeastern University,Boston,MA,USA"}]}],"member":"263","reference":[{"key":"ref1","doi-asserted-by":"publisher","DOI":"10.1109\/isca.2018.00011"},{"key":"ref2","first-page":"247","article-title":"Hirac: A hierarchical accelerator with sorting-based packing for spgemms in dnn applications","volume-title":"IEEE International Symposium on High-Performance Computer Architecture, ser. HPCA23","author":"Shabani"},{"key":"ref3","doi-asserted-by":"publisher","DOI":"10.1109\/hpca56546.2023.10070992"},{"key":"ref4","doi-asserted-by":"publisher","DOI":"10.1145\/3470496.3527409"},{"key":"ref5","doi-asserted-by":"publisher","DOI":"10.1145\/3582016.3582068"},{"key":"ref6","doi-asserted-by":"publisher","DOI":"10.1145\/3470496.3527440"},{"key":"ref7","doi-asserted-by":"publisher","DOI":"10.1145\/3582016.3582069"},{"key":"ref8","doi-asserted-by":"publisher","DOI":"10.1038\/s44160-022-00231-0"},{"key":"ref9","doi-asserted-by":"publisher","DOI":"10.1145\/3194085.3194087"},{"key":"ref10","doi-asserted-by":"publisher","DOI":"10.1038\/s41586-021-03819-2"},{"key":"ref11","first-page":"1","article-title":"DNNExplorer: A Framework for Modeling and Exploring a Novel Paradigm of FPGA-based DNN Accelerator","volume-title":"Proceedings of the 39th International Conference on Computer-Aided Design, ser. ICCAD20","author":"Zhang"},{"key":"ref12","doi-asserted-by":"publisher","DOI":"10.1145\/3373087.3375306"},{"article-title":"Hybriddnn: A framework for high-performance hybrid dnn accelerator design and implementation","volume-title":"Proceedings of the 57th ACM\/EDAC\/IEEE Design Automation Conference, ser. DAC20","author":"Hanchen","key":"ref13"},{"key":"ref14","doi-asserted-by":"publisher","DOI":"10.1109\/mm.2020.2985963"},{"key":"ref15","article-title":"DLAS: An Exploration and Assessment of the Deep Learning Acceleration Stack","author":"Gibson","year":"2023","journal-title":"arXiv"},{"key":"ref16","doi-asserted-by":"publisher","DOI":"10.1109\/fccm.2018.00022"},{"key":"ref17","doi-asserted-by":"publisher","DOI":"10.1109\/jetcas.2019.2910232"},{"volume-title":"VTA:Deep learning accelerator stack","year":"2020","key":"ref18"},{"key":"ref19","doi-asserted-by":"publisher","DOI":"10.1088\/2632-2153\/aba042"},{"key":"ref20","doi-asserted-by":"publisher","DOI":"10.1109\/sbac-pad49847.2020.00013"},{"volume-title":"AMBA AXI andACE ProtocolSpecification","year":"2020","author":"Developers","key":"ref21"},{"key":"ref22","doi-asserted-by":"publisher","DOI":"10.1145\/3242900"},{"key":"ref23","doi-asserted-by":"publisher","DOI":"10.1109\/cgo51591.2021.9370308"},{"volume-title":"linalg\u2019 Dialect","year":"2020","author":"Developers","key":"ref24"},{"issue":"0","key":"ref25","first-page":"1","article-title":"Compiling ONNX Neural Network Models Using MLIR","volume":"0","author":"Le","year":"2020","journal-title":"ArXiv"},{"key":"ref26","first-page":"265","article-title":"TensorFlow: A System for Large-Scale Machine Learning","volume-title":"Proceedings of the 12th USENIX conference on Operating Systems Design and Implementation, ser. OSDI","author":"Abadi","year":"2016"},{"volume-title":"PyTorch: tensors and dynamic neural networks in Python with strong GPU acceleration","year":"2017","key":"ref27"},{"volume-title":"AXI Reference Guide","year":"2012","key":"ref28"},{"key":"ref29","doi-asserted-by":"publisher","DOI":"10.1145\/3579990.3580024"},{"key":"ref30","doi-asserted-by":"publisher","DOI":"10.1109\/mcse.2010.69"},{"key":"ref31","doi-asserted-by":"publisher","DOI":"10.1145\/3388333.3388649"},{"key":"ref32","doi-asserted-by":"publisher","DOI":"10.1016\/j.jpdc.2022.11.005"},{"issue":"0","key":"ref33","first-page":"1","article-title":"Tinybert: Distilling bert for natural language understanding","volume":"0","author":"Jiao","year":"2019","journal-title":"arXiv preprint"},{"key":"ref34","doi-asserted-by":"publisher","DOI":"10.1109\/micro.2014.58"},{"key":"ref35","doi-asserted-by":"publisher","DOI":"10.1145\/2684746.2689060"},{"key":"ref36","doi-asserted-by":"publisher","DOI":"10.1145\/3007787.3001138"},{"key":"ref37","doi-asserted-by":"publisher","DOI":"10.1109\/micro.2016.7783723"},{"volume-title":"Perf wiki","year":"2023","author":"Linux","key":"ref38"},{"volume-title":"Neon registers","year":"2023","key":"ref39"},{"key":"ref40","doi-asserted-by":"publisher","DOI":"10.1109\/cvpr.2017.683"},{"key":"ref41","doi-asserted-by":"publisher","DOI":"10.18653\/v1\/2020.emnlp-demos.6"},{"volume-title":"The Torch-MLIR Project","year":"2021","key":"ref42"},{"key":"ref43","doi-asserted-by":"publisher","DOI":"10.1109\/asap.2018.8445108"},{"key":"ref44","doi-asserted-by":"publisher","DOI":"10.1109\/mm.2022.3178580"},{"key":"ref45","doi-asserted-by":"publisher","DOI":"10.1145\/3508352.3549424"},{"key":"ref46","doi-asserted-by":"publisher","DOI":"10.1109\/ispass55109.2022.00042"},{"key":"ref47","doi-asserted-by":"publisher","DOI":"10.1145\/3490422.3502369"},{"key":"ref48","doi-asserted-by":"publisher","DOI":"10.1145\/3289602.3293910"},{"key":"ref49","doi-asserted-by":"publisher","DOI":"10.1145\/3373376.3378514"},{"key":"ref50","doi-asserted-by":"publisher","DOI":"10.1145\/3358198"},{"key":"ref51","doi-asserted-by":"publisher","DOI":"10.1145\/3240765.3240838"},{"key":"ref52","doi-asserted-by":"publisher","DOI":"10.1109\/isca52012.2021.00050"},{"key":"ref53","doi-asserted-by":"publisher","DOI":"10.1109\/cgo53902.2022.9741281"},{"key":"ref54","doi-asserted-by":"publisher","DOI":"10.1109\/micro50266.2020.00058"},{"key":"ref55","doi-asserted-by":"publisher","DOI":"10.1145\/3373376.3378508"},{"key":"ref56","article-title":"Learning to optimize tensor programs","volume-title":"Advances in Neural Information Processing Systems, ser. NeurIPS18","volume":"31","author":"Chen","year":"2018"},{"key":"ref57","first-page":"863","article-title":"Ansor: Generating High-Performance tensor programs for deep learning","volume-title":"14th USENIX symposium on operating systems design and implementation, ser. OSDI20","author":"Zheng","year":"2020"},{"key":"ref58","doi-asserted-by":"publisher","DOI":"10.1145\/3579990.3580025"},{"volume-title":"Transform Dialect: Fine-grain transformation control dialect","year":"2022","author":"Developers","key":"ref59"},{"volume-title":"judeharis\/axi_mlir: CGO 2024 Artifact v1.3.1","year":"2023","author":"Agostini","key":"ref60"},{"volume-title":"AXI4MLIR\/axi4mlir: CGO 2024 Artifact v1.3.2","year":"2024","author":"Agostini","key":"ref61"},{"volume-title":"AXI4MLIR\/axi4mlir","year":"2023","author":"Agostini","key":"ref62"}],"event":{"name":"2024 IEEE\/ACM International Symposium on Code Generation and Optimization (CGO)","start":{"date-parts":[[2024,3,2]]},"location":"Edinburgh, United Kingdom","end":{"date-parts":[[2024,3,6]]}},"container-title":["2024 IEEE\/ACM International Symposium on Code Generation and Optimization (CGO)"],"original-title":[],"link":[{"URL":"http:\/\/xplorestaging.ieee.org\/ielx7\/10444766\/10444770\/10444801.pdf?arnumber=10444801","content-type":"unspecified","content-version":"vor","intended-application":"similarity-checking"}],"deposited":{"date-parts":[[2024,3,1]],"date-time":"2024-03-01T05:46:28Z","timestamp":1709271988000},"score":1,"resource":{"primary":{"URL":"https:\/\/ieeexplore.ieee.org\/document\/10444801\/"}},"subtitle":[],"short-title":[],"issued":{"date-parts":[[2024,3,2]]},"references-count":62,"URL":"https:\/\/doi.org\/10.1109\/cgo57630.2024.10444801","relation":{},"subject":[],"published":{"date-parts":[[2024,3,2]]}}}