{"status":"ok","message-type":"work","message-version":"1.0.0","message":{"indexed":{"date-parts":[[2026,2,24]],"date-time":"2026-02-24T16:14:45Z","timestamp":1771949685777,"version":"3.50.1"},"reference-count":46,"publisher":"IEEE","license":[{"start":{"date-parts":[[2024,1,22]],"date-time":"2024-01-22T00:00:00Z","timestamp":1705881600000},"content-version":"stm-asf","delay-in-days":0,"URL":"https:\/\/doi.org\/10.15223\/policy-029"},{"start":{"date-parts":[[2024,1,22]],"date-time":"2024-01-22T00:00:00Z","timestamp":1705881600000},"content-version":"stm-asf","delay-in-days":0,"URL":"https:\/\/doi.org\/10.15223\/policy-037"}],"funder":[{"DOI":"10.13039\/100000028","name":"Semiconductor Research Corporation","doi-asserted-by":"publisher","id":[{"id":"10.13039\/100000028","id-type":"DOI","asserted-by":"publisher"}]}],"content-domain":{"domain":[],"crossmark-restriction":false},"short-container-title":[],"published-print":{"date-parts":[[2024,1,22]]},"DOI":"10.1109\/asp-dac58780.2024.10473893","type":"proceedings-article","created":{"date-parts":[[2024,3,25]],"date-time":"2024-03-25T19:06:53Z","timestamp":1711393613000},"page":"435-441","source":"Crossref","is-referenced-by-count":15,"title":["Invited Paper: Software\/Hardware Co-design for LLM and Its Application for Design Verification"],"prefix":"10.1109","author":[{"given":"Lily Jiaxin","family":"Wan","sequence":"first","affiliation":[{"name":"University of Illinois Urbana-Champaign"}]},{"given":"Yingbing","family":"Huang","sequence":"additional","affiliation":[{"name":"University of Illinois Urbana-Champaign"}]},{"given":"Yuhong","family":"Li","sequence":"additional","affiliation":[{"name":"University of Illinois Urbana-Champaign"}]},{"given":"Hanchen","family":"Ye","sequence":"additional","affiliation":[{"name":"University of Illinois Urbana-Champaign"}]},{"given":"Jinghua","family":"Wang","sequence":"additional","affiliation":[{"name":"University of Illinois Urbana-Champaign"}]},{"given":"Xiaofan","family":"Zhang","sequence":"additional","affiliation":[{"name":"Google"}]},{"given":"Deming","family":"Chen","sequence":"additional","affiliation":[{"name":"University of Illinois Urbana-Champaign"}]}],"member":"263","reference":[{"key":"ref1","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR.2018.00120"},{"key":"ref2","doi-asserted-by":"publisher","DOI":"10.1613\/jair.4992"},{"key":"ref3","article-title":"Attention is all you need","author":"Vaswani","year":"2017","journal-title":"Advances in neural information processing systems"},{"key":"ref4","article-title":"Training language models to follow instructions with human feedback","author":"Ouyang","year":"2022","journal-title":"Advances in Neural Information Processing Systems"},{"key":"ref5","article-title":"Llama 2: Open foundation and fine-tuned chat models","author":"Touvron","year":"2023","journal-title":"arXiv preprint arXiv:2307.09288"},{"key":"ref6","volume-title":"An important next step on our AI journey","author":"Pichai","year":"2023"},{"key":"ref7","doi-asserted-by":"publisher","DOI":"10.1109\/MLCAD58807.2023.10299874"},{"key":"ref8","article-title":"RTLLM: An Open-Source Benchmark for Design RTL Generation with Large Language Model","author":"Lu","year":"2023","journal-title":"arXiv preprint arXiv:2308.05345"},{"key":"ref9","doi-asserted-by":"publisher","DOI":"10.23919\/DATE56975.2023.10137086"},{"key":"ref10","article-title":"Codegen: An open large language model for code with multi-turn program synthesis","author":"Nijkamp","year":"2022","journal-title":"arXiv preprint arXiv:2203.13474"},{"key":"ref11","article-title":"VerilogEval: Evaluating Large Language Models for Verilog Code Generation","author":"Liu","year":"2023","journal-title":"arXiv preprint arXiv:2309.07544"},{"key":"ref12","doi-asserted-by":"publisher","DOI":"10.1109\/MLCAD58807.2023.10299852"},{"key":"ref13","doi-asserted-by":"publisher","DOI":"10.1145\/3240765.3240801"},{"key":"ref14","doi-asserted-by":"publisher","DOI":"10.1109\/DAC18072.2020.9218684"},{"key":"ref15","doi-asserted-by":"publisher","DOI":"10.1145\/3400302.3415609"},{"key":"ref16","doi-asserted-by":"publisher","DOI":"10.1145\/3194554.3194597"},{"key":"ref17","doi-asserted-by":"publisher","DOI":"10.1145\/3431920.3439290"},{"key":"ref18","doi-asserted-by":"publisher","DOI":"10.1109\/SAAHPC.2011.22"},{"key":"ref19","article-title":"Llm. int8 (): 8-bit matrix multiplication for transformers at scale","author":"Dettmers","year":"2022","journal-title":"arXiv preprint arXiv:2208.07339"},{"key":"ref20","article-title":"Smoothquant: Accurate and efficient post-training quantization for large language models","volume-title":"Proc. of ICML","author":"Xiao"},{"key":"ref21","volume-title":"SparseGPT: Massive Language Models Can Be Accurately Pruned in One-Shot","author":"Frantar","year":"2023"},{"key":"ref22","article-title":"LLM-Pruner: On the Structural Pruning of Large Language Models","author":"Ma","year":"2023","journal-title":"arXiv preprint arXiv:2305.11627"},{"key":"ref23","article-title":"Deja Vu: Contextual Sparsity for Efficient LLMs at Inference Time","volume-title":"Proc. of ICML","author":"Liu"},{"key":"ref24","article-title":"The case for 4-bit precision: k-bit inference scaling laws","volume-title":"Proc. of ICML","author":"Dettmers"},{"key":"ref25","volume-title":"OPT: Open Pre-trained Transformer Language Models","author":"Zhang","year":"2022"},{"key":"ref26","article-title":"Flashattention-2: Faster attention with better parallelism and work partitioning","author":"Dao","year":"2023","journal-title":"arXiv preprint arXiv:2307.08691"},{"key":"ref27","doi-asserted-by":"publisher","DOI":"10.1201\/9781420007954"},{"key":"ref28","volume-title":"Functional verification coverage measurement and analysis","author":"Piziali","year":"2007"},{"key":"ref29","volume-title":"Part 8: The 2020 wilson research group functional verification study","author":"Foster","year":"2021"},{"key":"ref30","doi-asserted-by":"publisher","DOI":"10.1109\/6.591665"},{"key":"ref31","volume-title":"AMD Ryzen 9 3900X and Ryzen 7 3700X Review","author":"Alcorn","year":"2019"},{"key":"ref32","volume-title":"AMD Ryzen 7 5800H Specifications","year":"2021"},{"key":"ref33","article-title":"Workshops on Extreme Scale Design Automation (ESDA) challenges and opportunities for 2025 and beyond","volume-title":"arXiv preprint arXiv:2005.01588","author":"Bahar"},{"key":"ref34","volume-title":"GPT-4 Technical Report","year":"2023"},{"key":"ref35","doi-asserted-by":"publisher","DOI":"10.1145\/3020078.3021744"},{"key":"ref36","doi-asserted-by":"publisher","DOI":"10.1109\/FPL60245.2023.00037"},{"key":"ref37","doi-asserted-by":"publisher","DOI":"10.1145\/2847263.2847274"},{"key":"ref38","article-title":"hls4ml: An open-source codesign workflow to empower scientific low-power machine learning devices","author":"Fahim","year":"2021","journal-title":"arXiv preprint arXiv:2103.05579"},{"key":"ref39","doi-asserted-by":"publisher","DOI":"10.1109\/IISWC.2014.6983050"},{"key":"ref40","volume-title":"HLS based Open-Source IPs for Deep Neural Network Acceleration","author":"Liu","year":"2019"},{"key":"ref41","doi-asserted-by":"publisher","DOI":"10.1007\/978-3-030-11404-6_3"},{"key":"ref42","doi-asserted-by":"publisher","DOI":"10.1145\/3174243.3174255"},{"key":"ref43","volume-title":"Vitis-HLS-Introductory-Examples","year":"2023"},{"key":"ref44","volume-title":"Vitis libraries","year":"2019"},{"key":"ref45","volume-title":"Tacle Bench","year":"2017"},{"key":"ref46","volume-title":"Robust and reliable hardware accelerator design through high-level synthesis","author":"Campbell","year":"2017"}],"event":{"name":"2024 29th Asia and South Pacific Design Automation Conference (ASP-DAC)","location":"Incheon, Korea, Republic of","start":{"date-parts":[[2024,1,22]]},"end":{"date-parts":[[2024,1,25]]}},"container-title":["2024 29th Asia and South Pacific Design Automation Conference (ASP-DAC)"],"original-title":[],"link":[{"URL":"http:\/\/xplorestaging.ieee.org\/ielx7\/10473777\/10473787\/10473893.pdf?arnumber=10473893","content-type":"unspecified","content-version":"vor","intended-application":"similarity-checking"}],"deposited":{"date-parts":[[2024,3,26]],"date-time":"2024-03-26T21:33:58Z","timestamp":1711488838000},"score":1,"resource":{"primary":{"URL":"https:\/\/ieeexplore.ieee.org\/document\/10473893\/"}},"subtitle":[],"short-title":[],"issued":{"date-parts":[[2024,1,22]]},"references-count":46,"URL":"https:\/\/doi.org\/10.1109\/asp-dac58780.2024.10473893","relation":{},"subject":[],"published":{"date-parts":[[2024,1,22]]}}}