{"status":"ok","message-type":"work","message-version":"1.0.0","message":{"indexed":{"date-parts":[[2026,2,20]],"date-time":"2026-02-20T18:52:55Z","timestamp":1771613575815,"version":"3.50.1"},"reference-count":42,"publisher":"IEEE","license":[{"start":{"date-parts":[[2024,5,27]],"date-time":"2024-05-27T00:00:00Z","timestamp":1716768000000},"content-version":"stm-asf","delay-in-days":0,"URL":"https:\/\/doi.org\/10.15223\/policy-029"},{"start":{"date-parts":[[2024,5,27]],"date-time":"2024-05-27T00:00:00Z","timestamp":1716768000000},"content-version":"stm-asf","delay-in-days":0,"URL":"https:\/\/doi.org\/10.15223\/policy-037"}],"content-domain":{"domain":[],"crossmark-restriction":false},"short-container-title":[],"published-print":{"date-parts":[[2024,5,27]]},"DOI":"10.1109\/icbc59979.2024.10634448","type":"proceedings-article","created":{"date-parts":[[2024,8,21]],"date-time":"2024-08-21T22:53:39Z","timestamp":1724280819000},"page":"1-7","source":"Crossref","is-referenced-by-count":2,"title":["Trusted LLM Inference on the Edge with Smart Contracts"],"prefix":"10.1109","author":[{"given":"Rabimba","family":"Karanjai","sequence":"first","affiliation":[{"name":"University Of Houston,Department Of Computer Science"}]},{"given":"Weidong","family":"Shi","sequence":"additional","affiliation":[{"name":"University Of Houston,Department Of Computer Science"}]}],"member":"263","reference":[{"key":"ref1","first-page":"1877","article-title":"Language models are few-shot learners","volume":"33","author":"Brown","year":"2020","journal-title":"Advances in neural information processing systems"},{"key":"ref2","article-title":"Palm 2 technical report","volume-title":"arXiv preprint arXiv:2305.10403","author":"Anil","year":"2023"},{"key":"ref3","article-title":"Exploring the benefits of training expert language models over instruction tuning","author":"Jang","year":"2023"},{"key":"ref4","doi-asserted-by":"publisher","DOI":"10.1145\/3511861.3511863"},{"key":"ref5","article-title":"Uniswap trading volume exploded by 450 % to 7 billion. here\u2019s why","author":"Benson","year":"2021"},{"key":"ref6","doi-asserted-by":"publisher","DOI":"10.1145\/3505253.3505259"},{"key":"ref7","doi-asserted-by":"publisher","DOI":"10.1109\/ICBC56567.2023.10174906"},{"key":"ref8","doi-asserted-by":"publisher","DOI":"10.1109\/ICBC56567.2023.10174945"},{"key":"ref9","doi-asserted-by":"publisher","DOI":"10.1145\/3464298.3493401"},{"key":"ref10","doi-asserted-by":"publisher","DOI":"10.1109\/ICBC51069.2021.9461133"},{"key":"ref11","article-title":"Cosmos whitepaper","volume":"27","author":"Kwon","year":"2019","journal-title":"A Netw. Distrib. Ledgers"},{"key":"ref12","doi-asserted-by":"crossref","DOI":"10.2139\/ssrn.3647625","article-title":"Ai in finance: A review","author":"Cao","year":"2020"},{"key":"ref13","doi-asserted-by":"crossref","DOI":"10.2139\/ssrn.4511540","article-title":"Large language models and generative ai in finance: An analysis of chatgpt, bard, and bing ai","author":"Krause","year":"2023"},{"key":"ref14","doi-asserted-by":"publisher","DOI":"10.48550\/ARXIV.1706.03762"},{"key":"ref15","first-page":"443","article-title":"Serving DNNs like clockwork: Performance predictability from the bottom up","volume-title":"14th USENIX Symposium on Operating Systems Design and Implementation (OSDI 20)","author":"Gujarati"},{"key":"ref16","article-title":"Tensorflowserving: Flexible, high-performance ml serving","author":"Olston","year":"2017","journal-title":"arXiv preprint arXiv:1712.06139"},{"key":"ref17","article-title":"The triton inference server","year":"2024"},{"key":"ref18","doi-asserted-by":"publisher","DOI":"10.18653\/v1\/N19-4009"},{"key":"ref19","article-title":"Huggingface\u2019s transformers: State-of-the-art natural language processing","author":"Wolf","year":"2019","journal-title":"arXiv preprint arXiv:1910.03771"},{"key":"ref20","article-title":"Faster transformer decoding: N-gram masked self-attention","author":"Chelba","year":"2020","journal-title":"arXiv preprint arXiv:2001.04589"},{"key":"ref21","first-page":"521538","article-title":"Orca: A distributed serving system for Transformer-Based generative models","volume-title":"16th USENIX Symposium on Operating Systems Design and Implementation (OSDI 22)","author":"Yu"},{"key":"ref22","article-title":"Bitcoin: A peer-to-peer electronic cash system","author":"Nakamoto","year":"2008","journal-title":"Decentralized business review"},{"key":"ref23","doi-asserted-by":"publisher","DOI":"10.1109\/tnsm.2024.3357824"},{"key":"ref24","doi-asserted-by":"publisher","DOI":"10.1109\/SPW.2015.27"},{"key":"ref25","doi-asserted-by":"publisher","DOI":"10.1109\/COMST.2022.3204702"},{"key":"ref26","doi-asserted-by":"publisher","DOI":"10.23919\/FRUCT54823.2022.9770931"},{"key":"ref27","article-title":"Embedded development boards for edge-ai: A comprehensive report","volume-title":"arXiv preprint arXiv:2009.00803","author":"Imran","year":"2020"},{"key":"ref28","doi-asserted-by":"publisher","DOI":"10.3390\/s20092533"},{"key":"ref29","volume-title":"Cosmwasm: Basic cosmos-sdk app with web assembly smart contracts","year":"2024"},{"key":"ref30","volume-title":"Ethermint","year":"2024"},{"key":"ref31","volume-title":"Wasmedge","year":"2024"},{"key":"ref32","article-title":"Standardizing wasi: A system interface to run webassembly outside the web","author":"Clark","year":"2019","journal-title":"Mozilla Hacks-the Web developer blog"},{"key":"ref33","article-title":"Vm matters: a comparison of wasm vms and evms in the performance of blockchain smart contracts","author":"Zheng","year":"2020","journal-title":"arXiv preprint arXiv:2012.01032"},{"key":"ref34","volume-title":"cw-contracts","year":"2024"},{"key":"ref35","article-title":"Gemini a family of highly capable multimodal models","author":"Team","year":"2023","journal-title":"arXiv preprint arXiv:2312.11805"},{"key":"ref36","article-title":"lightweight, standalone c++ inference engine for google\u2019s gemma models","year":"2024"},{"key":"ref37","doi-asserted-by":"publisher","DOI":"10.1145\/3532720.3535625"},{"key":"ref38","volume-title":"wgpu: Cross-platform, safe, pure-rust graphics api","year":"2024"},{"key":"ref39","volume-title":"llama2.c: Inference llama 2 in one file of pure c","year":"2024"},{"key":"ref40","volume-title":"llama.cpp: Port of facebook\u2019s llama model in c\/c++","year":"2024"},{"key":"ref41","volume-title":"Wasmedge-wasinn","year":"2024"},{"key":"ref42","article-title":"Visual instruction tuning","author":"Liu","year":"2023","journal-title":"NeurIPS"}],"event":{"name":"2024 IEEE International Conference on Blockchain and Cryptocurrency (ICBC)","location":"Dublin, Ireland","start":{"date-parts":[[2024,5,27]]},"end":{"date-parts":[[2024,5,31]]}},"container-title":["2024 IEEE International Conference on Blockchain and Cryptocurrency (ICBC)"],"original-title":[],"link":[{"URL":"http:\/\/xplorestaging.ieee.org\/ielx8\/10634319\/10634334\/10634448.pdf?arnumber=10634448","content-type":"unspecified","content-version":"vor","intended-application":"similarity-checking"}],"deposited":{"date-parts":[[2024,9,3]],"date-time":"2024-09-03T04:59:06Z","timestamp":1725339546000},"score":1,"resource":{"primary":{"URL":"https:\/\/ieeexplore.ieee.org\/document\/10634448\/"}},"subtitle":[],"short-title":[],"issued":{"date-parts":[[2024,5,27]]},"references-count":42,"URL":"https:\/\/doi.org\/10.1109\/icbc59979.2024.10634448","relation":{},"subject":[],"published":{"date-parts":[[2024,5,27]]}}}