{"status":"ok","message-type":"work","message-version":"1.0.0","message":{"indexed":{"date-parts":[[2026,3,25]],"date-time":"2026-03-25T20:51:50Z","timestamp":1774471910013,"version":"3.50.1"},"reference-count":11,"publisher":"IEEE","license":[{"start":{"date-parts":[[2025,10,12]],"date-time":"2025-10-12T00:00:00Z","timestamp":1760227200000},"content-version":"stm-asf","delay-in-days":0,"URL":"https:\/\/doi.org\/10.15223\/policy-029"},{"start":{"date-parts":[[2025,10,12]],"date-time":"2025-10-12T00:00:00Z","timestamp":1760227200000},"content-version":"stm-asf","delay-in-days":0,"URL":"https:\/\/doi.org\/10.15223\/policy-037"}],"content-domain":{"domain":[],"crossmark-restriction":false},"short-container-title":[],"published-print":{"date-parts":[[2025,10,12]]},"DOI":"10.1109\/cvmi66673.2025.11337918","type":"proceedings-article","created":{"date-parts":[[2026,1,19]],"date-time":"2026-01-19T20:52:59Z","timestamp":1768855979000},"page":"1-5","source":"Crossref","is-referenced-by-count":0,"title":["Bringing Llama-3 to the Edge: End-to-End Quantized Conversational AI on Raspberry Pi 5"],"prefix":"10.1109","author":[{"given":"Saarang","family":"Arora","sequence":"first","affiliation":[{"name":"AiGENTHix Technologies Pvt. Ltd.,R&#x0026;D Department,Bengaluru,India"}],"role":[{"role":"author","vocabulary":"crossref"}]},{"given":"Kishor Kumar","family":"Kachari","sequence":"additional","affiliation":[{"name":"AiGENTHix Technologies Pvt. Ltd.,R&#x0026;D Department,Bengaluru,India"}],"role":[{"role":"author","vocabulary":"crossref"}]},{"given":"Suyash","family":"Gupta","sequence":"additional","affiliation":[{"name":"AiGENTHix Technologies Pvt. Ltd.,R&#x0026;D Department,Bengaluru,India"}],"role":[{"role":"author","vocabulary":"crossref"}]},{"given":"Parth","family":"Saarthi","sequence":"additional","affiliation":[{"name":"AiGENTHix Technologies Pvt. Ltd.,R&#x0026;D Department,Bengaluru,India"}],"role":[{"role":"author","vocabulary":"crossref"}]},{"given":"Arpit Kumar","family":"Yadav","sequence":"additional","affiliation":[{"name":"AiGENTHix Technologies Pvt. Ltd.,R&#x0026;D Department,Bengaluru,India"}],"role":[{"role":"author","vocabulary":"crossref"}]},{"given":"Salur Srikant","family":"Patnaik","sequence":"additional","affiliation":[{"name":"AiGENTHix Technologies Pvt. Ltd.,R&#x0026;D Department,Bengaluru,India"}],"role":[{"role":"author","vocabulary":"crossref"}]}],"member":"263","reference":[{"key":"ref1","doi-asserted-by":"publisher","DOI":"10.1007\/978-3-031-54827-7_13"},{"key":"ref2","doi-asserted-by":"publisher","DOI":"10.1016\/j.hcc.2024.100211"},{"key":"ref3","doi-asserted-by":"publisher","DOI":"10.1007\/978-3-031-76631-2_3"},{"key":"ref4","first-page":"9459","article-title":"Retrieval-augmented generation for knowledge-intensive nlp tasks","volume":"33","author":"Lewis","year":"2020","journal-title":"Advances in neural information processing systems"},{"key":"ref5","article-title":"Parameter-efficient fine-tuning for large models: A comprehensive survey","author":"Han","year":"2024","journal-title":"arXiv preprint"},{"issue":"2","key":"ref6","first-page":"3","article-title":"Lora: Low-rank adaptation of large language models","volume":"1","author":"Hu","year":"2022","journal-title":"ICLR"},{"key":"ref7","first-page":"30318","article-title":"Gpt3. int8 (): 8-bit matrix multiplication for transformers at scale","volume":"35","author":"Dettmers","year":"2022","journal-title":"Advances in neural information processing systems"},{"key":"ref8","article-title":"Bertscore: Evaluating text generation with bert","author":"Zhang","year":"2019","journal-title":"arXiv preprint"},{"key":"ref9","first-page":"65","article-title":"Meteor: An automatic metric for mt evaluation with improved correlation with human judgments","volume-title":"Proceedings of the acl workshop on intrinsic and extrinsic evaluation measures for machine translation and\/or summarization","author":"Banerjee","year":"2005"},{"key":"ref10","first-page":"28492","article-title":"Robust speech recognition via large-scale weak supervision","volume-title":"International conference on machine learning","author":"Radford","year":"2023"},{"key":"ref11","article-title":"Llama: Open and efficient foundation language models","author":"Touvron","year":"2023","journal-title":"arXiv preprint"}],"event":{"name":"2025 IEEE International Conference on Computer Vision and Machine Intelligence (CVMI)","location":"Rourkela, India","start":{"date-parts":[[2025,10,12]]},"end":{"date-parts":[[2025,10,13]]}},"container-title":["2025 IEEE International Conference on Computer Vision and Machine Intelligence (CVMI)"],"original-title":[],"link":[{"URL":"http:\/\/xplorestaging.ieee.org\/ielx8\/11335417\/11337242\/11337918.pdf?arnumber=11337918","content-type":"unspecified","content-version":"vor","intended-application":"similarity-checking"}],"deposited":{"date-parts":[[2026,3,25]],"date-time":"2026-03-25T19:52:11Z","timestamp":1774468331000},"score":1,"resource":{"primary":{"URL":"https:\/\/ieeexplore.ieee.org\/document\/11337918\/"}},"subtitle":[],"short-title":[],"issued":{"date-parts":[[2025,10,12]]},"references-count":11,"URL":"https:\/\/doi.org\/10.1109\/cvmi66673.2025.11337918","relation":{},"subject":[],"published":{"date-parts":[[2025,10,12]]}}}