{"status":"ok","message-type":"work","message-version":"1.0.0","message":{"indexed":{"date-parts":[[2026,4,7]],"date-time":"2026-04-07T07:27:07Z","timestamp":1775546827158,"version":"3.50.1"},"publisher-location":"Cham","reference-count":13,"publisher":"Springer Nature Switzerland","isbn-type":[{"value":"9783031764516","type":"print"},{"value":"9783031764523","type":"electronic"}],"license":[{"start":{"date-parts":[[2024,11,12]],"date-time":"2024-11-12T00:00:00Z","timestamp":1731369600000},"content-version":"tdm","delay-in-days":0,"URL":"https:\/\/www.springernature.com\/gp\/researchers\/text-and-data-mining"},{"start":{"date-parts":[[2024,11,12]],"date-time":"2024-11-12T00:00:00Z","timestamp":1731369600000},"content-version":"vor","delay-in-days":0,"URL":"https:\/\/www.springernature.com\/gp\/researchers\/text-and-data-mining"}],"content-domain":{"domain":["link.springer.com"],"crossmark-restriction":false},"short-container-title":[],"published-print":{"date-parts":[[2025]]},"DOI":"10.1007\/978-3-031-76452-3_24","type":"book-chapter","created":{"date-parts":[[2024,11,11]],"date-time":"2024-11-11T16:46:48Z","timestamp":1731343608000},"page":"252-262","update-policy":"https:\/\/doi.org\/10.1007\/springer_crossmark_policy","source":"Crossref","is-referenced-by-count":1,"title":["Performance of\u00a0LLMs on\u00a0Computing Systems for\u00a0Deployment in\u00a0IoT Devices"],"prefix":"10.1007","author":[{"given":"Theodor-Radu","family":"Grumeza","sequence":"first","affiliation":[]},{"given":"Thomas-Andrei","family":"Laz\u00e3r","sequence":"additional","affiliation":[]},{"given":"Alexandra-Emilia","family":"Forti\u015f","sequence":"additional","affiliation":[]}],"member":"297","published-online":{"date-parts":[[2024,11,12]]},"reference":[{"key":"24_CR1","unstructured":"Zhao, W.X., et al: A survey of large language models, Peiyu Liu (2023)"},{"key":"24_CR2","unstructured":"Hoffmann, J., et al.: Training compute-optimal large language models. arXiv preprint arXiv:2203.15556 (2022)"},{"key":"24_CR3","unstructured":"Vailshery, L.S.: Number of internet of things (IoT) connections worldwide from 2022 to 2023, with forecasts from 2024 to 2033 (2024)"},{"key":"24_CR4","doi-asserted-by":"crossref","unstructured":"Barbella, M., Tortora, G.: Rouge metric evaluation for text summarization techniques. Available at SSRN 4120317 (2022)","DOI":"10.2139\/ssrn.4120317"},{"issue":"10","key":"24_CR5","doi-asserted-by":"publisher","first-page":"574","DOI":"10.3390\/info14100574","volume":"14","author":"J Son","year":"2023","unstructured":"Son, J., Kim, B.: Translation performance from the user\u2019s perspective of large language models and neural machine translation systems. Information 14(10), 574 (2023)","journal-title":"Information"},{"key":"24_CR6","unstructured":"Sheng, Y., et al.: Flexgen: high-throughput generative inference of large language models with a single GPU. In: International Conference on Machine Learning, pp. 31094\u201331116. PMLR (2023)"},{"key":"24_CR7","doi-asserted-by":"crossref","unstructured":"Dhar, N., Deng, B., Lo, D., Wu, X., Zhao, L., Suo, K.: An empirical analysis and resource footprint study of deploying large language models on edge devices. In: Proceedings of the 2024 ACM Southeast Conference, ACM SE 2024, pp. 69\u201376, New York, NY, USA, Association for Computing Machinery (2024)","DOI":"10.1145\/3603287.3651205"},{"key":"24_CR8","unstructured":"Sikorski, P.,et al.: Deployment of NLP and LLM techniques to control mobile robots at the edge: a case study using GPT-4-turbo and llama, February 2024"},{"key":"24_CR9","doi-asserted-by":"crossref","unstructured":"Lewis, M., et al.: Denoising sequence-to-sequence pre-training for natural language generation, translation, and comprehension, Bart (2019)","DOI":"10.18653\/v1\/2020.acl-main.703"},{"key":"24_CR10","unstructured":"Wang, A., Cho, K.: Bert has a mouth, and it must speak: bert as a markov random field language model. arXiv preprint arXiv:1902.04094 (2019)"},{"key":"24_CR11","doi-asserted-by":"crossref","unstructured":"Xiong, X., Zheng, M.: GPT-neo-CRV: Elevating information accuracy in GPT-neo with cross-referential validation. Authorea Preprints (2024)","DOI":"10.36227\/techrxiv.170473976.61241065\/v1"},{"key":"24_CR12","unstructured":"Devlin, J., Chang, M.-W., Lee, K., Toutanova, K.: BERT: pre-training of deep bidirectional transformers for language understanding. CoRR, abs\/1810.04805 (2018)"},{"key":"24_CR13","unstructured":"Bisht, T.: iamtarun python code instructions 18k alpaca (2023)"}],"container-title":["Lecture Notes on Data Engineering and Communications Technologies","Advances on Broad-Band Wireless Computing, Communication and Applications"],"original-title":[],"language":"en","link":[{"URL":"https:\/\/link.springer.com\/content\/pdf\/10.1007\/978-3-031-76452-3_24","content-type":"unspecified","content-version":"vor","intended-application":"similarity-checking"}],"deposited":{"date-parts":[[2024,11,11]],"date-time":"2024-11-11T17:05:51Z","timestamp":1731344751000},"score":1,"resource":{"primary":{"URL":"https:\/\/link.springer.com\/10.1007\/978-3-031-76452-3_24"}},"subtitle":[],"short-title":[],"issued":{"date-parts":[[2024,11,12]]},"ISBN":["9783031764516","9783031764523"],"references-count":13,"URL":"https:\/\/doi.org\/10.1007\/978-3-031-76452-3_24","relation":{},"ISSN":["2367-4512","2367-4520"],"issn-type":[{"value":"2367-4512","type":"print"},{"value":"2367-4520","type":"electronic"}],"subject":[],"published":{"date-parts":[[2024,11,12]]},"assertion":[{"value":"12 November 2024","order":1,"name":"first_online","label":"First Online","group":{"name":"ChapterHistory","label":"Chapter History"}},{"value":"BWCCA","order":1,"name":"conference_acronym","label":"Conference Acronym","group":{"name":"ConferenceInfo","label":"Conference Information"}},{"value":"International Conference on Broadband and Wireless Computing, Communication and Applications","order":2,"name":"conference_name","label":"Conference Name","group":{"name":"ConferenceInfo","label":"Conference Information"}},{"value":"San Benedetto del Tronto","order":3,"name":"conference_city","label":"Conference City","group":{"name":"ConferenceInfo","label":"Conference Information"}},{"value":"Italy","order":4,"name":"conference_country","label":"Conference Country","group":{"name":"ConferenceInfo","label":"Conference Information"}},{"value":"2024","order":5,"name":"conference_year","label":"Conference Year","group":{"name":"ConferenceInfo","label":"Conference Information"}},{"value":"13 November 2024","order":7,"name":"conference_start_date","label":"Conference Start Date","group":{"name":"ConferenceInfo","label":"Conference Information"}},{"value":"15 November 2024","order":8,"name":"conference_end_date","label":"Conference End Date","group":{"name":"ConferenceInfo","label":"Conference Information"}},{"value":"19","order":9,"name":"conference_number","label":"Conference Number","group":{"name":"ConferenceInfo","label":"Conference Information"}},{"value":"bwcca2024","order":10,"name":"conference_id","label":"Conference ID","group":{"name":"ConferenceInfo","label":"Conference Information"}},{"value":"http:\/\/voyager.ce.fit.ac.jp\/conf\/bwcca\/2024\/","order":11,"name":"conference_url","label":"Conference URL","group":{"name":"ConferenceInfo","label":"Conference Information"}}]}}