{"status":"ok","message-type":"work","message-version":"1.0.0","message":{"indexed":{"date-parts":[[2025,7,2]],"date-time":"2025-07-02T04:06:58Z","timestamp":1751429218085,"version":"3.41.0"},"reference-count":20,"publisher":"IEEE","license":[{"start":{"date-parts":[[2025,5,13]],"date-time":"2025-05-13T00:00:00Z","timestamp":1747094400000},"content-version":"stm-asf","delay-in-days":0,"URL":"https:\/\/doi.org\/10.15223\/policy-029"},{"start":{"date-parts":[[2025,5,13]],"date-time":"2025-05-13T00:00:00Z","timestamp":1747094400000},"content-version":"stm-asf","delay-in-days":0,"URL":"https:\/\/doi.org\/10.15223\/policy-037"}],"content-domain":{"domain":[],"crossmark-restriction":false},"short-container-title":[],"published-print":{"date-parts":[[2025,5,13]]},"DOI":"10.1109\/icmcis64378.2025.11048102","type":"proceedings-article","created":{"date-parts":[[2025,6,30]],"date-time":"2025-06-30T17:36:43Z","timestamp":1751305003000},"page":"1-10","source":"Crossref","is-referenced-by-count":0,"title":["Exploring Shared Large Language Models: Early Insights into Scalability and Efficiency in AI Assistant and Agent Deployment"],"prefix":"10.1109","author":[{"given":"Arvid","family":"Kok","sequence":"first","affiliation":[{"name":"NATO Communications and Information Agency,Data Science &#x0026; AI, CTO,The Hague,The Netherlands"}]},{"given":"Antonio","family":"Carvalho","sequence":"additional","affiliation":[{"name":"NATO Communications and Information Agency,Data Science &#x0026; AI, CTO,The Hague,The Netherlands"}]},{"given":"Michael","family":"Street","sequence":"additional","affiliation":[{"name":"NATO Communications and Information Agency,Data Science &#x0026; AI, CTO,The Hague,The Netherlands"}]}],"member":"263","reference":[{"journal-title":"Emerging architectures for LLM applications","year":"2023","author":"Horowitz","key":"ref1"},{"key":"ref2","article-title":"MonsterAPI Blog","author":"Bhasin","year":"2024","journal-title":"Top Open-Source LLMs for 2024 & Their Use-Cases"},{"volume-title":"Alienware Aurora gaming desktop","key":"ref3"},{"journal-title":"MARLIN: Mixed-Precision Auto-Regressive Parallel Inference on Large Language Models","year":"2024","author":"Frantar","key":"ref4"},{"journal-title":"LLM inference sizing and performance guidance. VMware","year":"2024","author":"Fu","key":"ref5"},{"journal-title":"Text Generation Inference (TGI)","year":"2024","key":"ref6"},{"journal-title":"Open API standard for open-source LLMs. Hugging Face Forums","year":"2023","key":"ref7"},{"volume-title":"Hugging Face model hub","year":"2024","key":"ref8"},{"volume-title":"Efficient Training of Large Language Models on Distributed Infrastructures: A Survey","year":"2024","author":"Jiangfei","key":"ref9"},{"journal-title":"A guide to LLM inference and performance. Baseten","year":"2024","author":"Kiely","key":"ref10"},{"journal-title":"A Scalable Communication Protocol for Networks of Large Language Models","year":"2024","author":"Lee","key":"ref11"},{"journal-title":"Llama: Open-source AI Models","key":"ref12"},{"journal-title":"Mistralai AI models","year":"2024","key":"ref13"},{"journal-title":"AI Solutions: The Most Advanced AI, Ready for Enterprise","key":"ref14"},{"journal-title":"NVIDIA Deep Learning Performance","key":"ref15"},{"journal-title":"Hyena Hierarchy: Towards Larger Convolutional Language Models","year":"2023","author":"Poli","key":"ref16"},{"journal-title":"Project Jupyter: JupyterLab","key":"ref17"},{"journal-title":"Achieving Peak Performance for Large Language Models: A Systematic Review","year":"2024","author":"Rzgar","key":"ref18"},{"volume-title":"Big-O notation. Wikipedia, The Free Encyclopedia","year":"2024","key":"ref19"},{"journal-title":"HuggingFace\u2019s Transformers: State-of-the-art Natural Language Processing","year":"2020","author":"Wolf","key":"ref20"}],"event":{"name":"2025 International Conference on Military Communication and Information Systems (ICMCIS)","start":{"date-parts":[[2025,5,13]]},"location":"Oerias, Portugal","end":{"date-parts":[[2025,5,14]]}},"container-title":["2025 International Conference on Military Communication and Information Systems (ICMCIS)"],"original-title":[],"link":[{"URL":"http:\/\/xplorestaging.ieee.org\/ielx8\/11047255\/11047555\/11048102.pdf?arnumber=11048102","content-type":"unspecified","content-version":"vor","intended-application":"similarity-checking"}],"deposited":{"date-parts":[[2025,7,1]],"date-time":"2025-07-01T06:07:47Z","timestamp":1751350067000},"score":1,"resource":{"primary":{"URL":"https:\/\/ieeexplore.ieee.org\/document\/11048102\/"}},"subtitle":[],"short-title":[],"issued":{"date-parts":[[2025,5,13]]},"references-count":20,"URL":"https:\/\/doi.org\/10.1109\/icmcis64378.2025.11048102","relation":{},"subject":[],"published":{"date-parts":[[2025,5,13]]}}}