{"status":"ok","message-type":"work","message-version":"1.0.0","message":{"indexed":{"date-parts":[[2026,4,20]],"date-time":"2026-04-20T23:49:15Z","timestamp":1776728955603,"version":"3.51.2"},"publisher-location":"Cham","reference-count":31,"publisher":"Springer Nature Switzerland","isbn-type":[{"value":"9783031877773","type":"print"},{"value":"9783031877780","type":"electronic"}],"license":[{"start":{"date-parts":[[2025,1,1]],"date-time":"2025-01-01T00:00:00Z","timestamp":1735689600000},"content-version":"tdm","delay-in-days":0,"URL":"https:\/\/www.springernature.com\/gp\/researchers\/text-and-data-mining"},{"start":{"date-parts":[[2025,1,1]],"date-time":"2025-01-01T00:00:00Z","timestamp":1735689600000},"content-version":"vor","delay-in-days":0,"URL":"https:\/\/www.springernature.com\/gp\/researchers\/text-and-data-mining"}],"content-domain":{"domain":["link.springer.com"],"crossmark-restriction":false},"short-container-title":[],"published-print":{"date-parts":[[2025]]},"DOI":"10.1007\/978-3-031-87778-0_19","type":"book-chapter","created":{"date-parts":[[2025,4,15]],"date-time":"2025-04-15T16:22:55Z","timestamp":1744734175000},"page":"196-205","update-policy":"https:\/\/doi.org\/10.1007\/springer_crossmark_policy","source":"Crossref","is-referenced-by-count":2,"title":["Deploying Large Language Model on\u00a0Cloud-Edge Architectures: A Case Study for\u00a0Conversational Historical Characters"],"prefix":"10.1007","author":[{"given":"Mariangela","family":"Graziano","sequence":"first","affiliation":[],"role":[{"role":"author","vocabulary":"crossref"}]},{"given":"Luigi","family":"Colucci Cante","sequence":"additional","affiliation":[],"role":[{"role":"author","vocabulary":"crossref"}]},{"given":"Beniamino","family":"Di Martino","sequence":"additional","affiliation":[],"role":[{"role":"author","vocabulary":"crossref"}]}],"member":"297","published-online":{"date-parts":[[2025,4,16]]},"reference":[{"issue":"1","key":"19_CR1","doi-asserted-by":"crossref","first-page":"01","DOI":"10.51317\/ecjecs.v1i1.458","volume":"1","author":"J Abrera","year":"2024","unstructured":"Abrera, J., et al.: Data privacy and security in cloud computing: a comprehensive review. J. Comput. Sci. Inform. Technol. 1(1), 01\u201309 (2024)","journal-title":"J. Comput. Sci. Inform. Technol."},{"key":"19_CR2","doi-asserted-by":"crossref","unstructured":"Alkaeed, M., Qayyum, A., Qadir, J.: Privacy preservation in artificial intelligence and extended reality (ai-xr) metaverses: a survey. J. Netw. Comput. Appli., 103989 (2024)","DOI":"10.1016\/j.jnca.2024.103989"},{"key":"19_CR3","unstructured":"Baktash, J.A., Dawodi, M.: Gpt-4: A review on advancements and opportunities in natural language processing. arXiv preprint arXiv:2305.03195 (2023)"},{"key":"19_CR4","doi-asserted-by":"crossref","unstructured":"Cantiello, p., Di\u00a0Martino, B., Mastroianni, M., Cante, L.C., Graziano, M.: Towards a cloud model choice evaluation: comparison between cost\/features and ontology-based analysis. Inter. J. Grid Utility Comput. (2022)","DOI":"10.1504\/IJGUC.2023.10054821"},{"key":"19_CR5","doi-asserted-by":"crossref","unstructured":"Di Martino, B., Cante, L.C., Esposito, A., Graziano, M.: Towards a methodology for the semantic representation of iot sensors and bpmns to discover business process patterns: a smart irrigation case study. In: Barolli, L. (ed.) Advances on Broad-Band Wireless Computing, Communication and Applications, pp. 248\u2013258. Springer International Publishing, Cham (2023)","DOI":"10.1007\/978-3-031-20029-8_24"},{"key":"19_CR6","series-title":"Lecture Notes in Networks and Systems","doi-asserted-by":"publisher","first-page":"153","DOI":"10.1007\/978-3-030-99619-2_15","volume-title":"Advanced Information Networking and Applications","author":"B Di Martino","year":"2022","unstructured":"Di Martino, B., Colucci Cante, L., Cerullo, N.: Opportunities and advantages of cloud migration of a smart restaurant system. In: Barolli, L., Hussain, F., Enokido, T. (eds.) AINA 2022. LNNS, vol. 451, pp. 153\u2013162. Springer, Cham (2022). https:\/\/doi.org\/10.1007\/978-3-030-99619-2_15"},{"key":"19_CR7","series-title":"Lecture Notes in Networks and Systems","doi-asserted-by":"publisher","first-page":"163","DOI":"10.1007\/978-3-030-99619-2_16","volume-title":"Advanced Information Networking and Applications","author":"B Di Martino","year":"2022","unstructured":"Di Martino, B., Graziano, M., Colucci Cante, L., Cascone, D.: Analysis of\u00a0techniques for\u00a0mapping convolutional neural networks onto\u00a0cloud edge architectures using splitfed learning method. In: Barolli, L., Hussain, F., Enokido, T. (eds.) AINA 2022. LNNS, vol. 451, pp. 163\u2013172. Springer, Cham (2022). https:\/\/doi.org\/10.1007\/978-3-030-99619-2_16"},{"issue":"1","key":"19_CR8","doi-asserted-by":"publisher","first-page":"591","DOI":"10.1109\/COMST.2022.3218527","volume":"25","author":"S Duan","year":"2022","unstructured":"Duan, S., Dan Wang, J., Ren, F.L., Zhang, Y., Huaqing, W., Shen, X.: Distributed artificial intelligence empowered by end-edge-cloud computing: a survey. IEEE Commun. Surv. Tutorials 25(1), 591\u2013624 (2022)","journal-title":"IEEE Commun. Surv. Tutorials"},{"key":"19_CR9","unstructured":"Fernandez, R.S., et al.:Seeping semantics: linking datasets using word embeddings for data discovery. In: 2018 IEEE 34th International Conference on Data Engineering (ICDE), pp. 989\u20131000. IEEE (2018)"},{"key":"19_CR10","doi-asserted-by":"crossref","unstructured":"Fran\u00e7a, R.P., Bonacin, R., Monteiro, A.C.B.: An overview of data privacy and security in cloud platforms: Exploring the intersection of digital technologies currently. Digital Cultural Heritage, pp. 21\u201339 (2024)","DOI":"10.1201\/9781032630564-2"},{"key":"19_CR11","doi-asserted-by":"crossref","unstructured":"Friha, O., Ferrag, M.A., Kantarci, B., Cakmak, B., Ozgun, A., Ghoualmi-Zine, N.: Llm-based edge intelligence: a comprehensive survey on architectures, applications, security and trustworthiness. IEEE Open Journal of the Communications Society (2024)","DOI":"10.1109\/OJCOMS.2024.3456549"},{"key":"19_CR12","doi-asserted-by":"crossref","unstructured":"Hu, Y., Ye, D., Kang, J., Wu, M., Yu, R.: A cloud-edge collaborative architecture for multimodal llms-based advanced driver assistance systems in iot networks. IEEE Internet of Things J. (2024)","DOI":"10.1109\/JIOT.2024.3509628"},{"key":"19_CR13","doi-asserted-by":"crossref","unstructured":"Islam, R., Ahmed, I.: Gemini-the most powerful llm: Myth or truth. In: 2024 5th Information Communication Technologies Conference (ICTC), pp. 303\u2013308 (2024)","DOI":"10.1109\/ICTC61510.2024.10602253"},{"key":"19_CR14","unstructured":"Jiang, A.Q., et\u00a0al.: Mistral 7b. arXiv preprint arXiv:2310.06825 (2023)"},{"key":"19_CR15","unstructured":"Jin, H., Wu, Y.: Ce-collm: efficient and adaptive large language models through cloud-edge collaboration. arXiv preprint arXiv:2411.02829 (2024)"},{"key":"19_CR16","doi-asserted-by":"crossref","unstructured":"Laskaridis, S., Katevas, K., Minto, L., Haddadi, H.: Melting point: mobile evaluation of language transformers. In: Proceedings of the 30th Annual International Conference on Mobile Computing and Networking, pp. 890\u2013907 (2024)","DOI":"10.1145\/3636534.3690668"},{"key":"19_CR17","unstructured":"Lee, J.S.: Lexgpt 0.1: pre-trained gpt-j models with pile of law. arXiv preprint arXiv:2306.05431 (2023)"},{"issue":"4","key":"19_CR18","doi-asserted-by":"publisher","first-page":"59","DOI":"10.55524\/ijircst.2024.12.4.10","volume":"12","author":"H Li","year":"2024","unstructured":"Li, H., Wang, S.X., Shang, F., Niu, K., Song, R.: Applications of large language models in cloud computing: an empirical study using real-world data. Intern. J. Innovative Res. Comput. Sci. Technol. 12(4), 59\u201369 (2024)","journal-title":"Intern. J. Innovative Res. Comput. Sci. Technol."},{"key":"19_CR19","doi-asserted-by":"crossref","unstructured":"Qu, G., Chen, Q., Wei, W., Lin, Z., Chen, X., Huang, K.: Mobile edge intelligence for large language models: A contemporary survey. arXiv preprint arXiv:2407.18921 (2024)","DOI":"10.36227\/techrxiv.172115025.57884352\/v1"},{"key":"19_CR20","doi-asserted-by":"crossref","unstructured":"Rao, K., Coviello, G., Benedetti, P., ]De\u00a0Vita, C.G., Mellone, G., Chakradhar, S.: Eco-llm: Llm-based edge cloud optimization. In: Proceedings of the 2024 Workshop on AI For Systems, pp. 7\u201312 (2024)","DOI":"10.1145\/3660605.3660941"},{"key":"19_CR21","unstructured":"Sanh, V.: Distilbert, a distilled version of bert: smaller, faster, cheaper and lighter. arXiv preprint arXiv:1910.01108 (2019)"},{"issue":"10","key":"19_CR22","doi-asserted-by":"publisher","first-page":"1","DOI":"10.1145\/3659097","volume":"56","author":"P Souza","year":"2024","unstructured":"Souza, P., Ferreto, T., Calheiros, R.: Maintenance operations on cloud, edge, and iot environments: taxonomy, survey, and research challenges. ACM Comput. Surv. 56(10), 1\u201338 (2024)","journal-title":"ACM Comput. Surv."},{"key":"19_CR23","unstructured":"Team, G., et\u00a0al. Gemini: a family of highly capable multimodal models. arXiv preprint arXiv:2312.11805 (2023)"},{"key":"19_CR24","doi-asserted-by":"crossref","unstructured":"Wang, B., Wang, S., Ouyang, Q.: Probabilistic inference layer integration in mistral llm for accurate information retrieval (2024)","DOI":"10.21203\/rs.3.rs-3828707\/v1"},{"key":"19_CR25","unstructured":"Xu, J., et al.:On-device language models: a comprehensive review. arXiv preprint arXiv:2409.00088 (2024)"},{"key":"19_CR26","doi-asserted-by":"crossref","unstructured":"Yang, F., et al.: Efficient deployment of large language model across cloud-device systems. In: 2024 IEEE 37th International System-on-Chip Conference (SOCC), pp. 1\u20136. IEEE (2024)","DOI":"10.1109\/SOCC62300.2024.10737825"},{"key":"19_CR27","unstructured":"Yuan, Z., Li, Z., Huang, W., Ye, Y., Sun, L.: Tinygpt-v: Efficient multimodal large language model via small backbones. arXiv preprint arXiv:2312.16862 (2023)"},{"key":"19_CR28","doi-asserted-by":"publisher","DOI":"10.1016\/j.compeleceng.2024.109758","volume":"120","author":"X Zhai","year":"2024","unstructured":"Zhai, X., Peng, Y., Guo, X.: Edge-cloud collaboration for low-latency, low-carbon, and cost-efficient operations. Comput. Electr. Eng. 120, 109758 (2024)","journal-title":"Comput. Electr. Eng."},{"key":"19_CR29","doi-asserted-by":"crossref","unstructured":"Zhang, M., Shen, X., Cao, J., Cui, Z., Jiang, S.: Edgeshard: efficient llm inference via collaborative edge computing. IEEE Internet of Things Journal (2024)","DOI":"10.1109\/JIOT.2024.3524255"},{"key":"19_CR30","unstructured":"Zhang*, T., Kishore*, V., Wu*, F., Weinberger, K.Q., Artzi, Y.: Bertscore: evaluating text generation with bert. In: International Conference on Learning Representations (2020)"},{"key":"19_CR31","unstructured":"Zheng, Y., Chen, Y., Qian, B., Shi, X., Shu, Y., Chen, J.: A review on edge large language models: Design, execution, and applications. arXiv preprint arXiv:2410.11845 (2024)"}],"container-title":["Lecture Notes on Data Engineering and Communications Technologies","Advanced Information Networking and Applications"],"original-title":[],"language":"en","link":[{"URL":"https:\/\/link.springer.com\/content\/pdf\/10.1007\/978-3-031-87778-0_19","content-type":"unspecified","content-version":"vor","intended-application":"similarity-checking"}],"deposited":{"date-parts":[[2025,4,15]],"date-time":"2025-04-15T16:23:09Z","timestamp":1744734189000},"score":1,"resource":{"primary":{"URL":"https:\/\/link.springer.com\/10.1007\/978-3-031-87778-0_19"}},"subtitle":[],"short-title":[],"issued":{"date-parts":[[2025]]},"ISBN":["9783031877773","9783031877780"],"references-count":31,"URL":"https:\/\/doi.org\/10.1007\/978-3-031-87778-0_19","relation":{},"ISSN":["2367-4512","2367-4520"],"issn-type":[{"value":"2367-4512","type":"print"},{"value":"2367-4520","type":"electronic"}],"subject":[],"published":{"date-parts":[[2025]]},"assertion":[{"value":"16 April 2025","order":1,"name":"first_online","label":"First Online","group":{"name":"ChapterHistory","label":"Chapter History"}},{"value":"AINA","order":1,"name":"conference_acronym","label":"Conference Acronym","group":{"name":"ConferenceInfo","label":"Conference Information"}},{"value":"International Conference on Advanced Information Networking and Applications","order":2,"name":"conference_name","label":"Conference Name","group":{"name":"ConferenceInfo","label":"Conference Information"}},{"value":"Barcelona","order":3,"name":"conference_city","label":"Conference City","group":{"name":"ConferenceInfo","label":"Conference Information"}},{"value":"Spain","order":4,"name":"conference_country","label":"Conference Country","group":{"name":"ConferenceInfo","label":"Conference Information"}},{"value":"2025","order":5,"name":"conference_year","label":"Conference Year","group":{"name":"ConferenceInfo","label":"Conference Information"}},{"value":"9 April 2025","order":7,"name":"conference_start_date","label":"Conference Start Date","group":{"name":"ConferenceInfo","label":"Conference Information"}},{"value":"11 April 2025","order":8,"name":"conference_end_date","label":"Conference End Date","group":{"name":"ConferenceInfo","label":"Conference Information"}},{"value":"39","order":9,"name":"conference_number","label":"Conference Number","group":{"name":"ConferenceInfo","label":"Conference Information"}},{"value":"aina0","order":10,"name":"conference_id","label":"Conference ID","group":{"name":"ConferenceInfo","label":"Conference Information"}},{"value":"http:\/\/voyager.ce.fit.ac.jp\/conf\/aina\/2025\/","order":11,"name":"conference_url","label":"Conference URL","group":{"name":"ConferenceInfo","label":"Conference Information"}}]}}