{"status":"ok","message-type":"work","message-version":"1.0.0","message":{"indexed":{"date-parts":[[2025,6,10]],"date-time":"2025-06-10T04:03:20Z","timestamp":1749528200808,"version":"3.41.0"},"publisher-location":"Cham","reference-count":18,"publisher":"Springer Nature Switzerland","isbn-type":[{"value":"9783031902024","type":"print"},{"value":"9783031902031","type":"electronic"}],"license":[{"start":{"date-parts":[[2025,1,1]],"date-time":"2025-01-01T00:00:00Z","timestamp":1735689600000},"content-version":"tdm","delay-in-days":0,"URL":"https:\/\/www.springernature.com\/gp\/researchers\/text-and-data-mining"},{"start":{"date-parts":[[2025,1,1]],"date-time":"2025-01-01T00:00:00Z","timestamp":1735689600000},"content-version":"vor","delay-in-days":0,"URL":"https:\/\/www.springernature.com\/gp\/researchers\/text-and-data-mining"}],"content-domain":{"domain":["link.springer.com"],"crossmark-restriction":false},"short-container-title":[],"published-print":{"date-parts":[[2025]]},"DOI":"10.1007\/978-3-031-90203-1_21","type":"book-chapter","created":{"date-parts":[[2025,6,9]],"date-time":"2025-06-09T15:48:57Z","timestamp":1749484137000},"page":"243-255","update-policy":"https:\/\/doi.org\/10.1007\/springer_crossmark_policy","source":"Crossref","is-referenced-by-count":0,"title":["Efficient Deployment and\u00a0Fine-Tuning of\u00a0Transformer-Based Models on\u00a0the\u00a0Device-Edge"],"prefix":"10.1007","author":[{"ORCID":"https:\/\/orcid.org\/0009-0002-0855-8909","authenticated-orcid":false,"given":"Hongfeng","family":"Li","sequence":"first","affiliation":[]},{"given":"Geming","family":"Xia","sequence":"additional","affiliation":[]},{"given":"Yuze","family":"Zhang","sequence":"additional","affiliation":[]},{"given":"Zhiping","family":"Cai","sequence":"additional","affiliation":[]},{"given":"Hongcheng","family":"Li","sequence":"additional","affiliation":[]},{"given":"Chaodong","family":"Yu","sequence":"additional","affiliation":[]}],"member":"297","published-online":{"date-parts":[[2025,6,10]]},"reference":[{"key":"21_CR1","unstructured":"Chaodong, Y., Jian, C., Xia, G., Zhaohang, W.: Adaptive asynchronous federated learning for edge intelligence. In: 2021 International Conference on Machine Learning and Intelligent Systems Engineering, MLISE 2021 (2021)"},{"key":"21_CR2","doi-asserted-by":"crossref","unstructured":"Ahmed, A., Ahmed, E.: A survey on mobile edge computing. In: 2016 10th International Conference on Intelligent Systems and Control (ISCO), pp.\u00a01\u20138 (2016)","DOI":"10.1109\/ISCO.2016.7727082"},{"key":"21_CR3","doi-asserted-by":"crossref","unstructured":"Lin, T., Wang, Y., Liu, X., Qiu, X.: A survey of transformers. AI Open 3, 111\u2013132 (2021). https:\/\/api.semanticscholar.org\/CorpusID:235368340","DOI":"10.1016\/j.aiopen.2022.10.001"},{"key":"21_CR4","unstructured":"Devlin, J., Chang, M.W., Lee, K., Toutanova, K.: Bert: pre-training of deep bidirectional transformers for language understanding (2019)"},{"key":"21_CR5","unstructured":"Dosovitskiy, A., Beyer, L., Kolesnikov, A., Weissenborn, D., Houlsby, N.: An image is worth 16x16 words: transformers for image recognition at scale (2020)"},{"key":"21_CR6","unstructured":"Konen, J., Mcmahan, B., Ramage, D.: Federated optimization: distributed optimization beyond the datacenter. Mathematics (2015)"},{"key":"21_CR7","doi-asserted-by":"publisher","first-page":"1","DOI":"10.1016\/j.jnca.2018.05.003","volume":"116","author":"O Gupta","year":"2018","unstructured":"Gupta, O., Raskar, R.: Distributed learning of deep neural network over multiple agents. J. Netw. Comput. Appl. 116, 1\u20138 (2018)","journal-title":"J. Netw. Comput. Appl."},{"key":"21_CR8","unstructured":"Shi, S., Yang, Q., Xiang, Y., Qi, S., Wang, X.: An efficient split fine-tuning framework for edge and cloud collaborative learning (2022)"},{"key":"21_CR9","doi-asserted-by":"crossref","unstructured":"Vucetic, D., Tayaranian, M., Ziaeefard, M., Clark, J.J., Meyer, B.H., Gross, W.J.: Efficient fine-tuning of bert models on the edge. In: 2022 IEEE International Symposium on Circuits and Systems (ISCAS), pp. 1838\u20131842. IEEE (2022)","DOI":"10.1109\/ISCAS48785.2022.9937567"},{"key":"21_CR10","unstructured":"Houlsby, N., et al.: Parameter-efficient transfer learning for NLP. In: Chaudhuri, K., Salakhutdinov, R. (eds.) Proceedings of the 36th International Conference on Machine Learning. Proceedings of Machine Learning Research, vol.\u00a097, pp. 2790\u20132799. PMLR (2019)"},{"key":"21_CR11","unstructured":"Hu, E.J., et al.: Lora: low-rank adaptation of large language models (2021)"},{"key":"21_CR12","doi-asserted-by":"crossref","unstructured":"Du, M., Yue, X., Chow, S.S.M., Wang, T., Huang, C., Sun, H.: Dp-forward: fine-tuning and inference on language models with differential privacy in forward pass. In: Proceedings of the 2023 ACM SIGSAC Conference on Computer and Communications Security, CCS \u201923, pp. 2665\u20132679 (2023)","DOI":"10.1145\/3576915.3616592"},{"issue":"6","key":"21_CR13","doi-asserted-by":"publisher","first-page":"4270","DOI":"10.1109\/TDSC.2021.3126315","volume":"19","author":"J Hou","year":"2022","unstructured":"Hou, J., Liu, H., Liu, Y., Wang, Y., Wan, P.J., Li, X.Y.: Model protection: real-time privacy-preserving inference service for model privacy at the edge. IEEE Trans. Dependable Secure Comput. 19(6), 4270\u20134284 (2022)","journal-title":"IEEE Trans. Dependable Secure Comput."},{"key":"21_CR14","doi-asserted-by":"crossref","unstructured":"Touvron, H., Cord, M., El-Nouby, A., Verbeek, J., J\u00e9gou, H.: Three things everyone should know about vision transformers. In: Computer Vision \u2013 ECCV 2022: 17th European Conference, Tel Aviv, Israel, 23\u201327 October 2022, p. 497\u2013515 (2022)","DOI":"10.1007\/978-3-031-20053-3_29"},{"key":"21_CR15","doi-asserted-by":"crossref","unstructured":"Ben\u00a0Zaken, E., Goldberg, Y., Ravfogel, S.: BitFit: Simple parameter-efficient fine-tuning for transformer-based masked language-models. In: Proceedings of the 60th Annual Meeting of the Association for Computational Linguistics. pp.\u00a01\u20139. Association for Computational Linguistics, Dublin (2022)","DOI":"10.18653\/v1\/2022.acl-short.1"},{"key":"21_CR16","doi-asserted-by":"crossref","unstructured":"Wang, A., Singh, A., Michael, J., Hill, F., Levy, O., Bowman, S.R.: Glue: a multi-task benchmark and analysis platform for natural language understanding. In: BlackboxNLP@EMNLP (2018)","DOI":"10.18653\/v1\/W18-5446"},{"key":"21_CR17","unstructured":"Krizhevsky, A.: Learning multiple layers of features from tiny images (2009). https:\/\/api.semanticscholar.org\/CorpusID:18268744"},{"key":"21_CR18","doi-asserted-by":"crossref","unstructured":"Nilsback, M.E., Zisserman, A.: Automated flower classification over a large number of classes. In: 2008 Sixth Indian Conference on Computer Vision, Graphics & Image Processing, pp. 722\u2013729 (2008)","DOI":"10.1109\/ICVGIP.2008.47"}],"container-title":["Lecture Notes in Computer Science","Euro-Par 2024: Parallel Processing Workshops"],"original-title":[],"language":"en","link":[{"URL":"https:\/\/link.springer.com\/content\/pdf\/10.1007\/978-3-031-90203-1_21","content-type":"unspecified","content-version":"vor","intended-application":"similarity-checking"}],"deposited":{"date-parts":[[2025,6,9]],"date-time":"2025-06-09T15:49:06Z","timestamp":1749484146000},"score":1,"resource":{"primary":{"URL":"https:\/\/link.springer.com\/10.1007\/978-3-031-90203-1_21"}},"subtitle":[],"short-title":[],"issued":{"date-parts":[[2025]]},"ISBN":["9783031902024","9783031902031"],"references-count":18,"URL":"https:\/\/doi.org\/10.1007\/978-3-031-90203-1_21","relation":{},"ISSN":["0302-9743","1611-3349"],"issn-type":[{"value":"0302-9743","type":"print"},{"value":"1611-3349","type":"electronic"}],"subject":[],"published":{"date-parts":[[2025]]},"assertion":[{"value":"10 June 2025","order":1,"name":"first_online","label":"First Online","group":{"name":"ChapterHistory","label":"Chapter History"}},{"value":"Euro-Par","order":1,"name":"conference_acronym","label":"Conference Acronym","group":{"name":"ConferenceInfo","label":"Conference Information"}},{"value":"European Conference on Parallel Processing","order":2,"name":"conference_name","label":"Conference Name","group":{"name":"ConferenceInfo","label":"Conference Information"}},{"value":"Madrid","order":3,"name":"conference_city","label":"Conference City","group":{"name":"ConferenceInfo","label":"Conference Information"}},{"value":"Spain","order":4,"name":"conference_country","label":"Conference Country","group":{"name":"ConferenceInfo","label":"Conference Information"}},{"value":"2024","order":5,"name":"conference_year","label":"Conference Year","group":{"name":"ConferenceInfo","label":"Conference Information"}},{"value":"26 August 2024","order":7,"name":"conference_start_date","label":"Conference Start Date","group":{"name":"ConferenceInfo","label":"Conference Information"}},{"value":"30 August 2024","order":8,"name":"conference_end_date","label":"Conference End Date","group":{"name":"ConferenceInfo","label":"Conference Information"}},{"value":"30","order":9,"name":"conference_number","label":"Conference Number","group":{"name":"ConferenceInfo","label":"Conference Information"}},{"value":"europar2024","order":10,"name":"conference_id","label":"Conference ID","group":{"name":"ConferenceInfo","label":"Conference Information"}},{"value":"https:\/\/2024.euro-par.org\/","order":11,"name":"conference_url","label":"Conference URL","group":{"name":"ConferenceInfo","label":"Conference Information"}}]}}