{"status":"ok","message-type":"work","message-version":"1.0.0","message":{"indexed":{"date-parts":[[2026,6,9]],"date-time":"2026-06-09T16:18:53Z","timestamp":1781021933754,"version":"3.54.1"},"reference-count":39,"publisher":"IEEE","license":[{"start":{"date-parts":[[2025,4,6]],"date-time":"2025-04-06T00:00:00Z","timestamp":1743897600000},"content-version":"stm-asf","delay-in-days":0,"URL":"https:\/\/doi.org\/10.15223\/policy-029"},{"start":{"date-parts":[[2025,4,6]],"date-time":"2025-04-06T00:00:00Z","timestamp":1743897600000},"content-version":"stm-asf","delay-in-days":0,"URL":"https:\/\/doi.org\/10.15223\/policy-037"}],"content-domain":{"domain":[],"crossmark-restriction":false},"short-container-title":[],"published-print":{"date-parts":[[2025,4,6]]},"DOI":"10.1109\/icassp49660.2025.10889971","type":"proceedings-article","created":{"date-parts":[[2025,3,12]],"date-time":"2025-03-12T17:15:19Z","timestamp":1741799719000},"page":"1-5","source":"Crossref","is-referenced-by-count":3,"title":["CE-FFT: Communication-Efficient Federated Fine-Tuning for Large Language Models via Quantization and In-Context Learning"],"prefix":"10.1109","author":[{"given":"Pengyu","family":"Zhang","sequence":"first","affiliation":[{"name":"East China Normal University,MoE Engineering Research Center of SW\/HW Co-Design Technology and Application"}],"role":[{"vocabulary":"crossref","role":"author"}]},{"given":"Yingjie","family":"Liu","sequence":"additional","affiliation":[{"name":"East China Normal University,MoE Engineering Research Center of SW\/HW Co-Design Technology and Application"}],"role":[{"vocabulary":"crossref","role":"author"}]},{"given":"Yingbo","family":"Zhou","sequence":"additional","affiliation":[{"name":"East China Normal University,MoE Engineering Research Center of SW\/HW Co-Design Technology and Application"}],"role":[{"vocabulary":"crossref","role":"author"}]},{"given":"Ming","family":"Hu","sequence":"additional","affiliation":[{"name":"Singapore Management University,School of Computing and Information Systems"}],"role":[{"vocabulary":"crossref","role":"author"}]},{"given":"Xian","family":"Wei","sequence":"additional","affiliation":[{"name":"East China Normal University,MoE Engineering Research Center of SW\/HW Co-Design Technology and Application"}],"role":[{"vocabulary":"crossref","role":"author"}]},{"given":"Mingsong","family":"Chen","sequence":"additional","affiliation":[{"name":"East China Normal University,MoE Engineering Research Center of SW\/HW Co-Design Technology and Application"}],"role":[{"vocabulary":"crossref","role":"author"}]}],"member":"263","reference":[{"key":"ref1","doi-asserted-by":"publisher","DOI":"10.1109\/ICASSP48485.2024.10447454"},{"key":"ref2","doi-asserted-by":"publisher","DOI":"10.1145\/3637528.3671582"},{"key":"ref3","doi-asserted-by":"crossref","DOI":"10.36227\/techrxiv.173272996.63900291\/v1","article-title":"Automated federated pipeline for parameter-efficient fine-tuning of large language models","author":"Fang","year":"2024"},{"key":"ref4","first-page":"2790","article-title":"Parameter-efficient transfer learning for nlp","volume-title":"Proceedings of International Conference on Machine Learning (ICML)","author":"Houlsby"},{"key":"ref5","doi-asserted-by":"publisher","DOI":"10.18653\/v1\/2022.acl-short.8"},{"key":"ref6","article-title":"Lora: Low-rank adaptation of large language models","volume-title":"Proceedings of International Conference on Learning Representations (ICLR)","author":"Hu"},{"key":"ref7","doi-asserted-by":"publisher","DOI":"10.1109\/ICASSP48485.2024.10447004"},{"key":"ref8","doi-asserted-by":"publisher","DOI":"10.18653\/v1\/2023.acl-short.107"},{"key":"ref9","doi-asserted-by":"publisher","DOI":"10.18653\/v1\/2023.emnlp-main.319"},{"key":"ref10","doi-asserted-by":"publisher","DOI":"10.1109\/ICASSP48485.2024.10447662"},{"key":"ref11","doi-asserted-by":"publisher","DOI":"10.1109\/INFOCOM53939.2023.10229032"},{"key":"ref12","doi-asserted-by":"publisher","DOI":"10.1109\/INFOCOM53939.2023.10229061"},{"key":"ref13","doi-asserted-by":"publisher","DOI":"10.1109\/INFOCOM53939.2023.10229029"},{"key":"ref14","first-page":"8253","article-title":"Fetchsgd: Communication-efficient federated learning with sketching","volume-title":"Proceedings of International Conference on Machine Learning (ICML)","author":"Rothchild"},{"key":"ref15","doi-asserted-by":"publisher","DOI":"10.1109\/ICASSP48485.2024.10446879"},{"key":"ref16","doi-asserted-by":"publisher","DOI":"10.1109\/INFOCOM53939.2023.10228970"},{"key":"ref17","doi-asserted-by":"publisher","DOI":"10.1109\/ICASSP40776.2020.9054168"},{"key":"ref18","doi-asserted-by":"publisher","DOI":"10.1109\/ICASSP48485.2024.10447045"},{"key":"ref19","doi-asserted-by":"publisher","DOI":"10.1109\/INFOCOM48880.2022.9796982"},{"key":"ref20","doi-asserted-by":"publisher","DOI":"10.1109\/TSP.2020.3046971"},{"key":"ref21","article-title":"Personalized federated instruction tuning via neural architecture search","author":"Zhang","year":"2024"},{"key":"ref22","doi-asserted-by":"publisher","DOI":"10.1109\/RTSS59052.2023.00022"},{"key":"ref23","doi-asserted-by":"publisher","DOI":"10.1145\/3637528.3671722"},{"key":"ref24","article-title":"Dual-personalizing adapter for federated foundation models","author":"Yang","year":"2024"},{"key":"ref25","first-page":"24 824","article-title":"Chain-of-thought prompting elicits reasoning in large language models","volume-title":"Proceedings of Advances in Neural Information Processing Systems (NeurIPS)","volume":"35","author":"Wei"},{"key":"ref26","article-title":"Tree of thoughts: Deliberate problem solving with large language models","volume-title":"Proceedings of Advances in Neural Information Processing Systems (NeurIPS)","volume":"36","author":"Yao"},{"key":"ref27","doi-asserted-by":"publisher","DOI":"10.18653\/v1\/2024.emnlp-main.64"},{"key":"ref28","doi-asserted-by":"publisher","DOI":"10.18653\/v1\/2024.acl-long.58"},{"issue":"3","key":"ref29","first-page":"6","article-title":"Vicuna: An open-source chatbot impressing gpt-4 with 90%* chatgpt quality","volume":"2","author":"Chiang","year":"2023"},{"key":"ref30","article-title":"Code alpaca: An instruction-following llama model for code generation","author":"Chaudhary","year":"2023","journal-title":"Code alpaca: An instruction-following llama model for code generation"},{"key":"ref31","first-page":"22 631","article-title":"The flan collection: Designing data and methods for effective instruction tuning","volume-title":"Proceedings of International Conference on Machine Learning (ICML)","author":"Longpre"},{"key":"ref32","article-title":"OPTQ: Accurate quantization for generative pre-trained transformers","volume-title":"Proceedings of International Conference on Learning Representations (ICLR)","author":"Frantar"},{"key":"ref33","first-page":"87","article-title":"Awq: Activation-aware weight quantization for on-device llm compression and acceleration","volume-title":"Proceedings of Machine Learning and Systems (LMSys)","volume":"6","author":"Lin"},{"key":"ref34","first-page":"38 087","article-title":"Smoothquant: Accurate and efficient post-training quantization for large language models","volume-title":"Proceedings of International Conference on Machine Learning (ICML)","author":"Xiao"},{"key":"ref35","article-title":"Llama 2: Open foundation and fine-tuned chat models","author":"Touvron","year":"2023"},{"key":"ref36","article-title":"Qlora: Efficient finetuning of quantized llms","volume-title":"Proceedings of Advances in Neural Information Processing Systems (NeurIPS)","volume":"36","author":"Dettmers"},{"key":"ref37","article-title":"Sgdr: Stochastic gradient descent with warm restarts","author":"Loshchilov","year":"2016"},{"key":"ref38","article-title":"Relora: High-rank training through low-rank updates","volume-title":"Proceedings of International Conference on Learning Representations (ICLR)","author":"Lialin"},{"key":"ref39","first-page":"18 250","article-title":"Generalized federated learning via sharpness aware minimization","volume-title":"Proceedings of International conference on machine learning (ICML)","author":"Qu"}],"event":{"name":"ICASSP 2025 - 2025 IEEE International Conference on Acoustics, Speech and Signal Processing (ICASSP)","location":"Hyderabad, India","start":{"date-parts":[[2025,4,6]]},"end":{"date-parts":[[2025,4,11]]}},"container-title":["ICASSP 2025 - 2025 IEEE International Conference on Acoustics, Speech and Signal Processing (ICASSP)"],"original-title":[],"link":[{"URL":"http:\/\/xplorestaging.ieee.org\/ielx8\/10887540\/10887541\/10889971.pdf?arnumber=10889971","content-type":"unspecified","content-version":"vor","intended-application":"similarity-checking"}],"deposited":{"date-parts":[[2026,3,25]],"date-time":"2026-03-25T05:22:49Z","timestamp":1774416169000},"score":1,"resource":{"primary":{"URL":"https:\/\/ieeexplore.ieee.org\/document\/10889971\/"}},"subtitle":[],"short-title":[],"issued":{"date-parts":[[2025,4,6]]},"references-count":39,"URL":"https:\/\/doi.org\/10.1109\/icassp49660.2025.10889971","relation":{},"subject":[],"published":{"date-parts":[[2025,4,6]]}}}