{"status":"ok","message-type":"work","message-version":"1.0.0","message":{"indexed":{"date-parts":[[2025,12,20]],"date-time":"2025-12-20T22:26:06Z","timestamp":1766269566482,"version":"3.40.3"},"publisher-location":"Singapore","reference-count":33,"publisher":"Springer Nature Singapore","isbn-type":[{"type":"print","value":"9789819608102"},{"type":"electronic","value":"9789819608119"}],"license":[{"start":{"date-parts":[[2024,12,13]],"date-time":"2024-12-13T00:00:00Z","timestamp":1734048000000},"content-version":"tdm","delay-in-days":0,"URL":"https:\/\/www.springernature.com\/gp\/researchers\/text-and-data-mining"},{"start":{"date-parts":[[2024,12,13]],"date-time":"2024-12-13T00:00:00Z","timestamp":1734048000000},"content-version":"vor","delay-in-days":0,"URL":"https:\/\/www.springernature.com\/gp\/researchers\/text-and-data-mining"}],"content-domain":{"domain":["link.springer.com"],"crossmark-restriction":false},"short-container-title":[],"published-print":{"date-parts":[[2025]]},"DOI":"10.1007\/978-981-96-0811-9_20","type":"book-chapter","created":{"date-parts":[[2024,12,12]],"date-time":"2024-12-12T17:28:57Z","timestamp":1734024537000},"page":"283-299","update-policy":"https:\/\/doi.org\/10.1007\/springer_crossmark_policy","source":"Crossref","is-referenced-by-count":1,"title":["An Inference Acceleration Approach for\u00a0Boosting DNN Cold Start in\u00a0Cloud-Edge Computing"],"prefix":"10.1007","author":[{"given":"Hao","family":"Tian","sequence":"first","affiliation":[],"role":[{"role":"author","vocabulary":"crossref"}]},{"given":"Haolong","family":"Xiang","sequence":"additional","affiliation":[],"role":[{"role":"author","vocabulary":"crossref"}]},{"given":"Tingtong","family":"Zhu","sequence":"additional","affiliation":[],"role":[{"role":"author","vocabulary":"crossref"}]},{"given":"Siyuan","family":"Wu","sequence":"additional","affiliation":[],"role":[{"role":"author","vocabulary":"crossref"}]},{"given":"Cheng","family":"Chen","sequence":"additional","affiliation":[],"role":[{"role":"author","vocabulary":"crossref"}]},{"given":"Zheng","family":"Li","sequence":"additional","affiliation":[],"role":[{"role":"author","vocabulary":"crossref"}]},{"given":"Mingxu","family":"Jiang","sequence":"additional","affiliation":[],"role":[{"role":"author","vocabulary":"crossref"}]},{"given":"Wanchun","family":"Dou","sequence":"additional","affiliation":[],"role":[{"role":"author","vocabulary":"crossref"}]}],"member":"297","published-online":{"date-parts":[[2024,12,13]]},"reference":[{"key":"20_CR1","doi-asserted-by":"crossref","unstructured":"Awerbuch, B., Azar, Y., Epstein, A.: The price of routing unsplittable flow. In: Proceedings of the Thirty-Seventh Annual ACM Symposium on Theory of Computing, pp. 57\u201366 (2005)","DOI":"10.1145\/1060590.1060599"},{"issue":"8","key":"20_CR2","doi-asserted-by":"publisher","first-page":"8037","DOI":"10.1109\/TVT.2021.3090246","volume":"70","author":"J Chen","year":"2021","unstructured":"Chen, J., Chang, Z., Guo, X., Li, R., Han, Z., H\u00e4m\u00e4l\u00e4inen, T.: Resource allocation and computation offloading for multi-access edge computing with fronthaul and backhaul constraints. IEEE Trans. Veh. Technol. 70(8), 8037\u20138049 (2021)","journal-title":"IEEE Trans. Veh. Technol."},{"issue":"12","key":"20_CR3","doi-asserted-by":"publisher","first-page":"10146","DOI":"10.1109\/JIOT.2023.3237361","volume":"10","author":"W Fan","year":"2023","unstructured":"Fan, W., Gao, L., Su, Y., Wu, F., Liu, Y.: Joint DNN partition and resource allocation for task offloading in edge-cloud-assisted IoT environments. IEEE Internet Things J. 10(12), 10146\u201310159 (2023)","journal-title":"IEEE Internet Things J."},{"key":"20_CR4","series-title":"Lecture Notes in Computer Science","doi-asserted-by":"publisher","first-page":"30","DOI":"10.1007\/978-3-319-13129-0_3","volume-title":"Web and Internet Economics","author":"M Feldotto","year":"2014","unstructured":"Feldotto, M., Gairing, M., Skopalik, A.: Bounding the potential function in congestion games and approximate pure Nash equilibria. In: Liu, T.-Y., Qi, Q., Ye, Y. (eds.) WINE 2014. LNCS, vol. 8877, pp. 30\u201343. Springer, Cham (2014). https:\/\/doi.org\/10.1007\/978-3-319-13129-0_3"},{"key":"20_CR5","doi-asserted-by":"crossref","unstructured":"Fu, S., Dong, F., Shen, D., He, Q.: Joint quality evaluation, model splitting and resource provisioning for split edge learning. In: 2023 20th Annual IEEE International Conference on Sensing, Communication, and Networking (SECON), pp. 420\u2013428. IEEE (2023)","DOI":"10.1109\/SECON58729.2023.10287470"},{"issue":"3","key":"20_CR6","doi-asserted-by":"publisher","first-page":"515","DOI":"10.1109\/TPDS.2019.2938944","volume":"31","author":"Q He","year":"2019","unstructured":"He, Q., et al.: A game-theoretical approach for user allocation in edge computing environment. IEEE Trans. Parallel Distrib. Syst. 31(3), 515\u2013529 (2019)","journal-title":"IEEE Trans. Parallel Distrib. Syst."},{"key":"20_CR7","doi-asserted-by":"crossref","unstructured":"Hong, Z., Lin, J., Guo, S., Luo, S., Chen, W., Wattenhofer, R., Yu, Y.: Optimus: warming serverless ml inference via inter-function model transformation. In: Proceedings of the Nineteenth European Conference on Computer Systems, pp. 1039\u20131053 (2024)","DOI":"10.1145\/3627703.3629567"},{"key":"20_CR8","doi-asserted-by":"crossref","unstructured":"Hu, Y., et al.: Planning-oriented autonomous driving. In: Proceedings of the IEEE\/CVF Conference on Computer Vision and Pattern Recognition, pp. 17853\u201317862 (2023)","DOI":"10.1109\/CVPR52729.2023.01712"},{"issue":"9","key":"20_CR9","doi-asserted-by":"publisher","first-page":"1","DOI":"10.1145\/3555802","volume":"55","author":"H Hua","year":"2023","unstructured":"Hua, H., Li, Y., Wang, T., Dong, N., Li, W., Cao, J.: Edge computing with artificial intelligence: a machine learning perspective. ACM Comput. Surv. 55(9), 1\u201335 (2023)","journal-title":"ACM Comput. Surv."},{"key":"20_CR10","doi-asserted-by":"crossref","unstructured":"Huang, Q., et al.: HDMixer: hierarchical dependency with extendable patch for multivariate time series forecasting. In: Proceedings of the AAAI Conference on Artificial Intelligence, vol. 38, pp. 12608\u201312616 (2024)","DOI":"10.1609\/aaai.v38i11.29155"},{"key":"20_CR11","unstructured":"Huang, Q., et al.: CrossGNN: confronting noisy multivariate time series via cross interaction refinement. In: Advances in Neural Information Processing Systems, vol. 36 (2024)"},{"issue":"7","key":"20_CR12","doi-asserted-by":"publisher","first-page":"4000","DOI":"10.1109\/TMC.2022.3150432","volume":"22","author":"H Jiang","year":"2022","unstructured":"Jiang, H., Dai, X., Xiao, Z., Iyengar, A.: Joint task offloading and resource allocation for energy-constrained mobile edge computing. IEEE Trans. Mob. Comput. 22(7), 4000\u20134015 (2022)","journal-title":"IEEE Trans. Mob. Comput."},{"key":"20_CR13","doi-asserted-by":"crossref","unstructured":"Li, Y., Zeng, D., Gu, L., Ou, M., Chen, Q.: On efficient zygote container planning toward fast function startup in serverless edge cloud. In: IEEE INFOCOM 2023-IEEE Conference on Computer Communications, pp. 1\u20139. IEEE (2023)","DOI":"10.1109\/INFOCOM53939.2023.10228916"},{"issue":"12","key":"20_CR14","doi-asserted-by":"publisher","first-page":"15513","DOI":"10.1109\/TITS.2023.3249745","volume":"24","author":"L Liu","year":"2023","unstructured":"Liu, L., Feng, J., Mu, X., Pei, Q., Lan, D., Xiao, M.: Asynchronous deep reinforcement learning for collaborative task computing and on-demand resource allocation in vehicular edge computing. IEEE Trans. Intell. Transp. Syst. 24(12), 15513\u201315526 (2023)","journal-title":"IEEE Trans. Intell. Transp. Syst."},{"issue":"4","key":"20_CR15","doi-asserted-by":"publisher","first-page":"1186","DOI":"10.1109\/JSAC.2023.3242724","volume":"41","author":"Z Liu","year":"2023","unstructured":"Liu, Z., Lan, Q., Huang, K.: Resource allocation for multiuser edge inference with batching and early exiting. IEEE J. Sel. Areas Commun. 41(4), 1186\u20131200 (2023)","journal-title":"IEEE J. Sel. Areas Commun."},{"issue":"2","key":"20_CR16","first-page":"1586","volume":"23","author":"J Lou","year":"2024","unstructured":"Lou, J., Tang, Z., Jia, W., Zhao, W., Li, J.: Startup-aware dependent task scheduling with bandwidth constraints in edge computing. IEEE Trans. Mob. Comput. 23(2), 1586\u20131600 (2024)","journal-title":"IEEE Trans. Mob. Comput."},{"key":"20_CR17","doi-asserted-by":"crossref","unstructured":"Mohammed, T., Joe-Wong, C., Babbar, R., Di\u00a0Francesco, M.: Distributed inference acceleration with adaptive DNN partitioning and offloading. In: IEEE INFOCOM 2020-IEEE Conference on Computer Communications, pp. 854\u2013863. IEEE (2020)","DOI":"10.1109\/INFOCOM41043.2020.9155237"},{"key":"20_CR18","doi-asserted-by":"crossref","unstructured":"Russo, G.R., Mannucci, T., Cardellini, V., Presti, F.L.: Serverledge: decentralized function-as-a-service for the edge-cloud continuum. In: 2023 IEEE International Conference on Pervasive Computing and Communications (PerCom), pp. 131\u2013140. IEEE (2023)","DOI":"10.1109\/PERCOM56429.2023.10099372"},{"key":"20_CR19","doi-asserted-by":"crossref","unstructured":"Sethi, B., Addya, S.K., Ghosh, S.K.: LCS: alleviating total cold start latency in serverless applications with LRU warm container approach. In: Proceedings of the 24th International Conference on Distributed Computing and Networking, pp. 197\u2013206 (2023)","DOI":"10.1145\/3571306.3571404"},{"key":"20_CR20","unstructured":"Shahrad, M., et al.: Serverless in the wild: characterizing and optimizing the serverless workload at a large cloud provider. In: 2020 USENIX Annual Technical Conference (USENIX ATC 20), pp. 205\u2013218 (2020)"},{"key":"20_CR21","unstructured":"Shen, Y., Song, K., Tan, X., Li, D., Lu, W., Zhuang, Y.: HuggingGPT: solving AI tasks with ChatGPT and its friends in hugging face. In: Advances in Neural Information Processing Systems, vol. 36 (2024)"},{"issue":"12","key":"20_CR22","doi-asserted-by":"publisher","first-page":"13281","DOI":"10.1109\/TVT.2021.3121096","volume":"70","author":"H Tian","year":"2021","unstructured":"Tian, H., Xu, X., Qi, L., Zhang, X., Dou, W., Yu, S., Ni, Q.: CoPace: edge computation offloading and caching for self-driving with deep reinforcement learning. IEEE Trans. Veh. Technol. 70(12), 13281\u201313293 (2021)","journal-title":"IEEE Trans. Veh. Technol."},{"key":"20_CR23","doi-asserted-by":"crossref","unstructured":"Weng, Q., et al.: MLaaS in the wild: workload analysis and scheduling in large-scale heterogeneous GPU clusters. In: 19th $$\\{$$USENIX$$\\}$$ Symposium on Networked Systems Design and Implementation ($$\\{$$NSDI$$\\}$$ 22) (2022)","DOI":"10.21203\/rs.3.rs-2266264\/v1"},{"issue":"3","key":"20_CR24","doi-asserted-by":"publisher","first-page":"2093","DOI":"10.1109\/TMC.2023.3246462","volume":"23","author":"L Wu","year":"2024","unstructured":"Wu, L., Sun, P., Wang, Z., Li, Y., Yang, Y.: Computation offloading in multi-cell networks with collaborative edge-cloud computing: a game theoretic approach. IEEE Trans. Mob. Comput. 23(3), 2093\u20132106 (2024)","journal-title":"IEEE Trans. Mob. Comput."},{"issue":"9","key":"20_CR25","doi-asserted-by":"publisher","first-page":"8789","DOI":"10.1109\/TMC.2024.3355118","volume":"23","author":"K Xiao","year":"2024","unstructured":"Xiao, K., Yang, S., Li, F., Zhu, L., Chen, X., Fu, X.: Making serverless not so cold in edge clouds: a cost-effective online approach. IEEE Trans. Mob. Comput. 23(9), 8789\u20138802 (2024)","journal-title":"IEEE Trans. Mob. Comput."},{"issue":"3","key":"20_CR26","doi-asserted-by":"publisher","first-page":"1206","DOI":"10.1109\/TSC.2022.3142265","volume":"15","author":"X Xu","year":"2022","unstructured":"Xu, X., Tian, H., Zhang, X., Qi, L., He, Q., Dou, W.: DisCOV: distributed Covid-19 detection on X-ray images with edge-cloud collaboration. IEEE Trans. Serv. Comput. 15(3), 1206\u20131219 (2022)","journal-title":"IEEE Trans. Serv. Comput."},{"issue":"16","key":"20_CR27","doi-asserted-by":"publisher","first-page":"26741","DOI":"10.1109\/JIOT.2023.3288200","volume":"11","author":"H Yan","year":"2024","unstructured":"Yan, H., Li, H., Xu, X., Bilal, M.: UAV-enhanced service caching for IoT systems in extreme environments. IEEE Internet Things J. 11(16), 26741\u201326750 (2024)","journal-title":"IEEE Internet Things J."},{"key":"20_CR28","doi-asserted-by":"crossref","unstructured":"Yi, R., Cao, T., Zhou, A., Ma, X., Wang, S., Xu, M.: Boosting DNN cold inference on edge devices. In: Proceedings of the 21st Annual International Conference on Mobile Systems, Applications and Services, pp. 516\u2013529 (2023)","DOI":"10.1145\/3581791.3596842"},{"issue":"6","key":"20_CR29","doi-asserted-by":"publisher","first-page":"1118","DOI":"10.1109\/JSAC.2020.2986614","volume":"38","author":"W Zhang","year":"2020","unstructured":"Zhang, W., Zhang, Z., Zeadally, S., Chao, H.C., Leung, V.C.: Energy-efficient workload allocation and computation resource configuration in distributed cloud\/edge computing systems with stochastic workloads. IEEE J. Sel. Areas Commun. 38(6), 1118\u20131132 (2020)","journal-title":"IEEE J. Sel. Areas Commun."},{"issue":"3","key":"20_CR30","first-page":"2473","volume":"11","author":"H Zhao","year":"2024","unstructured":"Zhao, H., et al.: faaShark: an end-to-end network traffic analysis system atop serverless computing. IEEE Trans. Netw. Sci. Eng. 11(3), 2473\u20132484 (2024)","journal-title":"IEEE Trans. Netw. Sci. Eng."},{"issue":"8","key":"20_CR31","doi-asserted-by":"publisher","first-page":"8111","DOI":"10.1109\/TMC.2023.3348165","volume":"23","author":"K Zhao","year":"2024","unstructured":"Zhao, K., Zhou, Z., Jiao, L., Cai, S., Xu, F., Chen, X.: Taming serverless cold start of cloud model inference with edge computing. IEEE Trans. Mob. Comput. 23(8), 8111\u20138128 (2024)","journal-title":"IEEE Trans. Mob. Comput."},{"issue":"10","key":"20_CR32","doi-asserted-by":"publisher","first-page":"6144","DOI":"10.1109\/TMC.2022.3189050","volume":"22","author":"H Zhou","year":"2023","unstructured":"Zhou, H., Wu, T., Chen, X., He, S., Guo, D., Wu, J.: Reverse auction-based computation offloading and resource allocation in mobile cloud-edge computing. IEEE Trans. Mob. Comput. 22(10), 6144\u20136159 (2023)","journal-title":"IEEE Trans. Mob. Comput."},{"key":"20_CR33","doi-asserted-by":"crossref","unstructured":"Zhou, Y., et al.: MMRotate: a rotated object detection benchmark using PyTorch. In: Proceedings of the 30th ACM International Conference on Multimedia, pp. 7331\u20137334 (2022)","DOI":"10.1145\/3503161.3548541"}],"container-title":["Lecture Notes in Computer Science","Advanced Data Mining and Applications"],"original-title":[],"language":"en","link":[{"URL":"https:\/\/link.springer.com\/content\/pdf\/10.1007\/978-981-96-0811-9_20","content-type":"unspecified","content-version":"vor","intended-application":"similarity-checking"}],"deposited":{"date-parts":[[2024,12,12]],"date-time":"2024-12-12T18:03:44Z","timestamp":1734026624000},"score":1,"resource":{"primary":{"URL":"https:\/\/link.springer.com\/10.1007\/978-981-96-0811-9_20"}},"subtitle":[],"short-title":[],"issued":{"date-parts":[[2024,12,13]]},"ISBN":["9789819608102","9789819608119"],"references-count":33,"URL":"https:\/\/doi.org\/10.1007\/978-981-96-0811-9_20","relation":{},"ISSN":["0302-9743","1611-3349"],"issn-type":[{"type":"print","value":"0302-9743"},{"type":"electronic","value":"1611-3349"}],"subject":[],"published":{"date-parts":[[2024,12,13]]},"assertion":[{"value":"13 December 2024","order":1,"name":"first_online","label":"First Online","group":{"name":"ChapterHistory","label":"Chapter History"}},{"value":"ADMA","order":1,"name":"conference_acronym","label":"Conference Acronym","group":{"name":"ConferenceInfo","label":"Conference Information"}},{"value":"International Conference on Advanced Data Mining and Applications","order":2,"name":"conference_name","label":"Conference Name","group":{"name":"ConferenceInfo","label":"Conference Information"}},{"value":"Sydney, NSW","order":3,"name":"conference_city","label":"Conference City","group":{"name":"ConferenceInfo","label":"Conference Information"}},{"value":"Australia","order":4,"name":"conference_country","label":"Conference Country","group":{"name":"ConferenceInfo","label":"Conference Information"}},{"value":"2024","order":5,"name":"conference_year","label":"Conference Year","group":{"name":"ConferenceInfo","label":"Conference Information"}},{"value":"3 December 2024","order":7,"name":"conference_start_date","label":"Conference Start Date","group":{"name":"ConferenceInfo","label":"Conference Information"}},{"value":"5 December 2024","order":8,"name":"conference_end_date","label":"Conference End Date","group":{"name":"ConferenceInfo","label":"Conference Information"}},{"value":"20","order":9,"name":"conference_number","label":"Conference Number","group":{"name":"ConferenceInfo","label":"Conference Information"}},{"value":"adma2024","order":10,"name":"conference_id","label":"Conference ID","group":{"name":"ConferenceInfo","label":"Conference Information"}},{"value":"https:\/\/adma2024.github.io\/","order":11,"name":"conference_url","label":"Conference URL","group":{"name":"ConferenceInfo","label":"Conference Information"}}]}}