{"status":"ok","message-type":"work","message-version":"1.0.0","message":{"indexed":{"date-parts":[[2026,5,9]],"date-time":"2026-05-09T17:33:18Z","timestamp":1778347998838,"version":"3.51.4"},"reference-count":58,"publisher":"Institute of Electrical and Electronics Engineers (IEEE)","issue":"9","license":[{"start":{"date-parts":[[2024,9,1]],"date-time":"2024-09-01T00:00:00Z","timestamp":1725148800000},"content-version":"vor","delay-in-days":0,"URL":"https:\/\/ieeexplore.ieee.org\/Xplorehelp\/downloads\/license-information\/IEEE.html"},{"start":{"date-parts":[[2024,9,1]],"date-time":"2024-09-01T00:00:00Z","timestamp":1725148800000},"content-version":"stm-asf","delay-in-days":0,"URL":"https:\/\/doi.org\/10.15223\/policy-029"},{"start":{"date-parts":[[2024,9,1]],"date-time":"2024-09-01T00:00:00Z","timestamp":1725148800000},"content-version":"stm-asf","delay-in-days":0,"URL":"https:\/\/doi.org\/10.15223\/policy-037"}],"funder":[{"name":"Research Grants Council of Hong Kong","award":["11202623"],"award-info":[{"award-number":["11202623"]}]},{"name":"CityU SRG-Fd","award":["7005658"],"award-info":[{"award-number":["7005658"]}]},{"DOI":"10.13039\/100019527","name":"Aromatic Plant Research Center","doi-asserted-by":"publisher","id":[{"id":"10.13039\/100019527","id-type":"DOI","asserted-by":"publisher"}]},{"DOI":"10.13039\/100007567","name":"City University of Hong Kong","doi-asserted-by":"publisher","award":["9610633"],"award-info":[{"award-number":["9610633"]}],"id":[{"id":"10.13039\/100007567","id-type":"DOI","asserted-by":"publisher"}]}],"content-domain":{"domain":[],"crossmark-restriction":false},"short-container-title":["IEEE Trans. on Mobile Comput."],"published-print":{"date-parts":[[2024,9]]},"DOI":"10.1109\/tmc.2024.3355764","type":"journal-article","created":{"date-parts":[[2024,1,18]],"date-time":"2024-01-18T18:39:18Z","timestamp":1705603158000},"page":"8935-8950","source":"Crossref","is-referenced-by-count":17,"title":["SwapNet: Efficient Swapping for DNN Inference on Edge AI Devices Beyond the Memory Budget"],"prefix":"10.1109","volume":"23","author":[{"ORCID":"https:\/\/orcid.org\/0000-0002-0149-9857","authenticated-orcid":false,"given":"Kun","family":"Wang","sequence":"first","affiliation":[{"name":"Department of Computer Science, City University of Hong Kong, Hong Kong, China"}]},{"ORCID":"https:\/\/orcid.org\/0000-0002-8211-3564","authenticated-orcid":false,"given":"Jiani","family":"Cao","sequence":"additional","affiliation":[{"name":"Department of Computer Science, City University of Hong Kong, Hong Kong, China"}]},{"ORCID":"https:\/\/orcid.org\/0000-0002-5457-6967","authenticated-orcid":false,"given":"Zimu","family":"Zhou","sequence":"additional","affiliation":[{"name":"School of Data Science, City University of Hong Kong, Hong Kong, China"}]},{"ORCID":"https:\/\/orcid.org\/0000-0002-3296-3392","authenticated-orcid":false,"given":"Zhenjiang","family":"Li","sequence":"additional","affiliation":[{"name":"Department of Computer Science, City University of Hong Kong, Hong Kong, China"}]}],"member":"263","reference":[{"key":"ref1","article-title":"NVIDIA Jetson\n      modules","year":"2014"},{"key":"ref2","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR.2016.90"},{"key":"ref3","article-title":"Very deep\n      convolutional networks for large-scale image recognition","author":"Simonyan","year":"2014"},{"key":"ref4","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR.2015.7298965"},{"key":"ref5","article-title":"YOLOV3: An\n      incremental improvement","author":"Redmon","year":"2018"},{"key":"ref6","doi-asserted-by":"publisher","DOI":"10.1109\/RTAS.2019.00033"},{"key":"ref7","doi-asserted-by":"publisher","DOI":"10.1109\/DAC18072.2020.9218618"},{"key":"ref8","doi-asserted-by":"publisher","DOI":"10.1109\/MRA.2006.1638022"},{"key":"ref9","article-title":"RosMaster\n      X3","year":"2022"},{"key":"ref10","first-page":"138","article-title":"Deep\n      compression: Compressing deep neural networks with pruning, trained quantization and Huffman\n      coding","volume-title":"Proc. Int. Conf. Learn. Representations","author":"Han"},{"key":"ref11","doi-asserted-by":"publisher","DOI":"10.1145\/3210240.3210337"},{"key":"ref12","first-page":"222","article-title":"mGEMM:\n      Low-latency convolution with minimal memory overhead optimized for mobile\n      devices","volume-title":"Proc. 20th Annu. Int. Conf. Mobile Syst. Appl.\n      Serv.","author":"Park"},{"key":"ref13","doi-asserted-by":"publisher","DOI":"10.1145\/3300061.3345448"},{"key":"ref14","first-page":"186","article-title":"NeuLens:\n      Spatial-based dynamic acceleration of convolutional neural networks on\n     edge","volume-title":"Proc. 28th Annu. Int. Conf. Mobile Comput.\n      Netw.","author":"Hou"},{"key":"ref15","article-title":"Model\n      compression via distillation and quantization","author":"Polino","year":"2018"},{"key":"ref16","doi-asserted-by":"publisher","DOI":"10.1007\/978-3-030-05318-5_3"},{"key":"ref17","doi-asserted-by":"publisher","DOI":"10.1145\/3093337.3037698"},{"key":"ref18","doi-asserted-by":"publisher","DOI":"10.1145\/3560905.3568531"},{"key":"ref19","doi-asserted-by":"publisher","DOI":"10.1145\/3495243.3560551"},{"key":"ref20","doi-asserted-by":"publisher","DOI":"10.1145\/3300061.3345447"},{"key":"ref21","doi-asserted-by":"publisher","DOI":"10.1109\/TWC.2019.2946140"},{"key":"ref22","doi-asserted-by":"publisher","DOI":"10.1145\/3478073"},{"key":"ref23","article-title":"TensorFlow-Lite","year":"2023"},{"key":"ref24","article-title":"MACE","year":"2022"},{"key":"ref25","article-title":"NCNN","year":"2023"},{"key":"ref26","doi-asserted-by":"publisher","DOI":"10.1145\/3447993.3448625"},{"key":"ref27","doi-asserted-by":"publisher","DOI":"10.1145\/3498361.3538932"},{"key":"ref28","doi-asserted-by":"publisher","DOI":"10.1145\/3498361.3538948"},{"key":"ref29","doi-asserted-by":"publisher","DOI":"10.1145\/3498361.3538928"},{"key":"ref30","article-title":"CUDA toolkit\n      documentation","year":"2023"},{"key":"ref31","article-title":"Torch-Pruning-2022","year":"2022"},{"key":"ref32","article-title":"PyTorch","year":"2023"},{"key":"ref33","article-title":"llama-2","year":"2023"},{"key":"ref34","doi-asserted-by":"publisher","DOI":"10.3390\/s19092048"},{"key":"ref35","doi-asserted-by":"publisher","DOI":"10.1145\/3485730.3485937"},{"key":"ref36","doi-asserted-by":"publisher","DOI":"10.1109\/JPROC.2017.2761740"},{"key":"ref37","article-title":"Opencl","year":"2009"},{"key":"ref38","article-title":"Metal","year":"2014"},{"key":"ref39","article-title":"Vulkan","year":"2016"},{"key":"ref40","doi-asserted-by":"publisher","DOI":"10.1145\/3409963.3410493"},{"key":"ref41","doi-asserted-by":"publisher","DOI":"10.1016\/j.sysarc.2019.01.011"},{"key":"ref42","article-title":"PyTorch dispatcher\n      mechanism","year":"2023"},{"key":"ref43","article-title":"Unified memory in\n      CUDA","year":"2013"},{"key":"ref44","first-page":"265","article-title":"TensorFlow: A system for large-scale machine\n      learning","volume-title":"Proc. 12th USENIX Conf. Operating Syst. Des.\n      Implementation","author":"Abadi"},{"key":"ref45","article-title":"MNN","year":"2023"},{"key":"ref47","article-title":"Linux DMAEngine documentation","year":"2023"},{"key":"ref48","article-title":"NVIDIA CUDA\n      compiler driver NVCC","year":"2023"},{"key":"ref49","article-title":"NVIDIA visual\n      profiler","year":"2022"},{"key":"ref50","doi-asserted-by":"publisher","DOI":"10.1016\/j.neucom.2021.08.144"},{"key":"ref51","article-title":"INA3221\n      power monitor","year":"2016"},{"key":"ref52","doi-asserted-by":"publisher","DOI":"10.1145\/3448125"},{"key":"ref53","doi-asserted-by":"publisher","DOI":"10.1145\/3384419.3430898"},{"key":"ref54","doi-asserted-by":"publisher","DOI":"10.1145\/3560905.3568520"},{"key":"ref55","doi-asserted-by":"publisher","DOI":"10.1145\/3485730.3485938"},{"key":"ref56","article-title":"Enabling large\n      neural networks on tiny microcontrollers with swapping","author":"Miao","year":"2021"},{"key":"ref57","doi-asserted-by":"publisher","DOI":"10.1145\/3373376.3378530"},{"key":"ref58","doi-asserted-by":"publisher","DOI":"10.1109\/TPDS.2022.3222509"},{"key":"ref59","doi-asserted-by":"publisher","DOI":"10.48550\/ARXIV.1706.03762"}],"container-title":["IEEE Transactions on Mobile Computing"],"original-title":[],"link":[{"URL":"http:\/\/xplorestaging.ieee.org\/ielx7\/7755\/10627925\/10403957.pdf?arnumber=10403957","content-type":"unspecified","content-version":"vor","intended-application":"similarity-checking"}],"deposited":{"date-parts":[[2024,8,7]],"date-time":"2024-08-07T18:04:48Z","timestamp":1723053888000},"score":1,"resource":{"primary":{"URL":"https:\/\/ieeexplore.ieee.org\/document\/10403957\/"}},"subtitle":[],"short-title":[],"issued":{"date-parts":[[2024,9]]},"references-count":58,"journal-issue":{"issue":"9"},"URL":"https:\/\/doi.org\/10.1109\/tmc.2024.3355764","relation":{},"ISSN":["1536-1233","1558-0660","2161-9875"],"issn-type":[{"value":"1536-1233","type":"print"},{"value":"1558-0660","type":"electronic"},{"value":"2161-9875","type":"electronic"}],"subject":[],"published":{"date-parts":[[2024,9]]}}}