{"status":"ok","message-type":"work","message-version":"1.0.0","message":{"indexed":{"date-parts":[[2026,1,1]],"date-time":"2026-01-01T10:13:28Z","timestamp":1767262408851,"version":"3.37.3"},"reference-count":58,"publisher":"Institute of Electrical and Electronics Engineers (IEEE)","issue":"7","license":[{"start":{"date-parts":[[2021,7,1]],"date-time":"2021-07-01T00:00:00Z","timestamp":1625097600000},"content-version":"vor","delay-in-days":0,"URL":"https:\/\/ieeexplore.ieee.org\/Xplorehelp\/downloads\/license-information\/IEEE.html"},{"start":{"date-parts":[[2021,7,1]],"date-time":"2021-07-01T00:00:00Z","timestamp":1625097600000},"content-version":"stm-asf","delay-in-days":0,"URL":"https:\/\/doi.org\/10.15223\/policy-029"},{"start":{"date-parts":[[2021,7,1]],"date-time":"2021-07-01T00:00:00Z","timestamp":1625097600000},"content-version":"stm-asf","delay-in-days":0,"URL":"https:\/\/doi.org\/10.15223\/policy-037"}],"funder":[{"name":"National Key Research and Development Program of China","award":["2018YFB1004401"],"award-info":[{"award-number":["2018YFB1004401"]}]},{"DOI":"10.13039\/501100001809","name":"National Natural Science Foundation of China","doi-asserted-by":"publisher","award":["61802412","61732014","61972403","62072459","U1911203"],"award-info":[{"award-number":["61802412","61732014","61972403","62072459","U1911203"]}],"id":[{"id":"10.13039\/501100001809","id-type":"DOI","asserted-by":"publisher"}]},{"name":"State Key Laboratory of Computer Architecture","award":["CARCHA202007"],"award-info":[{"award-number":["CARCHA202007"]}]},{"name":"MoE AcRF Tier 1","award":["T1 251RES1824"],"award-info":[{"award-number":["T1 251RES1824"]}]},{"name":"Tier 2","award":["MOE2017-T2-1-122"],"award-info":[{"award-number":["MOE2017-T2-1-122"]}]}],"content-domain":{"domain":[],"crossmark-restriction":false},"short-container-title":["IEEE Trans. Parallel Distrib. Syst."],"published-print":{"date-parts":[[2021,7,1]]},"DOI":"10.1109\/tpds.2020.3046870","type":"journal-article","created":{"date-parts":[[2020,12,23]],"date-time":"2020-12-23T20:24:10Z","timestamp":1608755050000},"page":"1740-1752","source":"Crossref","is-referenced-by-count":23,"title":["iMLBench: A Machine Learning Benchmark Suite for CPU-GPU Integrated Architectures"],"prefix":"10.1109","volume":"32","author":[{"given":"Chenyang","family":"Zhang","sequence":"first","affiliation":[{"name":"Key Laboratory of Data Engineering and Knowledge Engineering (MOE), School of Information, Renmin University of China, Beijing, China"}]},{"ORCID":"https:\/\/orcid.org\/0000-0003-1983-7321","authenticated-orcid":false,"given":"Feng","family":"Zhang","sequence":"additional","affiliation":[{"name":"Key Laboratory of Data Engineering and Knowledge Engineering (MOE), School of Information, Renmin University of China, Beijing, China"}]},{"given":"Xiaoguang","family":"Guo","sequence":"additional","affiliation":[{"name":"Key Laboratory of Data Engineering and Knowledge Engineering (MOE), School of Information, Renmin University of China, Beijing, China"}]},{"given":"Bingsheng","family":"He","sequence":"additional","affiliation":[{"name":"School of Computing, National University of Singapore, Singapore"}]},{"given":"Xiao","family":"Zhang","sequence":"additional","affiliation":[{"name":"Key Laboratory of Data Engineering and Knowledge Engineering (MOE), School of Information, Renmin University of China, Beijing, China"}]},{"given":"Xiaoyong","family":"Du","sequence":"additional","affiliation":[{"name":"Key Laboratory of Data Engineering and Knowledge Engineering (MOE), School of Information, Renmin University of China, Beijing, China"}]}],"member":"263","reference":[{"key":"ref39","doi-asserted-by":"publisher","DOI":"10.1109\/FPL.2016.7577314"},{"key":"ref38","doi-asserted-by":"publisher","DOI":"10.1109\/FPT.2016.7929192"},{"key":"ref33","doi-asserted-by":"publisher","DOI":"10.1109\/TKDE.2019.2940184"},{"key":"ref32","doi-asserted-by":"publisher","DOI":"10.1109\/CGO.2017.7863726"},{"key":"ref31","doi-asserted-by":"publisher","DOI":"10.1109\/HPCA.2017.42"},{"key":"ref30","doi-asserted-by":"publisher","DOI":"10.1109\/MM.2015.71"},{"key":"ref37","doi-asserted-by":"publisher","DOI":"10.1145\/1735688.1735702"},{"key":"ref36","doi-asserted-by":"publisher","DOI":"10.1145\/1454115.1454152"},{"key":"ref35","doi-asserted-by":"publisher","DOI":"10.1109\/CogMI48466.2019.00029"},{"year":"2019","key":"ref34"},{"key":"ref28","doi-asserted-by":"publisher","DOI":"10.1109\/JIOT.2020.2980549"},{"key":"ref27","first-page":"83","article-title":"APUNet: Revitalizing GPU as packet processing accelerator","author":"go","year":"2017","journal-title":"Proc 14th USENIX Conf Netw Syst Des Implementation"},{"year":"2020","key":"ref29"},{"key":"ref2","doi-asserted-by":"publisher","DOI":"10.1109\/MM.2016.24"},{"key":"ref1","doi-asserted-by":"publisher","DOI":"10.1007\/s11704-018-7386-4"},{"key":"ref20","doi-asserted-by":"publisher","DOI":"10.1109\/TKDE.2020.2975652"},{"key":"ref22","doi-asserted-by":"publisher","DOI":"10.1109\/IPDPSW.2015.144"},{"key":"ref21","doi-asserted-by":"publisher","DOI":"10.1145\/3225058.3225077"},{"key":"ref24","doi-asserted-by":"publisher","DOI":"10.1109\/ICDE.2017.120"},{"key":"ref23","doi-asserted-by":"publisher","DOI":"10.1109\/SC.2012.16"},{"year":"0","key":"ref26"},{"key":"ref25","first-page":"633","article-title":"FineStream: Fine-grained window-based stream processing on CPU-GPU integrated architectures","author":"zhang","year":"2020","journal-title":"Proc USENIX Annu Tech Conf"},{"key":"ref50","first-page":"605","article-title":"Application of k-nearest neighbor (KNN) approach for predicting economic events: Theoretical background","volume":"3","author":"imandoust","year":"2013","journal-title":"Int J Eng Res Appl"},{"key":"ref51","doi-asserted-by":"publisher","DOI":"10.1103\/PhysRevA.94.022342"},{"key":"ref58","article-title":"Is FPGA useful for hash joins?","author":"chen","year":"2020","journal-title":"Proc Annu Conf Innovative Data Syst Res"},{"key":"ref57","doi-asserted-by":"publisher","DOI":"10.1109\/MM.2007.56"},{"key":"ref56","doi-asserted-by":"publisher","DOI":"10.1109\/ISPASS.2016.7482093"},{"key":"ref55","doi-asserted-by":"publisher","DOI":"10.1145\/3332466.3374520"},{"key":"ref54","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR.2016.435"},{"key":"ref53","doi-asserted-by":"publisher","DOI":"10.1007\/s41019-020-00123-3"},{"year":"2020","key":"ref52"},{"key":"ref10","doi-asserted-by":"publisher","DOI":"10.1109\/MM.2020.2974843"},{"key":"ref11","doi-asserted-by":"publisher","DOI":"10.14778\/3231751.3231770"},{"key":"ref40","doi-asserted-by":"publisher","DOI":"10.1109\/4434.708248"},{"year":"2012","key":"ref12"},{"key":"ref13","first-page":"347","article-title":"HeteroSpark: A heterogeneous CPU\/GPU spark platform for machine learning algorithms","author":"li","year":"2015","journal-title":"Proc IEEE Int Conf Netw Archit Storage"},{"year":"2018","key":"ref14"},{"year":"2018","key":"ref15"},{"key":"ref16","doi-asserted-by":"publisher","DOI":"10.1109\/TPDS.2019.2932066"},{"key":"ref17","doi-asserted-by":"publisher","DOI":"10.1145\/2597652.2597658"},{"key":"ref18","doi-asserted-by":"publisher","DOI":"10.1145\/3158643"},{"key":"ref19","doi-asserted-by":"publisher","DOI":"10.1109\/ASE.2017.8115687"},{"key":"ref4","first-page":"1","article-title":"NVIDIA&#x2019;S tegra K1 system-on-chip","author":"ditty","year":"2014","journal-title":"Proc HOT Chip Symp"},{"year":"2014","key":"ref3","article-title":"The compute architecture of Intel processor graphics Gen7.5"},{"key":"ref6","doi-asserted-by":"publisher","DOI":"10.1109\/IISWC.2009.5306797"},{"key":"ref5","doi-asserted-by":"publisher","DOI":"10.1109\/TPDS.2016.2586074"},{"key":"ref8","article-title":"Parboil: A revised benchmark suite for scientific and commercial throughput computing","author":"stratton","year":"2012","journal-title":"Center for Reliable and High-Performance Computing"},{"key":"ref7","doi-asserted-by":"publisher","DOI":"10.1145\/1454115.1454128"},{"key":"ref49","doi-asserted-by":"publisher","DOI":"10.1109\/ICOIN.2019.8717981"},{"key":"ref9","doi-asserted-by":"publisher","DOI":"10.1186\/s13040-017-0154-4"},{"year":"2017","key":"ref46"},{"year":"2018","key":"ref45"},{"article-title":"Deep500&#x2013;A deep learning meta-framework and HPC benchmark","year":"2018","author":"huber","key":"ref48"},{"key":"ref47","first-page":"3","article-title":"AIBench: Towards scalable and comprehensive datacenter AI benchmarking","author":"gao","year":"2018","journal-title":"Proc Int Symp Benchmarking Measuring Optim"},{"article-title":"A survey of model compression and acceleration for deep neural networks","year":"2017","author":"cheng","key":"ref42"},{"key":"ref41","doi-asserted-by":"publisher","DOI":"10.1109\/SAAHPC.2011.29"},{"article-title":"PolyBench: The polyhedral benchmark suite","year":"2012","author":"pouchet","key":"ref44"},{"key":"ref43","doi-asserted-by":"publisher","DOI":"10.1145\/1815961.1815998"}],"container-title":["IEEE Transactions on Parallel and Distributed Systems"],"original-title":[],"link":[{"URL":"http:\/\/xplorestaging.ieee.org\/ielx7\/71\/9357351\/09305972.pdf?arnumber=9305972","content-type":"unspecified","content-version":"vor","intended-application":"similarity-checking"}],"deposited":{"date-parts":[[2025,1,15]],"date-time":"2025-01-15T20:19:55Z","timestamp":1736972395000},"score":1,"resource":{"primary":{"URL":"https:\/\/ieeexplore.ieee.org\/document\/9305972\/"}},"subtitle":[],"short-title":[],"issued":{"date-parts":[[2021,7,1]]},"references-count":58,"journal-issue":{"issue":"7"},"URL":"https:\/\/doi.org\/10.1109\/tpds.2020.3046870","relation":{},"ISSN":["1045-9219","1558-2183","2161-9883"],"issn-type":[{"type":"print","value":"1045-9219"},{"type":"electronic","value":"1558-2183"},{"type":"electronic","value":"2161-9883"}],"subject":[],"published":{"date-parts":[[2021,7,1]]}}}