{"status":"ok","message-type":"work","message-version":"1.0.0","message":{"indexed":{"date-parts":[[2026,4,2]],"date-time":"2026-04-02T09:38:48Z","timestamp":1775122728778,"version":"3.50.1"},"reference-count":32,"publisher":"IEEE","license":[{"start":{"date-parts":[[2024,6,19]],"date-time":"2024-06-19T00:00:00Z","timestamp":1718755200000},"content-version":"stm-asf","delay-in-days":0,"URL":"https:\/\/doi.org\/10.15223\/policy-029"},{"start":{"date-parts":[[2024,6,19]],"date-time":"2024-06-19T00:00:00Z","timestamp":1718755200000},"content-version":"stm-asf","delay-in-days":0,"URL":"https:\/\/doi.org\/10.15223\/policy-037"}],"content-domain":{"domain":[],"crossmark-restriction":false},"short-container-title":[],"published-print":{"date-parts":[[2024,6,19]]},"DOI":"10.1109\/iwqos61813.2024.10682873","type":"proceedings-article","created":{"date-parts":[[2024,9,26]],"date-time":"2024-09-26T17:41:00Z","timestamp":1727372460000},"page":"1-10","source":"Crossref","is-referenced-by-count":2,"title":["Optimizing Inference Quality with SmartNIC for Recommendation System"],"prefix":"10.1109","author":[{"given":"Ruixin","family":"Shi","sequence":"first","affiliation":[{"name":"Fudan University"}]},{"given":"Ming","family":"Yan","sequence":"additional","affiliation":[{"name":"Fudan University"}]},{"given":"Jie","family":"Wu","sequence":"additional","affiliation":[{"name":"Fudan University"}]}],"member":"263","reference":[{"key":"ref1","doi-asserted-by":"publisher","DOI":"10.1145\/3470496.3533727"},{"key":"ref2","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR.2017.195"},{"key":"ref3","article-title":"Bert: Pre-training of deep bidirectional transformers for language understanding","author":"Devlin","year":"2019"},{"key":"ref4","doi-asserted-by":"publisher","DOI":"10.1145\/3523227.3546765"},{"key":"ref5","doi-asserted-by":"publisher","DOI":"10.1109\/ICDE53745.2022.00324"},{"key":"ref6","doi-asserted-by":"publisher","DOI":"10.1109\/BigData55660.2022.10021133"},{"key":"ref7","article-title":"Deep learning recommendation model for personalization and recommendation systems","author":"Naumov","year":"2019"},{"key":"ref8","article-title":"Criteo-kaggle dataset","year":"2014"},{"key":"ref9","article-title":"Disaggrec: Architecting disaggregated systems for large-scale personalized recommendation","author":"Ke","year":"2022"},{"key":"ref10","article-title":"Monolith: Real time recommendation system with collisionless embedding table","author":"Liu","year":"2022"},{"key":"ref11","doi-asserted-by":"publisher","DOI":"10.1145\/3523227.3546765"},{"key":"ref12","article-title":"Distributed hierarchical GPU parameter server for massive scale deep learning ads systems","volume-title":"Proceedings of Machine Learning and Systems 2020, MLSys 2020, Austin, TX, USA, March 2-4, 2020","author":"Zhao"},{"key":"ref13","doi-asserted-by":"publisher","DOI":"10.14778\/3489496.3489511"},{"key":"ref14","doi-asserted-by":"publisher","DOI":"10.1145\/3523227.3547387"},{"key":"ref15","doi-asserted-by":"publisher","DOI":"10.1145\/3492321.3519554"},{"key":"ref16","doi-asserted-by":"publisher","DOI":"10.14778\/3485450.3485462"},{"key":"ref17","article-title":"Nvidia bluefield dpu-2","year":"2022"},{"key":"ref18","doi-asserted-by":"publisher","DOI":"10.1145\/3577193.3593724"},{"key":"ref19","doi-asserted-by":"publisher","DOI":"10.1109\/LCA.2022.3189207"},{"key":"ref20","first-page":"967","article-title":"FpgaNIC: An FPGA-based versatile 100gb SmartNIC for GPUs","volume-title":"2022 USENIX Annual Technical Conference (USENIX ATC 22)","author":"Wang"},{"key":"ref21","doi-asserted-by":"publisher","DOI":"10.1109\/MM.2021.3139027"},{"key":"ref22","doi-asserted-by":"publisher","DOI":"10.1109\/HOTI52880.2021.00017"},{"key":"ref23","article-title":"A low-latency gpu memory copy library based on nvidia gpudirect rdma technology","year":"2023"},{"key":"ref24","article-title":"Developing a linux kernel module using gpudirect rdma","year":"2024"},{"key":"ref25","article-title":"Rdma over converged ethernet","year":"2018"},{"key":"ref26","article-title":"Criteo 1tb click logs dataset","year":"2018"},{"key":"ref27","article-title":"Click-through rate prediction","author":"Wang","year":"2014"},{"key":"ref28","article-title":"Deep learning recommendation model","year":"2019"},{"key":"ref29","doi-asserted-by":"publisher","DOI":"10.1145\/2988450.2988454"},{"key":"ref30","doi-asserted-by":"publisher","DOI":"10.24963\/ijcai.2017\/239"},{"key":"ref31","article-title":"Nvidia bluefield-3 dpu datasheet","year":"2023"},{"key":"ref32","article-title":"Doca gpunetio api document","year":"2023"}],"event":{"name":"2024 IEEE\/ACM 32nd International Symposium on Quality of Service (IWQoS)","location":"Guangzhou, China","start":{"date-parts":[[2024,6,19]]},"end":{"date-parts":[[2024,6,21]]}},"container-title":["2024 IEEE\/ACM 32nd International Symposium on Quality of Service (IWQoS)"],"original-title":[],"link":[{"URL":"http:\/\/xplorestaging.ieee.org\/ielx8\/10682818\/10682608\/10682873.pdf?arnumber=10682873","content-type":"unspecified","content-version":"vor","intended-application":"similarity-checking"}],"deposited":{"date-parts":[[2024,9,27]],"date-time":"2024-09-27T04:39:48Z","timestamp":1727411988000},"score":1,"resource":{"primary":{"URL":"https:\/\/ieeexplore.ieee.org\/document\/10682873\/"}},"subtitle":[],"short-title":[],"issued":{"date-parts":[[2024,6,19]]},"references-count":32,"URL":"https:\/\/doi.org\/10.1109\/iwqos61813.2024.10682873","relation":{},"subject":[],"published":{"date-parts":[[2024,6,19]]}}}