{"status":"ok","message-type":"work","message-version":"1.0.0","message":{"indexed":{"date-parts":[[2026,6,6]],"date-time":"2026-06-06T01:09:03Z","timestamp":1780708143165,"version":"3.54.1"},"publisher-location":"New York, NY, USA","reference-count":44,"publisher":"ACM","license":[{"start":{"date-parts":[[2023,6,21]],"date-time":"2023-06-21T00:00:00Z","timestamp":1687305600000},"content-version":"vor","delay-in-days":0,"URL":"https:\/\/www.acm.org\/publications\/policies\/copyright_policy#Background"}],"content-domain":{"domain":["dl.acm.org"],"crossmark-restriction":true},"short-container-title":[],"published-print":{"date-parts":[[2023,6,21]]},"DOI":"10.1145\/3577193.3593724","type":"proceedings-article","created":{"date-parts":[[2023,6,20]],"date-time":"2023-06-20T18:47:05Z","timestamp":1687286825000},"page":"336-347","update-policy":"https:\/\/doi.org\/10.1145\/crossmark-policy","source":"Crossref","is-referenced-by-count":21,"title":["Software-Hardware Co-design of Heterogeneous SmartNIC System for Recommendation Models Inference and Training"],"prefix":"10.1145","author":[{"ORCID":"https:\/\/orcid.org\/0000-0001-5872-4464","authenticated-orcid":false,"given":"Anqi","family":"Guo","sequence":"first","affiliation":[{"name":"Boston University, Boston, USA"},{"name":"University of Rochester, Rochester, USA"}],"role":[{"vocabulary":"crossref","role":"author"}]},{"ORCID":"https:\/\/orcid.org\/0009-0005-8513-9566","authenticated-orcid":false,"given":"Yuchen","family":"Hao","sequence":"additional","affiliation":[{"name":"Meta Platforms, San Francisco, USA"}],"role":[{"vocabulary":"crossref","role":"author"}]},{"ORCID":"https:\/\/orcid.org\/0009-0006-2039-0853","authenticated-orcid":false,"given":"Chunshu","family":"Wu","sequence":"additional","affiliation":[{"name":"Boston University, Boston, USA"}],"role":[{"vocabulary":"crossref","role":"author"}]},{"ORCID":"https:\/\/orcid.org\/0000-0003-2893-9194","authenticated-orcid":false,"given":"Pouya","family":"Haghi","sequence":"additional","affiliation":[{"name":"Boston University, Boston, USA"}],"role":[{"vocabulary":"crossref","role":"author"}]},{"ORCID":"https:\/\/orcid.org\/0009-0009-2805-6018","authenticated-orcid":false,"given":"Zhenyu","family":"Pan","sequence":"additional","affiliation":[{"name":"University of Rochester, Rochester, USA"}],"role":[{"vocabulary":"crossref","role":"author"}]},{"ORCID":"https:\/\/orcid.org\/0000-0002-0208-096X","authenticated-orcid":false,"given":"Min","family":"Si","sequence":"additional","affiliation":[{"name":"Meta Platforms, San Francisco, United States of America"}],"role":[{"vocabulary":"crossref","role":"author"}]},{"ORCID":"https:\/\/orcid.org\/0000-0001-5422-4497","authenticated-orcid":false,"given":"Dingwen","family":"Tao","sequence":"additional","affiliation":[{"name":"Indiana University, Bloomington, United States of America"}],"role":[{"vocabulary":"crossref","role":"author"}]},{"ORCID":"https:\/\/orcid.org\/0000-0003-3734-9137","authenticated-orcid":false,"given":"Ang","family":"Li","sequence":"additional","affiliation":[{"name":"Pacific Northwest National Laboratory, Richland, United States of America"}],"role":[{"vocabulary":"crossref","role":"author"}]},{"ORCID":"https:\/\/orcid.org\/0000-0002-3443-9113","authenticated-orcid":false,"given":"Martin","family":"Herbordt","sequence":"additional","affiliation":[{"name":"Boston University, Boston, United States of America"}],"role":[{"vocabulary":"crossref","role":"author"}]},{"ORCID":"https:\/\/orcid.org\/0000-0002-3644-2922","authenticated-orcid":false,"given":"Tong","family":"Geng","sequence":"additional","affiliation":[{"name":"University of Rochester, Rochester, United States of America"}],"role":[{"vocabulary":"crossref","role":"author"}]}],"member":"320","published-online":{"date-parts":[[2023,6,21]]},"reference":[{"key":"e_1_3_2_1_1_1","doi-asserted-by":"publisher","DOI":"10.48550\/ARXIV.1603.04467"},{"key":"e_1_3_2_1_2_1","doi-asserted-by":"publisher","DOI":"10.1145\/3506713"},{"key":"e_1_3_2_1_3_1","unstructured":"Broadcom. 2019. Stingray PS250 2x50-Gb High-Performance Data Center Smart-NIC. https:\/\/docs.broadcom.com\/doc\/PS250-PB  Broadcom. 2019. Stingray PS250 2x50-Gb High-Performance Data Center Smart-NIC. https:\/\/docs.broadcom.com\/doc\/PS250-PB"},{"key":"e_1_3_2_1_4_1","doi-asserted-by":"publisher","DOI":"10.1109\/MICRO.2016.7783710"},{"key":"e_1_3_2_1_5_1","doi-asserted-by":"publisher","DOI":"10.1145\/2959100.2959190"},{"key":"e_1_3_2_1_6_1","doi-asserted-by":"publisher","DOI":"10.48550\/ARXIV.1811.05922"},{"key":"e_1_3_2_1_7_1","unstructured":"facebookresearch. 2019. Deep Learning Recommendation Model for Personalization and Recommendation Systems. https:\/\/github.com\/facebookresearch\/dlrm  facebookresearch. 2019. Deep Learning Recommendation Model for Personalization and Recommendation Systems. https:\/\/github.com\/facebookresearch\/dlrm"},{"key":"e_1_3_2_1_8_1","doi-asserted-by":"publisher","DOI":"10.1145\/2843948"},{"key":"e_1_3_2_1_9_1","doi-asserted-by":"publisher","DOI":"10.1109\/FCCM53951.2022.9786193"},{"key":"e_1_3_2_1_10_1","doi-asserted-by":"publisher","DOI":"10.1109\/FPL57034.2022.00071"},{"key":"e_1_3_2_1_11_1","doi-asserted-by":"publisher","DOI":"10.48550\/ARXIV.1906.03109"},{"key":"e_1_3_2_1_12_1","doi-asserted-by":"publisher","DOI":"10.1002\/cpe.6769"},{"key":"e_1_3_2_1_13_1","volume-title":"FLASH: FPGA-Accelerated Smart Switches with GCN Case Study. In ICS 2023: International Conference on Supercomputing.","author":"Haghi P.","unstructured":"P. Haghi , W. Krska , C. Tan , T. Geng , P.H. Chen , C. Greenwood , A. Guo , T. Hines , C. Wu , A. Li , A. Skjellum , and M.C. Herbordt . 2023 . FLASH: FPGA-Accelerated Smart Switches with GCN Case Study. In ICS 2023: International Conference on Supercomputing. P. Haghi, W. Krska, C. Tan, T. Geng, P.H. Chen, C. Greenwood, A. Guo, T. Hines, C. Wu, A. Li, A. Skjellum, and M.C. Herbordt. 2023. FLASH: FPGA-Accelerated Smart Switches with GCN Case Study. In ICS 2023: International Conference on Supercomputing."},{"key":"e_1_3_2_1_14_1","doi-asserted-by":"publisher","DOI":"10.1109\/HPCA.2018.00059"},{"key":"e_1_3_2_1_15_1","doi-asserted-by":"publisher","DOI":"10.1145\/3126908.3126970"},{"key":"e_1_3_2_1_16_1","unstructured":"Intel. 2021. Intel\u00ae Infrastructure Processing Unit (Intel\u00ae IPU). https:\/\/www.intel.com\/content\/www\/us\/en\/products\/network-io\/smartnic.html  Intel. 2021. Intel\u00ae Infrastructure Processing Unit (Intel\u00ae IPU). https:\/\/www.intel.com\/content\/www\/us\/en\/products\/network-io\/smartnic.html"},{"key":"e_1_3_2_1_17_1","unstructured":"Intel. 2022. Intel\u00ae FPGA SmartNIC. https:\/\/www.intel.com\/content\/www\/us\/en\/products\/details\/fpga\/platforms\/smartnic.html  Intel. 2022. Intel\u00ae FPGA SmartNIC. https:\/\/www.intel.com\/content\/www\/us\/en\/products\/details\/fpga\/platforms\/smartnic.html"},{"key":"e_1_3_2_1_18_1","doi-asserted-by":"publisher","DOI":"10.1109\/FPGA.2003.1227273"},{"key":"e_1_3_2_1_19_1","doi-asserted-by":"publisher","DOI":"10.48550\/ARXIV.2010.05894"},{"key":"e_1_3_2_1_20_1","unstructured":"Jie. 2020. Training Deep Learning Recommendation Model with Quantized Collective Communications.  Jie. 2020. Training Deep Learning Recommendation Model with Quantized Collective Communications."},{"key":"e_1_3_2_1_21_1","doi-asserted-by":"publisher","DOI":"10.1109\/HOTI51249.2020.00018"},{"key":"e_1_3_2_1_22_1","doi-asserted-by":"publisher","DOI":"10.1145\/3470496.3527386"},{"key":"e_1_3_2_1_23_1","doi-asserted-by":"publisher","DOI":"10.48550\/ARXIV.1909.11942"},{"key":"e_1_3_2_1_24_1","doi-asserted-by":"publisher","DOI":"10.48550\/ARXIV.1802.07389"},{"key":"e_1_3_2_1_25_1","doi-asserted-by":"publisher","DOI":"10.48550\/ARXIV.1712.01887"},{"key":"e_1_3_2_1_26_1","doi-asserted-by":"publisher","DOI":"10.1145\/3470496.3533727"},{"key":"e_1_3_2_1_27_1","doi-asserted-by":"publisher","DOI":"10.48550\/ARXIV.2003.09518"},{"key":"e_1_3_2_1_28_1","doi-asserted-by":"publisher","DOI":"10.48550\/ARXIV.1906.00091"},{"key":"e_1_3_2_1_29_1","unstructured":"Nvidia. 2021. NVIDIA BLUEFIELD-2 DPU. https:\/\/www.nvidia.com\/content\/dam\/en-zz\/Solutions\/Data-Center\/documents\/datasheet-nvidia-bluefield-2-dpu.pdf  Nvidia. 2021. NVIDIA BLUEFIELD-2 DPU. https:\/\/www.nvidia.com\/content\/dam\/en-zz\/Solutions\/Data-Center\/documents\/datasheet-nvidia-bluefield-2-dpu.pdf"},{"key":"e_1_3_2_1_30_1","doi-asserted-by":"publisher","DOI":"10.48550\/ARXIV.1811.09886"},{"key":"e_1_3_2_1_31_1","doi-asserted-by":"publisher","DOI":"10.1145\/3295500.3356153"},{"key":"e_1_3_2_1_32_1","doi-asserted-by":"publisher","DOI":"10.48550\/ARXIV.1802.05799"},{"key":"e_1_3_2_1_33_1","doi-asserted-by":"publisher","DOI":"10.1145\/3503222.3507777"},{"key":"e_1_3_2_1_34_1","doi-asserted-by":"publisher","DOI":"10.1109\/HPEC49654.2021.9622807"},{"key":"e_1_3_2_1_35_1","doi-asserted-by":"publisher","DOI":"10.1145\/3394486.3403059"},{"key":"e_1_3_2_1_36_1","doi-asserted-by":"publisher","DOI":"10.1109\/MIC.2017.72"},{"key":"e_1_3_2_1_37_1","doi-asserted-by":"publisher","DOI":"10.48550\/ARXIV.0902.2206"},{"key":"e_1_3_2_1_38_1","doi-asserted-by":"publisher","DOI":"10.1145\/3445814.3446763"},{"key":"e_1_3_2_1_39_1","unstructured":"Xilinx. 2020. Alveo U25 SmartNIC Accelerator Card. https:\/\/www.xilinx.com\/products\/boards-and-kits\/alveo\/u25.html  Xilinx. 2020. Alveo U25 SmartNIC Accelerator Card. https:\/\/www.xilinx.com\/products\/boards-and-kits\/alveo\/u25.html"},{"key":"e_1_3_2_1_40_1","unstructured":"Xilinx. 2022. The Industry's First SmartNIC With Composable Hardware. https:\/\/www.xilinx.com\/applications\/data-center\/network-acceleration\/alveo-sn1000.html  Xilinx. 2022. The Industry's First SmartNIC With Composable Hardware. https:\/\/www.xilinx.com\/applications\/data-center\/network-acceleration\/alveo-sn1000.html"},{"key":"e_1_3_2_1_41_1","doi-asserted-by":"publisher","DOI":"10.48550\/ARXIV.2010.11305"},{"key":"e_1_3_2_1_42_1","doi-asserted-by":"publisher","DOI":"10.48550\/ARXIV.2101.11714"},{"key":"e_1_3_2_1_43_1","doi-asserted-by":"publisher","DOI":"10.48550\/ARXIV.2003.05622"},{"key":"e_1_3_2_1_44_1","doi-asserted-by":"publisher","DOI":"10.1109\/FPL53798.2021.00057"}],"event":{"name":"ICS '23: 37th International Conference on Supercomputing","location":"Orlando FL USA","acronym":"ICS '23","sponsor":["SIGARCH ACM Special Interest Group on Computer Architecture"]},"container-title":["Proceedings of the 37th International Conference on Supercomputing"],"original-title":[],"link":[{"URL":"https:\/\/dl.acm.org\/doi\/10.1145\/3577193.3593724","content-type":"unspecified","content-version":"vor","intended-application":"text-mining"}],"deposited":{"date-parts":[[2025,6,17]],"date-time":"2025-06-17T16:47:32Z","timestamp":1750178852000},"score":1,"resource":{"primary":{"URL":"https:\/\/dl.acm.org\/doi\/10.1145\/3577193.3593724"}},"subtitle":[],"short-title":[],"issued":{"date-parts":[[2023,6,21]]},"references-count":44,"alternative-id":["10.1145\/3577193.3593724","10.1145\/3577193"],"URL":"https:\/\/doi.org\/10.1145\/3577193.3593724","relation":{},"subject":[],"published":{"date-parts":[[2023,6,21]]},"assertion":[{"value":"2023-06-21","order":2,"name":"published","label":"Published","group":{"name":"publication_history","label":"Publication History"}}]}}