{"status":"ok","message-type":"work","message-version":"1.0.0","message":{"indexed":{"date-parts":[[2025,9,11]],"date-time":"2025-09-11T05:35:15Z","timestamp":1757568915914,"version":"3.44.0"},"publisher-location":"New York, NY, USA","reference-count":35,"publisher":"ACM","license":[{"start":{"date-parts":[[2023,10,25]],"date-time":"2023-10-25T00:00:00Z","timestamp":1698192000000},"content-version":"vor","delay-in-days":0,"URL":"https:\/\/www.acm.org\/publications\/policies\/copyright_policy#Background"}],"content-domain":{"domain":["dl.acm.org"],"crossmark-restriction":true},"short-container-title":[],"published-print":{"date-parts":[[2023,10,25]]},"DOI":"10.1145\/3639856.3639878","type":"proceedings-article","created":{"date-parts":[[2024,5,17]],"date-time":"2024-05-17T11:49:10Z","timestamp":1715946550000},"page":"1-9","update-policy":"https:\/\/doi.org\/10.1145\/crossmark-policy","source":"Crossref","is-referenced-by-count":1,"title":["Hetero-Rec++: Modelling-based Robust and Optimal Deployment of Embeddings Recommendations"],"prefix":"10.1145","author":[{"ORCID":"https:\/\/orcid.org\/0000-0002-8592-3132","authenticated-orcid":false,"given":"Ashwin","family":"Krishnan","sequence":"first","affiliation":[{"name":"TCS Research, IN"}]},{"ORCID":"https:\/\/orcid.org\/0000-0002-9001-0629","authenticated-orcid":false,"given":"Manoj","family":"Nambiar","sequence":"additional","affiliation":[{"name":"TCS, IN"}]},{"ORCID":"https:\/\/orcid.org\/0000-0002-3712-1784","authenticated-orcid":false,"given":"Rekha","family":"Singhal","sequence":"additional","affiliation":[{"name":"TCS, IN"}]}],"member":"320","published-online":{"date-parts":[[2024,5,17]]},"reference":[{"key":"e_1_3_2_1_1_1","unstructured":"[n.d.].. https:\/\/www.intel.com\/content\/www\/us\/en\/products\/sku\/120473\/intel-xeon-gold-5118-processor-16-5m-cache-2-30-ghz\/specifications.html"},{"key":"e_1_3_2_1_2_1","unstructured":"[n.d.]. CriteoLabs. Terabyte click logs. https:\/\/ailab.criteo.com\/download-criteo-1tb-click-logs-dataset\/"},{"key":"e_1_3_2_1_3_1","unstructured":"Xilinx Inc. 2017. Block Memory Generator v8.3. Xilinx Inc. https:\/\/docs.xilinx.com\/v\/u\/8.3-English\/pg058-blk-mem-gen"},{"key":"e_1_3_2_1_4_1","unstructured":"Xilinx Inc. 2021. UltraRAM Readback and Writeback v1.0. Xilinx Inc. https:\/\/www.xilinx.com\/content\/dam\/xilinx\/support\/documents\/ip_documentation\/uram_rd_back\/v1_0\/pg356-uram-rdback.pdf"},{"key":"e_1_3_2_1_5_1","doi-asserted-by":"crossref","unstructured":"Muhammad Adnan Yassaman\u00a0Ebrahimzadeh Maboud Divya Mahajan and Prashant\u00a0J. Nair. 2021. Accelerating Recommendation System Training by Leveraging Popular Choices. arxiv:2103.00686\u00a0[cs.IR]","DOI":"10.14778\/3485450.3485462"},{"key":"e_1_3_2_1_6_1","unstructured":"Alimama. 2018. Ad Display\/Click Data on Taobao.com. https:\/\/tianchi.aliyun.com\/dataset\/dataDetail?dataId=56&lang=en-us"},{"key":"e_1_3_2_1_7_1","unstructured":"Xilinx Inc. 2021. Alveo u280 data center accelerator card. Xilinx Inc. https:\/\/www.xilinx.com\/products\/boards-and-kits\/alveo\/u280.html"},{"key":"e_1_3_2_1_8_1","unstructured":"Avazu. 2015. Avazu Dataset. https:\/\/www.kaggle.com\/c\/avazu-ctr-prediction"},{"key":"e_1_3_2_1_9_1","doi-asserted-by":"publisher","DOI":"10.1109\/ICCCN49398.2020.9209730"},{"key":"e_1_3_2_1_10_1","volume-title":"NISER: Normalized item and session representations to handle popularity bias. arXiv preprint arXiv:1909.04276","author":"Gupta Priyanka","year":"2019","unstructured":"Priyanka Gupta, Diksha Garg, Pankaj Malhotra, Lovekesh Vig, and Gautam Shroff. 2019. NISER: Normalized item and session representations to handle popularity bias. arXiv preprint arXiv:1909.04276 (2019)."},{"key":"e_1_3_2_1_11_1","doi-asserted-by":"publisher","DOI":"10.1109\/ISCA45697.2020.00084"},{"key":"e_1_3_2_1_12_1","doi-asserted-by":"publisher","DOI":"10.1145\/3466752.3480127"},{"key":"e_1_3_2_1_13_1","doi-asserted-by":"publisher","unstructured":"Samuel Hsia Udit Gupta Mark Wilkening Carole-Jean Wu Gu-Yeon Wei and David Brooks. 2020. Cross-Stack Workload Characterization of Deep Recommendation Systems. https:\/\/doi.org\/10.48550\/ARXIV.2010.05037","DOI":"10.48550\/ARXIV.2010.05037"},{"key":"e_1_3_2_1_14_1","doi-asserted-by":"publisher","DOI":"10.1109\/ISCA45697.2020.00083"},{"key":"e_1_3_2_1_15_1","doi-asserted-by":"publisher","DOI":"10.1145\/3488423.3519317"},{"key":"e_1_3_2_1_16_1","doi-asserted-by":"publisher","DOI":"10.1145\/3579371.3589112"},{"key":"e_1_3_2_1_17_1","unstructured":"Wenqi Jiang Zhenhao He Shuai Zhang Thomas\u00a0B. Preu\u00dfer Kai Zeng Liang Feng Jiansong Zhang Tongxuan Liu Yong Li Jingren Zhou Ce Zhang and Gustavo Alonso. 2021. MicroRec: Efficient Recommendation Inference by Hardware and Data Structure Solutions. arxiv:2010.05894\u00a0[cs.AR]"},{"key":"e_1_3_2_1_18_1","doi-asserted-by":"publisher","DOI":"10.1145\/3447548.3467139"},{"key":"e_1_3_2_1_19_1","volume-title":"Hercules: Heterogeneity-Aware Inference Serving for At-Scale Personalized Recommendation. arxiv:2203.07424\u00a0[cs.DC]","author":"Ke Liu","year":"2022","unstructured":"Liu Ke, Udit Gupta, Mark Hempstead, Carole-Jean Wu, Hsien-Hsin\u00a0S. Lee, and Xuan Zhang. 2022. Hercules: Heterogeneity-Aware Inference Serving for At-Scale Personalized Recommendation. arxiv:2203.07424\u00a0[cs.DC]"},{"key":"e_1_3_2_1_20_1","doi-asserted-by":"publisher","DOI":"10.1145\/3401071.3401659"},{"key":"e_1_3_2_1_21_1","doi-asserted-by":"publisher","DOI":"10.1145\/3489525.3511692"},{"key":"e_1_3_2_1_22_1","doi-asserted-by":"publisher","DOI":"10.1016\/j.future.2017.10.047"},{"key":"e_1_3_2_1_23_1","doi-asserted-by":"publisher","DOI":"10.1145\/3352460.3358284"},{"key":"e_1_3_2_1_24_1","doi-asserted-by":"publisher","DOI":"10.1145\/3564121.3564134"},{"key":"e_1_3_2_1_25_1","doi-asserted-by":"publisher","DOI":"10.14778\/3421424.3421425"},{"key":"e_1_3_2_1_26_1","volume-title":"Deep learning recommendation model for personalization and recommendation systems. arXiv preprint arXiv:1906.00091","author":"Naumov Maxim","year":"2019","unstructured":"Maxim Naumov, Dheevatsa Mudigere, Hao-Jun\u00a0Michael Shi, Jianyu Huang, Narayanan Sundaraman, Jongsoo Park, Xiaodong Wang, Udit Gupta, Carole-Jean Wu, Alisson\u00a0G Azzolini, 2019. Deep learning recommendation model for personalization and recommendation systems. arXiv preprint arXiv:1906.00091 (2019)."},{"volume-title":"PyTorch: An Imperative Style","author":"Paszke Adam","key":"e_1_3_2_1_27_1","unstructured":"Adam Paszke, Sam Gross, Francisco Massa, Adam Lerer, James Bradbury, Gregory Chanan, Trevor Killeen, Zeming Lin, Natalia Gimelshein, Luca Antiga, Alban Desmaison, Andreas Kopf, Edward Yang, Zachary DeVito, Martin Raison, Alykhan Tejani, Sasank Chilamkurthy, Benoit Steiner, Lu Fang, Junjie Bai, and Soumith Chintala. 2019. PyTorch: An Imperative Style, High-Performance Deep Learning Library. In Advances in Neural Information Processing Systems 32, H.\u00a0Wallach, H.\u00a0Larochelle, A.\u00a0Beygelzimer, F.\u00a0d'Alch\u00e9-Buc, E.\u00a0Fox, and R.\u00a0Garnett (Eds.). Curran Associates, Inc., 8024\u20138035. http:\/\/papers.neurips.cc\/paper\/9015-pytorch-an-imperative-style-high-performance-deep-learning-library.pdf"},{"key":"e_1_3_2_1_28_1","doi-asserted-by":"publisher","unstructured":"Geet Sethi Bilge Acun Niket Agarwal Christos Kozyrakis Caroline Trippel and Carole-Jean Wu. 2022. RecShard: Statistical Feature-Based Memory Optimization for Industry-Scale Neural Recommendation. https:\/\/doi.org\/10.48550\/ARXIV.2201.10095","DOI":"10.48550\/ARXIV.2201.10095"},{"key":"e_1_3_2_1_29_1","volume-title":"Accessed","author":"Wikipedia","year":"2021","unstructured":"Wikipedia contributors. 2021. Linear Interpolation. https:\/\/en.wikipedia.org\/wiki\/Linear_interpolation. Accessed September 23, 2023."},{"key":"e_1_3_2_1_30_1","doi-asserted-by":"publisher","DOI":"10.1145\/3445814.3446763"},{"key":"e_1_3_2_1_31_1","doi-asserted-by":"publisher","DOI":"10.1609\/aaai.v33i01.3301346"},{"key":"e_1_3_2_1_32_1","unstructured":"Inc. Xilinx. 2019. Xilinx QDMA DPDK Poll Mode Driver. https:\/\/xilinx.github.io\/dma_ip_drivers\/2019.1\/DPDK\/html\/index.html"},{"key":"e_1_3_2_1_33_1","doi-asserted-by":"publisher","unstructured":"Guorui Zhou Kun Gai Xiaoqiang Zhu Chenru Song Ying Fan Han Zhu Xiao Ma Yanghui Yan Junqi Jin and Han Li. 2018. Deep Interest Network for Click-Through Rate Prediction. 1059\u20131068. https:\/\/doi.org\/10.1145\/3219819.3219823","DOI":"10.1145\/3219819.3219823"},{"key":"e_1_3_2_1_34_1","doi-asserted-by":"publisher","DOI":"10.1609\/aaai.v33i01.33015941"},{"key":"e_1_3_2_1_35_1","doi-asserted-by":"publisher","DOI":"10.1109\/FPL53798.2021.00057"}],"event":{"name":"AIMLSystems 2023: The Third International Conference on Artificial Intelligence and Machine Learning Systems","acronym":"AIMLSystems 2023","location":"Bangalore India"},"container-title":["The Third International Conference on Artificial Intelligence and Machine Learning Systems"],"original-title":[],"link":[{"URL":"https:\/\/dl.acm.org\/doi\/10.1145\/3639856.3639878","content-type":"unspecified","content-version":"vor","intended-application":"text-mining"},{"URL":"https:\/\/dl.acm.org\/doi\/pdf\/10.1145\/3639856.3639878","content-type":"unspecified","content-version":"vor","intended-application":"similarity-checking"}],"deposited":{"date-parts":[[2025,8,22]],"date-time":"2025-08-22T17:00:28Z","timestamp":1755882028000},"score":1,"resource":{"primary":{"URL":"https:\/\/dl.acm.org\/doi\/10.1145\/3639856.3639878"}},"subtitle":[],"short-title":[],"issued":{"date-parts":[[2023,10,25]]},"references-count":35,"alternative-id":["10.1145\/3639856.3639878","10.1145\/3639856"],"URL":"https:\/\/doi.org\/10.1145\/3639856.3639878","relation":{},"subject":[],"published":{"date-parts":[[2023,10,25]]},"assertion":[{"value":"2024-05-17","order":3,"name":"published","label":"Published","group":{"name":"publication_history","label":"Publication History"}}]}}