{"status":"ok","message-type":"work","message-version":"1.0.0","message":{"indexed":{"date-parts":[[2026,4,10]],"date-time":"2026-04-10T10:08:40Z","timestamp":1775815720589,"version":"3.50.1"},"publisher-location":"New York, NY, USA","reference-count":44,"publisher":"ACM","license":[{"start":{"date-parts":[[2022,8,14]],"date-time":"2022-08-14T00:00:00Z","timestamp":1660435200000},"content-version":"vor","delay-in-days":0,"URL":"https:\/\/www.acm.org\/publications\/policies\/copyright_policy#Background"}],"content-domain":{"domain":["dl.acm.org"],"crossmark-restriction":true},"short-container-title":[],"published-print":{"date-parts":[[2022,8,14]]},"DOI":"10.1145\/3534678.3539164","type":"proceedings-article","created":{"date-parts":[[2022,8,12]],"date-time":"2022-08-12T19:06:12Z","timestamp":1660331172000},"page":"3495-3503","update-policy":"https:\/\/doi.org\/10.1145\/crossmark-policy","source":"Crossref","is-referenced-by-count":22,"title":["Semantic Retrieval at Walmart"],"prefix":"10.1145","author":[{"given":"Alessandro","family":"Magnani","sequence":"first","affiliation":[{"name":"Walmart Global Technology, Sunnyvale, CA, USA"}]},{"given":"Feng","family":"Liu","sequence":"additional","affiliation":[{"name":"Walmart Global Technology, Sunnyvale, CA, USA"}]},{"given":"Suthee","family":"Chaidaroon","sequence":"additional","affiliation":[{"name":"Santa Clara University, Santa Clara, CA, USA"}]},{"given":"Sachin","family":"Yadav","sequence":"additional","affiliation":[{"name":"Walmart Global Technology, Bangalore, India"}]},{"given":"Praveen","family":"Reddy Suram","sequence":"additional","affiliation":[{"name":"Walmart Global Technology, Bangalore, India"}]},{"given":"Ajit","family":"Puthenputhussery","sequence":"additional","affiliation":[{"name":"Walmart Global Technology, Sunnyvale, CA, USA"}]},{"given":"Sijie","family":"Chen","sequence":"additional","affiliation":[{"name":"Walmart Global Technology, Sunnyvale, CA, USA"}]},{"given":"Min","family":"Xie","sequence":"additional","affiliation":[{"name":"Instacart, Santa Clara, CA, USA"}]},{"given":"Anirudh","family":"Kashi","sequence":"additional","affiliation":[{"name":"University of Southern California, Los Angeles, CA, USA"}]},{"given":"Tony","family":"Lee","sequence":"additional","affiliation":[{"name":"Walmart Global Technology, Sunnyvale, CA, USA"}]},{"given":"Ciya","family":"Liao","sequence":"additional","affiliation":[{"name":"Walmart Global Technology, Sunnyvale, CA, USA"}]}],"member":"320","published-online":{"date-parts":[[2022,8,14]]},"reference":[{"key":"e_1_3_2_1_1_1","volume-title":"The inverted multi-index","author":"Babenko Artem","year":"2014","unstructured":"Artem Babenko and Victor Lempitsky. 2014. The inverted multi-index. IEEE transactions on pattern analysis and machine intelligence 37, 6 (2014), 1247--1260."},{"key":"e_1_3_2_1_2_1","volume-title":"The Customer And Shopping Cart To Build A Three Fold Recommendation System. arXiv preprint arXiv:1705.06338","author":"Behera Bibek","year":"2017","unstructured":"Bibek Behera, Manoj Joshi, Abhilash KK, and Mohammad Ansari Ismail. 2017. Distributed Vector Representation Of Shopping Items, The Customer And Shopping Cart To Build A Three Fold Recommendation System. arXiv preprint arXiv:1705.06338 (2017)."},{"key":"e_1_3_2_1_3_1","unstructured":"Eliot Brenner Jun Zhao Aliasgar Kutiyanawala and Zheng Yan. 2018. Endto-End Neural Ranking for eCommerce Product Search: an application of task models and textual embeddings. In eCom."},{"key":"e_1_3_2_1_4_1","doi-asserted-by":"publisher","DOI":"10.1142\/S0218001493000339"},{"key":"e_1_3_2_1_5_1","doi-asserted-by":"publisher","DOI":"10.14778\/2556549.2556562"},{"key":"e_1_3_2_1_6_1","first-page":"689","article-title":"Personalized Search: Potential and Pitfalls","volume":"2016","author":"Dumais Susan T.","year":"2016","unstructured":"Susan T. Dumais. 2016. Personalized Search: Potential and Pitfalls. In CIKM, 2016. 689.","journal-title":"CIKM"},{"key":"e_1_3_2_1_7_1","volume-title":"SPLADE: Sparse lexical and expansion model for first stage ranking. In SIGIR. 2288--2292.","author":"Formal Thibault","year":"2021","unstructured":"Thibault Formal, Benjamin Piwowarski, and St\u00e9phane Clinchant. 2021. SPLADE: Sparse lexical and expansion model for first stage ranking. In SIGIR. 2288--2292."},{"key":"e_1_3_2_1_8_1","volume-title":"Modularized transfomer-based ranking framework. arXiv preprint arXiv:2004.13313","author":"Gao Luyu","year":"2020","unstructured":"Luyu Gao, Zhuyun Dai, and Jamie Callan. 2020. Modularized transfomer-based ranking framework. arXiv preprint arXiv:2004.13313 (2020)."},{"key":"e_1_3_2_1_9_1","volume-title":"COIL: Revisit Exact Lexical Match in Information Retrieval with Contextualized Inverted List. arXiv preprint arXiv:2104.07186","author":"Gao Luyu","year":"2021","unstructured":"Luyu Gao, Zhuyun Dai, and Jamie Callan. 2021. COIL: Revisit Exact Lexical Match in Information Retrieval with Contextualized Inverted List. arXiv preprint arXiv:2104.07186 (2021)."},{"key":"e_1_3_2_1_10_1","doi-asserted-by":"publisher","DOI":"10.1007\/978-3-030-72113-8_10"},{"key":"e_1_3_2_1_11_1","volume-title":"Realm: Retrieval-augmented language model pre-training. arXiv preprint arXiv:2002.08909","author":"Guu Kelvin","year":"2020","unstructured":"Kelvin Guu, Kenton Lee, Zora Tung, Panupong Pasupat, and Ming-Wei Chang. 2020. Realm: Retrieval-augmented language model pre-training. arXiv preprint arXiv:2002.08909 (2020)."},{"key":"e_1_3_2_1_12_1","unstructured":"Kaiming He Haoqi Fan Yuxin Wu Saining Xie and Ross Girshick. 2020. Momentum contrast for unsupervised visual representation learning. In CVPR. 9729-- 9738."},{"key":"e_1_3_2_1_13_1","doi-asserted-by":"publisher","DOI":"10.1145\/3394486.3403305"},{"key":"e_1_3_2_1_14_1","first-page":"2333","article-title":"Learning deep structured semantic models for web search using clickthrough data","volume":"2013","author":"Huang Po-Sen","year":"2013","unstructured":"Po-Sen Huang, Xiaodong He, Jianfeng Gao, Li Deng, Alex Acero, and Larry P. Heck. 2013. Learning deep structured semantic models for web search using clickthrough data. In CIKM, 2013. 2333--2338.","journal-title":"CIKM"},{"key":"e_1_3_2_1_15_1","volume-title":"Poly-encoders: Transformer architectures and pre-training strategies for fast and accurate multi-sentence scoring. arXiv preprint arXiv:1905.01969","author":"Humeau Samuel","year":"2019","unstructured":"Samuel Humeau, Kurt Shuster, Marie-Anne Lachaux, and Jason Weston. 2019. Poly-encoders: Transformer architectures and pre-training strategies for fast and accurate multi-sentence scoring. arXiv preprint arXiv:1905.01969 (2019)."},{"key":"e_1_3_2_1_16_1","doi-asserted-by":"crossref","unstructured":"Thorsten Joachims. 1998. Text categorization with support vector machines: Learning with many relevant features. In ECML. 137--142.","DOI":"10.1007\/BFb0026683"},{"key":"e_1_3_2_1_17_1","unstructured":"Thorsten Joachims et al. 2003. Evaluating Retrieval Performance Using Clickthrough Data."},{"key":"e_1_3_2_1_18_1","doi-asserted-by":"publisher","DOI":"10.1145\/3077136.3080838"},{"key":"e_1_3_2_1_19_1","volume-title":"Dense passage retrieval for opendomain question answering. arXiv preprint arXiv:2004.04906","author":"Karpukhin Vladimir","year":"2020","unstructured":"Vladimir Karpukhin, Sewon Min, Patrick Lewis, Ledell Wu, Sergey Edunov, Danqi Chen, and Wen-tau Yih. 2020. Dense passage retrieval for opendomain question answering. arXiv preprint arXiv:2004.04906 (2020)."},{"key":"e_1_3_2_1_20_1","volume-title":"Colbert: Efficient and effective passage search via contextualized late interaction over bert. In SIGIR. 39--48.","author":"Khattab Omar","year":"2020","unstructured":"Omar Khattab and Matei Zaharia. 2020. Colbert: Efficient and effective passage search via contextualized late interaction over bert. In SIGIR. 39--48."},{"key":"e_1_3_2_1_21_1","volume-title":"Adam: A method for stochastic optimization. arXiv preprint arXiv:1412.6980","author":"Kingma Diederik P","year":"2014","unstructured":"Diederik P Kingma and Jimmy Ba. 2014. Adam: A method for stochastic optimization. arXiv preprint arXiv:1412.6980 (2014)."},{"key":"e_1_3_2_1_22_1","doi-asserted-by":"publisher","DOI":"10.1145\/3447548.3467127"},{"key":"e_1_3_2_1_23_1","doi-asserted-by":"publisher","DOI":"10.1162\/tacl_a_00369"},{"key":"e_1_3_2_1_24_1","volume-title":"Raffaele Perego, Nicola Tonellotto, Nazli Goharian, and Ophir Frieder.","author":"MacAvaney Sean","year":"2020","unstructured":"Sean MacAvaney, Franco Maria Nardini, Raffaele Perego, Nicola Tonellotto, Nazli Goharian, and Ophir Frieder. 2020. Efficient document re-ranking for transformers by precomputing term representations. In SIGIR. 49--58."},{"key":"e_1_3_2_1_25_1","volume-title":"Introduction to information retrieval","author":"Manning Christopher D.","unstructured":"Christopher D. Manning, Prabhakar Raghavan, and Hinrich Sch\u00fctze. 2008. Introduction to information retrieval. Cambridge University Press."},{"key":"e_1_3_2_1_26_1","volume-title":"Efficient Estimation of Word Representations in Vector Space. CoRR abs\/1301.3781","author":"Mikolov Tomas","year":"2013","unstructured":"Tomas Mikolov, Kai Chen, Greg Corrado, and Jeffrey Dean. 2013. Efficient Estimation of Word Representations in Vector Space. CoRR abs\/1301.3781 (2013)."},{"key":"e_1_3_2_1_27_1","doi-asserted-by":"publisher","DOI":"10.1561\/1500000061"},{"key":"e_1_3_2_1_28_1","volume-title":"XtremeDistil: Multi-stage distillation for massive multilingual models. arXiv preprint arXiv:2004.05686","author":"Mukherjee Subhabrata","year":"2020","unstructured":"Subhabrata Mukherjee and Ahmed Awadallah. 2020. XtremeDistil: Multi-stage distillation for massive multilingual models. arXiv preprint arXiv:2004.05686 (2020)."},{"key":"e_1_3_2_1_29_1","doi-asserted-by":"publisher","DOI":"10.1145\/3292500.3330759"},{"key":"e_1_3_2_1_30_1","volume-title":"PyTorch: An Imperative Style","author":"Paszke Adam","unstructured":"Adam Paszke, Sam Gross, Francisco Massa, Adam Lerer, James Bradbury, Gregory Chanan, Trevor Killeen, Zeming Lin, Natalia Gimelshein, Luca Antiga, Alban Desmaison, Andreas Kopf, Edward Yang, Zachary DeVito, Martin Raison, Alykhan Tejani, Sasank Chilamkurthy, Benoit Steiner, Lu Fang, Junjie Bai, and Soumith Chintala. 2019. PyTorch: An Imperative Style, High-Performance Deep Learning Library. In Advances in Neural Information Processing Systems 32, H. Wallach, H. Larochelle, A. Beygelzimer, F. d'Alch\u00e9-Buc, E. Fox, and R. Garnett (Eds.). Curran Associates, Inc., 8024--8035. http:\/\/papers.neurips.cc\/paper\/9015-pytorchan-imperative-style-high-performance-deep-learning-library.pdf"},{"key":"e_1_3_2_1_31_1","volume-title":"Daxiang Dong, Hua Wu, and Haifeng Wang.","author":"Qu Yingqi","year":"2021","unstructured":"Yingqi Qu, Yuchen Ding, Jing Liu, Kai Liu, Ruiyang Ren, Wayne Xin Zhao, Daxiang Dong, Hua Wu, and Haifeng Wang. 2021. RocketQA: An optimized training approach to dense passage retrieval for open-domain question answering. In NAACL-HLT."},{"key":"e_1_3_2_1_32_1","volume-title":"SIGIR Workshop on eCommerce","author":"Sarvi Fatemeh","year":"2020","unstructured":"Fatemeh Sarvi, Nikos Voskarides, Lois Mooiman, Sebastian Schelter, and Maarten de Rijke. 2020. A Comparison of Supervised Learning to Match Methods for Product Search. SIGIR Workshop on eCommerce (2020)."},{"key":"e_1_3_2_1_33_1","first-page":"101","article-title":"A Latent Semantic Model with Convolutional-Pooling Structure for Information Retrieval","volume":"2014","author":"Shen Yelong","year":"2014","unstructured":"Yelong Shen, Xiaodong He, Jianfeng Gao, Li Deng, and Gr\u00e9goire Mesnil. 2014. A Latent Semantic Model with Convolutional-Pooling Structure for Information Retrieval. In CIKM, 2014. 101--110.","journal-title":"CIKM"},{"key":"e_1_3_2_1_34_1","doi-asserted-by":"publisher","DOI":"10.1145\/2567948.2577348"},{"key":"e_1_3_2_1_35_1","unstructured":"Ashish Vaswani Noam Shazeer Niki Parmar Jakob Uszkoreit Llion Jones Aidan N. Gomez Lukasz Kaiser and Illia Polosukhin. 2017. Attention is All you Need. In NeurIPS. 6000--6010."},{"key":"e_1_3_2_1_36_1","first-page":"5776","article-title":"Minilm: Deep self-attention distillation for task-agnostic compression of pre-trained transformers","volume":"33","author":"Wang Wenhui","year":"2020","unstructured":"Wenhui Wang, Furu Wei, Li Dong, Hangbo Bao, Nan Yang, and Ming Zhou. 2020. Minilm: Deep self-attention distillation for task-agnostic compression of pre-trained transformers. NeurIPS 33 (2020), 5776--5788.","journal-title":"NeurIPS"},{"key":"e_1_3_2_1_37_1","volume-title":"Transformers: State-of-the-Art Natural Language Processing. In EMNLP.","author":"Thomas Wolf","year":"2020","unstructured":"Thomas Wolf et al. 2020. Transformers: State-of-the-Art Natural Language Processing. In EMNLP."},{"key":"e_1_3_2_1_38_1","doi-asserted-by":"publisher","DOI":"10.18653\/v1\/2020.sustainlp-1.11"},{"key":"e_1_3_2_1_39_1","doi-asserted-by":"publisher","DOI":"10.1145\/3077136.3080809"},{"key":"e_1_3_2_1_40_1","volume-title":"Russell Power, and Jamie Callan","author":"Xiong Chenyan","year":"2017","unstructured":"Chenyan Xiong, Russell Power, and Jamie Callan. 2017. Explicit Semantic Ranking for Academic Search via Knowledge Graph Embedding. In WWW, 2017. 1271-- 1279."},{"key":"e_1_3_2_1_41_1","volume-title":"Approximate nearest neighbor negative contrastive learning for dense text retrieval. arXiv preprint arXiv:2007.00808","author":"Xiong Lee","year":"2020","unstructured":"Lee Xiong, Chenyan Xiong, Ye Li, Kwok-Fung Tang, Jialin Liu, Paul Bennett, Junaid Ahmed, and Arnold Overwijk. 2020. Approximate nearest neighbor negative contrastive learning for dense text retrieval. arXiv preprint arXiv:2007.00808 (2020)."},{"key":"e_1_3_2_1_42_1","doi-asserted-by":"publisher","DOI":"10.1145\/3366424.3386195"},{"key":"e_1_3_2_1_43_1","doi-asserted-by":"publisher","DOI":"10.1145\/3442381.3450129"},{"key":"e_1_3_2_1_44_1","doi-asserted-by":"publisher","DOI":"10.1145\/3447548.3467147"}],"event":{"name":"KDD '22: The 28th ACM SIGKDD Conference on Knowledge Discovery and Data Mining","location":"Washington DC USA","acronym":"KDD '22","sponsor":["SIGMOD ACM Special Interest Group on Management of Data","SIGKDD ACM Special Interest Group on Knowledge Discovery in Data"]},"container-title":["Proceedings of the 28th ACM SIGKDD Conference on Knowledge Discovery and Data Mining"],"original-title":[],"link":[{"URL":"https:\/\/dl.acm.org\/doi\/10.1145\/3534678.3539164","content-type":"unspecified","content-version":"vor","intended-application":"text-mining"},{"URL":"https:\/\/dl.acm.org\/doi\/pdf\/10.1145\/3534678.3539164","content-type":"unspecified","content-version":"vor","intended-application":"similarity-checking"}],"deposited":{"date-parts":[[2025,6,17]],"date-time":"2025-06-17T19:02:58Z","timestamp":1750186978000},"score":1,"resource":{"primary":{"URL":"https:\/\/dl.acm.org\/doi\/10.1145\/3534678.3539164"}},"subtitle":[],"short-title":[],"issued":{"date-parts":[[2022,8,14]]},"references-count":44,"alternative-id":["10.1145\/3534678.3539164","10.1145\/3534678"],"URL":"https:\/\/doi.org\/10.1145\/3534678.3539164","relation":{},"subject":[],"published":{"date-parts":[[2022,8,14]]},"assertion":[{"value":"2022-08-14","order":3,"name":"published","label":"Published","group":{"name":"publication_history","label":"Publication History"}}]}}