{"status":"ok","message-type":"work","message-version":"1.0.0","message":{"indexed":{"date-parts":[[2026,4,13]],"date-time":"2026-04-13T06:58:20Z","timestamp":1776063500354,"version":"3.50.1"},"publisher-location":"New York, NY, USA","reference-count":57,"publisher":"ACM","license":[{"start":{"date-parts":[[2022,4,25]],"date-time":"2022-04-25T00:00:00Z","timestamp":1650844800000},"content-version":"vor","delay-in-days":0,"URL":"https:\/\/www.acm.org\/publications\/policies\/copyright_policy#Background"}],"funder":[{"DOI":"10.13039\/501100002358","name":"Beihang University","doi-asserted-by":"publisher","award":["21340301D"],"award-info":[{"award-number":["21340301D"]}],"id":[{"id":"10.13039\/501100002358","id-type":"DOI","asserted-by":"publisher"}]},{"DOI":"10.13039\/100000001","name":"National Science Foundation","doi-asserted-by":"publisher","award":["III-1763325, III-1909323, III-2106758, SaTC-1930941"],"award-info":[{"award-number":["III-1763325, III-1909323, III-2106758, SaTC-1930941"]}],"id":[{"id":"10.13039\/100000001","id-type":"DOI","asserted-by":"publisher"}]}],"content-domain":{"domain":["dl.acm.org"],"crossmark-restriction":true},"short-container-title":[],"published-print":{"date-parts":[[2022,4,25]]},"DOI":"10.1145\/3485447.3512077","type":"proceedings-article","created":{"date-parts":[[2022,4,25]],"date-time":"2022-04-25T05:11:23Z","timestamp":1650863483000},"page":"2036-2047","update-policy":"https:\/\/doi.org\/10.1145\/crossmark-policy","source":"Crossref","is-referenced-by-count":161,"title":["Sequential Recommendation via Stochastic Self-Attention"],"prefix":"10.1145","author":[{"given":"Ziwei","family":"Fan","sequence":"first","affiliation":[{"name":"University of Illinois at Chicago, USA"}]},{"given":"Zhiwei","family":"Liu","sequence":"additional","affiliation":[{"name":"University of Illinois at Chicago, USA"}]},{"given":"Yu","family":"Wang","sequence":"additional","affiliation":[{"name":"University of Illinois at Chicago, USA"}]},{"given":"Alice","family":"Wang","sequence":"additional","affiliation":[{"name":"Spotify Research, USA"}]},{"given":"Zahra","family":"Nazari","sequence":"additional","affiliation":[{"name":"Spotify Research, USA"}]},{"given":"Lei","family":"Zheng","sequence":"additional","affiliation":[{"name":"Pinterest Inc., USA"}]},{"given":"Hao","family":"Peng","sequence":"additional","affiliation":[{"name":"Beihang University, China"}]},{"given":"Philip S.","family":"Yu","sequence":"additional","affiliation":[{"name":"University of Illinois at Chicago, USA"}]}],"member":"320","published-online":{"date-parts":[[2022,4,25]]},"reference":[{"key":"e_1_3_2_1_1_1","volume-title":"International Conference on Learning Representations. https:\/\/openreview.net\/forum?id=r1ZdKJ-0W","author":"Bojchevski Aleksandar","year":"2018","unstructured":"Aleksandar Bojchevski and Stephan G\u00fcnnemann. 2018. Deep Gaussian Embedding of Graphs: Unsupervised Inductive Learning via Ranking. In International Conference on Learning Representations. https:\/\/openreview.net\/forum?id=r1ZdKJ-0W"},{"key":"e_1_3_2_1_2_1","unstructured":"Jiawei Chen Hande Dong Xiang Wang Fuli Feng Meng Wang and Xiangnan He. 2020. Bias and debias in recommender system: A survey and future directions. arXiv preprint arXiv:2010.03240(2020)."},{"key":"e_1_3_2_1_3_1","doi-asserted-by":"publisher","DOI":"10.1090\/S0002-9939-07-09020-X"},{"key":"e_1_3_2_1_4_1","volume-title":"Bert: Pre-training of deep bidirectional transformers for language understanding. arXiv preprint arXiv:1810.04805(2018).","author":"Devlin Jacob","year":"2018","unstructured":"Jacob Devlin, Ming-Wei Chang, Kenton Lee, and Kristina Toutanova. 2018. Bert: Pre-training of deep bidirectional transformers for language understanding. arXiv preprint arXiv:1810.04805(2018)."},{"key":"e_1_3_2_1_5_1","doi-asserted-by":"publisher","DOI":"10.1214\/aoms\/1177706708"},{"key":"e_1_3_2_1_6_1","doi-asserted-by":"publisher","DOI":"10.1145\/3459637.3482242"},{"key":"e_1_3_2_1_7_1","doi-asserted-by":"crossref","unstructured":"Ziwei Fan Zhiwei Liu Lei Zheng Shen Wang and Philip\u00a0S Yu. 2021. Modeling Sequences as Distributions with Uncertainty for Sequential Recommendation. arXiv preprint arXiv:2106.06165(2021).","DOI":"10.1145\/3459637.3482145"},{"key":"e_1_3_2_1_8_1","volume-title":"A survey of graph edit distance. Pattern Analysis and applications 13, 1","author":"Gao Xinbo","year":"2010","unstructured":"Xinbo Gao, Bing Xiao, Dacheng Tao, and Xuelong Li. 2010. A survey of graph edit distance. Pattern Analysis and applications 13, 1 (2010), 113\u2013129."},{"key":"e_1_3_2_1_9_1","doi-asserted-by":"publisher","DOI":"10.1145\/3397271.3401057"},{"key":"e_1_3_2_1_10_1","doi-asserted-by":"publisher","DOI":"10.1145\/3109859.3109882"},{"key":"e_1_3_2_1_11_1","doi-asserted-by":"publisher","DOI":"10.1109\/ICDM.2016.0030"},{"key":"e_1_3_2_1_12_1","doi-asserted-by":"publisher","DOI":"10.1145\/2806416.2806502"},{"key":"e_1_3_2_1_13_1","doi-asserted-by":"publisher","DOI":"10.1145\/3397271.3401063"},{"key":"e_1_3_2_1_14_1","unstructured":"Bal\u00e1zs Hidasi Alexandros Karatzoglou Linas Baltrunas and Domonkos Tikk. 2015. Session-based recommendations with recurrent neural networks. arXiv preprint arXiv:1511.06939(2015)."},{"key":"e_1_3_2_1_15_1","volume-title":"Long short-term memory. Neural computation 9, 8","author":"Hochreiter Sepp","year":"1997","unstructured":"Sepp Hochreiter and J\u00fcrgen Schmidhuber. 1997. Long short-term memory. Neural computation 9, 8 (1997), 1735\u20131780."},{"key":"e_1_3_2_1_16_1","doi-asserted-by":"publisher","DOI":"10.1145\/3038912.3052639"},{"key":"e_1_3_2_1_17_1","doi-asserted-by":"publisher","DOI":"10.1109\/ICDM.2018.00035"},{"key":"e_1_3_2_1_18_1","volume-title":"Kingma and Jimmy Ba","author":"P.","year":"2015","unstructured":"Diederik\u00a0P. Kingma and Jimmy Ba. 2015. Adam: A Method for Stochastic Optimization. In 3rd International Conference on Learning Representations, ICLR 2015, San Diego, CA, USA, May 7-9, 2015, Conference Track Proceedings, Yoshua Bengio and Yann LeCun (Eds.). http:\/\/arxiv.org\/abs\/1412.6980"},{"key":"e_1_3_2_1_19_1","volume-title":"Sliced Wasserstein Auto-Encoders. In International Conference on Learning Representations. https:\/\/openreview.net\/forum?id=H1xaJn05FQ","author":"Kolouri Soheil","year":"2019","unstructured":"Soheil Kolouri, Phillip\u00a0E. Pope, Charles\u00a0E. Martin, and Gustavo\u00a0K. Rohde. 2019. Sliced Wasserstein Auto-Encoders. In International Conference on Learning Representations. https:\/\/openreview.net\/forum?id=H1xaJn05FQ"},{"key":"e_1_3_2_1_20_1","doi-asserted-by":"publisher","DOI":"10.1145\/3394486.3403226"},{"key":"e_1_3_2_1_21_1","doi-asserted-by":"publisher","DOI":"10.1145\/3366423.3380260"},{"key":"e_1_3_2_1_22_1","doi-asserted-by":"publisher","DOI":"10.1145\/3336191.3371786"},{"key":"e_1_3_2_1_23_1","doi-asserted-by":"publisher","DOI":"10.1609\/aaai.v34i04.5894"},{"key":"e_1_3_2_1_24_1","doi-asserted-by":"publisher","DOI":"10.1145\/3372297.3417271"},{"key":"e_1_3_2_1_25_1","doi-asserted-by":"publisher","DOI":"10.1145\/3404835.3463036"},{"key":"e_1_3_2_1_26_1","doi-asserted-by":"publisher","DOI":"10.1109\/BigData50022.2020.9377917"},{"key":"e_1_3_2_1_27_1","unstructured":"Zhiwei Liu Liangwei Yang Ziwei Fan Hao Peng and Philip\u00a0S Yu. 2021. Federated Social Recommendation with Graph Neural Network. arXiv preprint arXiv:2111.10778(2021)."},{"key":"e_1_3_2_1_28_1","doi-asserted-by":"publisher","DOI":"10.1145\/3292500.3330984"},{"key":"e_1_3_2_1_29_1","doi-asserted-by":"publisher","DOI":"10.1145\/3394486.3403147"},{"key":"e_1_3_2_1_30_1","doi-asserted-by":"publisher","DOI":"10.1007\/BF02834632"},{"key":"e_1_3_2_1_31_1","doi-asserted-by":"publisher","DOI":"10.1145\/3397271.3401101"},{"key":"e_1_3_2_1_32_1","volume-title":"HAM: hybrid associations models for sequential recommendation","author":"Peng Bo","year":"2021","unstructured":"Bo Peng, Zhiyun Ren, Srinivasan Parthasarathy, and Xia Ning. 2021. HAM: hybrid associations models for sequential recommendation. IEEE Transactions on Knowledge and Data Engineering (2021)."},{"key":"e_1_3_2_1_33_1","volume-title":"International Conference on Learning Representations. https:\/\/openreview.net\/forum?id=HJeiDpVFPr","author":"Pitis Silviu","year":"2020","unstructured":"Silviu Pitis, Harris Chan, Kiarash Jamali, and Jimmy Ba. 2020. An Inductive Bias for Distances: Neural Nets that Respect the Triangle Inequality. In International Conference on Learning Representations. https:\/\/openreview.net\/forum?id=HJeiDpVFPr"},{"key":"e_1_3_2_1_34_1","doi-asserted-by":"publisher","DOI":"10.1609\/aaai.v35i15.17613"},{"key":"e_1_3_2_1_35_1","doi-asserted-by":"publisher","DOI":"10.1145\/3109859.3109896"},{"key":"e_1_3_2_1_36_1","volume-title":"BPR: Bayesian personalized ranking from implicit feedback. arXiv preprint arXiv:1205.2618(2012).","author":"Rendle Steffen","year":"2012","unstructured":"Steffen Rendle, Christoph Freudenthaler, Zeno Gantner, and Lars Schmidt-Thieme. 2012. BPR: Bayesian personalized ranking from implicit feedback. arXiv preprint arXiv:1205.2618(2012)."},{"key":"e_1_3_2_1_37_1","doi-asserted-by":"publisher","DOI":"10.1145\/1772690.1772773"},{"key":"e_1_3_2_1_38_1","doi-asserted-by":"publisher","DOI":"10.1007\/BF00532240"},{"key":"e_1_3_2_1_39_1","unstructured":"Chi Sun Hang Yan Xipeng Qiu and Xuanjing Huang. 2018. Gaussian word embedding with a wasserstein distance loss. arXiv preprint arXiv:1808.07016(2018)."},{"key":"e_1_3_2_1_40_1","doi-asserted-by":"publisher","DOI":"10.1145\/3357384.3357895"},{"key":"e_1_3_2_1_41_1","doi-asserted-by":"publisher","DOI":"10.1145\/3159652.3159656"},{"key":"e_1_3_2_1_42_1","doi-asserted-by":"publisher","DOI":"10.1145\/3178876.3186154"},{"key":"e_1_3_2_1_43_1","volume-title":"Visualizing data using t-SNE.Journal of machine learning research 9, 11","author":"Maaten Laurens Van\u00a0der","year":"2008","unstructured":"Laurens Van\u00a0der Maaten and Geoffrey Hinton. 2008. Visualizing data using t-SNE.Journal of machine learning research 9, 11 (2008)."},{"key":"e_1_3_2_1_44_1","unstructured":"Ashish Vaswani Noam Shazeer Niki Parmar Jakob Uszkoreit Llion Jones Aidan\u00a0N Gomez \u0141ukasz Kaiser and Illia Polosukhin. 2017. Attention is all you need. In Advances in neural information processing systems. 5998\u20136008."},{"key":"e_1_3_2_1_45_1","unstructured":"Luke Vilnis and Andrew McCallum. 2014. Word representations via gaussian embedding. arXiv preprint arXiv:1412.6623(2014)."},{"key":"e_1_3_2_1_46_1","doi-asserted-by":"crossref","unstructured":"Chen Wang Yueqing Liang Zhiwei Liu Tao Zhang and Philip\u00a0S Yu. 2021. Pre-training Graph Neural Network for Cross Domain Recommendation. arXiv preprint arXiv:2111.08268(2021).","DOI":"10.1109\/CogMI52975.2021.00026"},{"key":"e_1_3_2_1_47_1","doi-asserted-by":"publisher","DOI":"10.1145\/3459637.3482092"},{"key":"e_1_3_2_1_48_1","doi-asserted-by":"publisher","DOI":"10.1145\/3383313.3412258"},{"key":"e_1_3_2_1_49_1","doi-asserted-by":"publisher","DOI":"10.1145\/3357384.3358113"},{"key":"e_1_3_2_1_50_1","doi-asserted-by":"publisher","DOI":"10.1145\/3219819.3219890"},{"key":"e_1_3_2_1_51_1","volume-title":"MZET: Memory Augmented Zero-Shot Fine-grained Named Entity Typing. arXiv preprint arXiv:2004.01267(2020).","author":"Zhang Tao","year":"2020","unstructured":"Tao Zhang, Congying Xia, Chun-Ta Lu, and Philip Yu. 2020. MZET: Memory Augmented Zero-Shot Fine-grained Named Entity Typing. arXiv preprint arXiv:2004.01267(2020)."},{"key":"e_1_3_2_1_52_1","doi-asserted-by":"publisher","DOI":"10.18653\/v1\/2021.emnlp-main.442"},{"key":"e_1_3_2_1_53_1","doi-asserted-by":"publisher","DOI":"10.1145\/3331184.3331329"},{"key":"e_1_3_2_1_54_1","doi-asserted-by":"publisher","DOI":"10.1145\/3331184.3331330"},{"key":"e_1_3_2_1_55_1","unstructured":"Yao Zhou Haonan Wang Jingrui He and Haixun Wang. 2021. From Intrinsic to Counterfactual: On the Explainability of Contextualized Recommender Systems. arXiv preprint arXiv:2110.14844(2021)."},{"key":"e_1_3_2_1_56_1","doi-asserted-by":"publisher","DOI":"10.1145\/3447548.3467234"},{"key":"e_1_3_2_1_57_1","doi-asserted-by":"publisher","DOI":"10.1145\/3219819.3220052"}],"event":{"name":"WWW '22: The ACM Web Conference 2022","location":"Virtual Event, Lyon France","acronym":"WWW '22","sponsor":["SIGWEB ACM Special Interest Group on Hypertext, Hypermedia, and Web"]},"container-title":["Proceedings of the ACM Web Conference 2022"],"original-title":[],"link":[{"URL":"https:\/\/dl.acm.org\/doi\/10.1145\/3485447.3512077","content-type":"unspecified","content-version":"vor","intended-application":"text-mining"},{"URL":"https:\/\/dl.acm.org\/doi\/pdf\/10.1145\/3485447.3512077","content-type":"application\/pdf","content-version":"vor","intended-application":"syndication"},{"URL":"https:\/\/dl.acm.org\/doi\/pdf\/10.1145\/3485447.3512077","content-type":"unspecified","content-version":"vor","intended-application":"similarity-checking"}],"deposited":{"date-parts":[[2025,6,17]],"date-time":"2025-06-17T19:30:07Z","timestamp":1750188607000},"score":1,"resource":{"primary":{"URL":"https:\/\/dl.acm.org\/doi\/10.1145\/3485447.3512077"}},"subtitle":[],"short-title":[],"issued":{"date-parts":[[2022,4,25]]},"references-count":57,"alternative-id":["10.1145\/3485447.3512077","10.1145\/3485447"],"URL":"https:\/\/doi.org\/10.1145\/3485447.3512077","relation":{},"subject":[],"published":{"date-parts":[[2022,4,25]]},"assertion":[{"value":"2022-04-25","order":2,"name":"published","label":"Published","group":{"name":"publication_history","label":"Publication History"}}]}}