{"status":"ok","message-type":"work","message-version":"1.0.0","message":{"indexed":{"date-parts":[[2026,5,4]],"date-time":"2026-05-04T05:45:41Z","timestamp":1777873541440,"version":"3.51.4"},"publisher-location":"New York, NY, USA","reference-count":49,"publisher":"ACM","funder":[{"name":"Yonghua Foundation"}],"content-domain":{"domain":["dl.acm.org"],"crossmark-restriction":true},"short-container-title":[],"published-print":{"date-parts":[[2025,8,3]]},"DOI":"10.1145\/3711896.3737276","type":"proceedings-article","created":{"date-parts":[[2025,8,3]],"date-time":"2025-08-03T21:03:27Z","timestamp":1754255007000},"page":"5129-5138","update-policy":"https:\/\/doi.org\/10.1145\/crossmark-policy","source":"Crossref","is-referenced-by-count":0,"title":["Leveraging Label Distributions as Anchors to Enhance Video Recommendation"],"prefix":"10.1145","author":[{"ORCID":"https:\/\/orcid.org\/0009-0003-6587-9781","authenticated-orcid":false,"given":"Yulin","family":"Xu","sequence":"first","affiliation":[{"name":"University of California, Irvine, Irvine, CA, USA"}],"role":[{"role":"author","vocabulary":"crossref"}]},{"ORCID":"https:\/\/orcid.org\/0009-0000-2097-7888","authenticated-orcid":false,"given":"Chao","family":"Cui","sequence":"additional","affiliation":[{"name":"Tsinghua University, Beijing, China"}],"role":[{"role":"author","vocabulary":"crossref"}]},{"ORCID":"https:\/\/orcid.org\/0000-0002-4550-3950","authenticated-orcid":false,"given":"Shisong","family":"Tang","sequence":"additional","affiliation":[{"name":"KuaiShou Inc., Beijing, China"}],"role":[{"role":"author","vocabulary":"crossref"}]},{"ORCID":"https:\/\/orcid.org\/0009-0005-7772-9523","authenticated-orcid":false,"given":"Fan","family":"Li","sequence":"additional","affiliation":[{"name":"KuaiShou Inc., Beijing, China"}],"role":[{"role":"author","vocabulary":"crossref"}]},{"ORCID":"https:\/\/orcid.org\/0009-0007-5044-6368","authenticated-orcid":false,"given":"Bing","family":"Han","sequence":"additional","affiliation":[{"name":"KuaiShou Inc., Beijing, China"}],"role":[{"role":"author","vocabulary":"crossref"}]},{"ORCID":"https:\/\/orcid.org\/0009-0009-6414-3303","authenticated-orcid":false,"given":"Huafeng","family":"Cao","sequence":"additional","affiliation":[{"name":"Kuaishou Inc., Beijing, China"}],"role":[{"role":"author","vocabulary":"crossref"}]},{"ORCID":"https:\/\/orcid.org\/0000-0003-0628-1416","authenticated-orcid":false,"given":"Jiechao","family":"Gao","sequence":"additional","affiliation":[{"name":"Center for SDGC, Stanford University, Palo Alto, CA, USA"}],"role":[{"role":"author","vocabulary":"crossref"}]},{"ORCID":"https:\/\/orcid.org\/0000-0001-7835-9556","authenticated-orcid":false,"given":"Hechang","family":"Chen","sequence":"additional","affiliation":[{"name":"Jilin University, Jilin, China"}],"role":[{"role":"author","vocabulary":"crossref"}]}],"member":"320","published-online":{"date-parts":[[2025,8,3]]},"reference":[{"key":"e_1_3_2_2_1_1","doi-asserted-by":"publisher","DOI":"10.1007\/978-3-030-01264-9_9"},{"key":"e_1_3_2_2_2_1","volume-title":"Unsupervised learning of visual features by contrasting cluster assignments. Advances in neural information processing systems","author":"Caron Mathilde","year":"2020","unstructured":"Mathilde Caron, Ishan Misra, Julien Mairal, Priya Goyal, Piotr Bojanowski, and Armand Joulin. 2020. Unsupervised learning of visual features by contrasting cluster assignments. Advances in neural information processing systems, Vol. 33 (2020), 9912-9924."},{"key":"e_1_3_2_2_3_1","doi-asserted-by":"publisher","DOI":"10.1145\/2959100.2959190"},{"key":"e_1_3_2_2_4_1","volume-title":"Pranking with ranking. Advances in neural information processing systems","author":"Crammer Koby","year":"2001","unstructured":"Koby Crammer and Yoram Singer. 2001. Pranking with ranking. Advances in neural information processing systems, Vol. 14 (2001)."},{"key":"e_1_3_2_2_5_1","doi-asserted-by":"publisher","DOI":"10.1145\/1864708.1864770"},{"key":"e_1_3_2_2_6_1","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR46437.2021.01268"},{"key":"e_1_3_2_2_7_1","doi-asserted-by":"publisher","DOI":"10.1145\/3511808.3557220"},{"key":"e_1_3_2_2_8_1","volume-title":"Proceedings of the fourteenth international conference on artificial intelligence and statistics. JMLR Workshop and Conference Proceedings, 315-323","author":"Glorot Xavier","year":"2011","unstructured":"Xavier Glorot, Antoine Bordes, and Yoshua Bengio. 2011. Deep sparse rectifier neural networks. In Proceedings of the fourteenth international conference on artificial intelligence and statistics. JMLR Workshop and Conference Proceedings, 315-323."},{"key":"e_1_3_2_2_9_1","doi-asserted-by":"publisher","DOI":"10.1145\/3511808.3557065"},{"key":"e_1_3_2_2_10_1","unstructured":"Eric Jang Shixiang Gu and Ben Poole. 2016. Categorical reparameterization with gumbel-softmax. arXiv preprint arXiv:1611.01144(2016)."},{"key":"e_1_3_2_2_11_1","doi-asserted-by":"crossref","unstructured":"Zhuxi Jiang Yin Zheng Huachun Tan Bangsheng Tang and Hanning Zhou. 2016. Variational deep embedding: An unsupervised and generative approach to clustering. arXiv preprint arXiv:1611.05148(2016).","DOI":"10.24963\/ijcai.2017\/273"},{"key":"e_1_3_2_2_12_1","volume-title":"Kamran Aziz, Simon Fong, and Sababady Sarasvady.","author":"Khan Kamran","year":"2014","unstructured":"Kamran Khan, Saif Ur Rehman, Kamran Aziz, Simon Fong, and Sababady Sarasvady. 2014. DBSCAN: Past, present and future. In The fifth international conference on the applications of digital information and web technologies (ICADIWT 2014). IEEE, 232-238."},{"key":"e_1_3_2_2_13_1","volume-title":"Adam: A method for stochastic optimization. arXiv preprint arXiv:1412.6980(2014).","author":"Kingma Diederik P","year":"2014","unstructured":"Diederik P Kingma and Jimmy Ba. 2014. Adam: A method for stochastic optimization. arXiv preprint arXiv:1412.6980(2014)."},{"key":"e_1_3_2_2_14_1","volume-title":"Seed-bench: Benchmarking multimodal llms with generative comprehension. arXiv preprint arXiv:2307.16125(2023).","author":"Li Bohao","year":"2023","unstructured":"Bohao Li, Rui Wang, Guangzhi Wang, Yuying Ge, Yixiao Ge, and Ying Shan. 2023. Seed-bench: Benchmarking multimodal llms with generative comprehension. arXiv preprint arXiv:2307.16125(2023)."},{"key":"e_1_3_2_2_15_1","doi-asserted-by":"publisher","DOI":"10.1145\/3637528.3671514"},{"key":"e_1_3_2_2_16_1","volume-title":"AAAI 2025 Workshop on Artificial Intelligence with Causal Techniques. https:\/\/openreview.net\/forum?id=7btnaN4Std","author":"Li Meng","year":"2025","unstructured":"Meng Li and Haochen Sui. 2025. Causal Recommendation via Machine Unlearning with a Few Unbiased Data. In AAAI 2025 Workshop on Artificial Intelligence with Causal Techniques. https:\/\/openreview.net\/forum?id=7btnaN4Std"},{"key":"e_1_3_2_2_17_1","doi-asserted-by":"publisher","DOI":"10.1609\/aaai.v35i10.17037"},{"key":"e_1_3_2_2_18_1","volume-title":"The global k-means clustering algorithm. Pattern recognition","author":"Likas Aristidis","year":"2003","unstructured":"Aristidis Likas, Nikos Vlassis, and Jakob J Verbeek. 2003. The global k-means clustering algorithm. Pattern recognition, Vol. 36, 2 (2003), 451-461."},{"key":"e_1_3_2_2_19_1","unstructured":"Chengzhi Lin Shuchang Liu Chuyuan Wang and Yongqi Liu. 2024. Conditional Quantile Estimation for Uncertain Watch Time in Short-Video Recommendation. arXiv preprint arXiv:2407.12223(2024)."},{"key":"e_1_3_2_2_20_1","doi-asserted-by":"publisher","DOI":"10.1145\/3580305.3599919"},{"key":"e_1_3_2_2_21_1","unstructured":"Qijiong Liu Xiaoyu Dong Jiaren Xiao Nuo Chen Hengchang Hu Jieming Zhu Chenxu Zhu Tetsuya Sakai and Xiao-Ming Wu. 2024a. Vector Quantization for Recommender Systems: A Review and Outlook. arXiv preprint arXiv:2405.03110(2024)."},{"key":"e_1_3_2_2_22_1","first-page":"1","article-title":"Multimodal recommender systems: A survey","volume":"57","author":"Liu Qidong","year":"2024","unstructured":"Qidong Liu, Jiaxi Hu, Yutian Xiao, Xiangyu Zhao, Jingtong Gao, Wanyu Wang, Qing Li, and Jiliang Tang. 2024b. Multimodal recommender systems: A survey. Comput. Surveys, Vol. 57, 2 (2024), 1-17.","journal-title":"Comput. Surveys"},{"key":"e_1_3_2_2_23_1","unstructured":"Hongxu Ma Kai Tian Tao Zhang Xuefeng Zhang Chunjie Chen Han Li Jihong Guan and Shuigeng Zhou. 2024. Generative Regression Based Watch Time Prediction for Video Recommendation: Model and Performance. arXiv preprint arXiv:2412.20211(2024)."},{"key":"e_1_3_2_2_24_1","volume-title":"Early stopping-but when? In Neural Networks: Tricks of the trade","author":"Prechelt Lutz","unstructured":"Lutz Prechelt. 2002. Early stopping-but when? In Neural Networks: Tricks of the trade. Springer, 55-69."},{"key":"e_1_3_2_2_25_1","volume-title":"Trung Vu, Lukasz Heldt, Lichan Hong, Yi Tay, Vinh Tran, Jonah Samost, et al.","author":"Rajput Shashank","year":"2024","unstructured":"Shashank Rajput, Nikhil Mehta, Anima Singh, Raghunandan Hulikal Keshavan, Trung Vu, Lukasz Heldt, Lichan Hong, Yi Tay, Vinh Tran, Jonah Samost, et al., 2024. Recommender systems with generative retrieval. Advances in Neural Information Processing Systems, Vol. 36 (2024)."},{"key":"e_1_3_2_2_26_1","volume-title":"Hierarchical text-conditional image generation with clip latents. arXiv preprint arXiv:2204.06125","author":"Ramesh Aditya","year":"2022","unstructured":"Aditya Ramesh, Prafulla Dhariwal, Alex Nichol, Casey Chu, and Mark Chen. 2022. Hierarchical text-conditional image generation with clip latents. arXiv preprint arXiv:2204.06125, Vol. 1, 2 (2022), 3."},{"key":"e_1_3_2_2_27_1","doi-asserted-by":"crossref","unstructured":"Douglas A Reynolds et al. 2009. Gaussian mixture models. Encyclopedia of biometrics Vol. 741 659-663 (2009).","DOI":"10.1007\/978-0-387-73003-5_196"},{"key":"e_1_3_2_2_28_1","volume-title":"Dropout: a simple way to prevent neural networks from overfitting. The journal of machine learning research","author":"Srivastava Nitish","year":"2014","unstructured":"Nitish Srivastava, Geoffrey Hinton, Alex Krizhevsky, Ilya Sutskever, and Ruslan Salakhutdinov. 2014. Dropout: a simple way to prevent neural networks from overfitting. The journal of machine learning research, Vol. 15, 1 (2014), 1929-1958."},{"key":"e_1_3_2_2_29_1","doi-asserted-by":"publisher","DOI":"10.1609\/aaai.v38i8.28752"},{"key":"e_1_3_2_2_30_1","doi-asserted-by":"publisher","DOI":"10.1145\/3485447.3511934"},{"key":"e_1_3_2_2_31_1","doi-asserted-by":"publisher","DOI":"10.1145\/3580305.3599797"},{"key":"e_1_3_2_2_32_1","unstructured":"Aaron Van Den Oord Oriol Vinyals et al. 2017. Neural discrete representation learning. Advances in neural information processing systems Vol. 30 (2017)."},{"key":"e_1_3_2_2_33_1","volume-title":"Neural Discrete Representation Learning. CoRR","author":"van den Oord A\u00e4ron","year":"2017","unstructured":"A\u00e4ron van den Oord, Oriol Vinyals, and Koray Kavukcuoglu. 2017. Neural Discrete Representation Learning. CoRR, Vol. abs\/1711.00937 (2017). arXiv:1711.00937 http:\/\/arxiv.org\/abs\/1711.00937"},{"key":"e_1_3_2_2_34_1","doi-asserted-by":"crossref","unstructured":"C\u00e9dric Villani et al. 2009. Optimal transport: old and new. Vol. 338. Springer.","DOI":"10.1007\/978-3-540-71050-9"},{"key":"e_1_3_2_2_35_1","doi-asserted-by":"publisher","DOI":"10.1609\/aaai.v34i04.6108"},{"key":"e_1_3_2_2_36_1","volume-title":"Invariant Spatiotemporal Representation Learning for Cross-patient Seizure Classification. In The First Workshop on NeuroAI @ NeurIPS2024","author":"Wu Yuntian","year":"2024","unstructured":"Yuntian Wu, Yuntian Yang, Jiabao Sean Xiao, Chuan Zhou, Haochen Sui, and Haoxuan Li. 2024. Invariant Spatiotemporal Representation Learning for Cross-patient Seizure Classification. In The First Workshop on NeuroAI @ NeurIPS2024. https:\/\/openreview.net\/forum?id=Ex6wAivo7G"},{"key":"e_1_3_2_2_37_1","first-page":"83","article-title":"Integrating AI for Enhanced Exploration of Video Recommendation Algorithm via Improved Collaborative Filtering","volume":"4","author":"Xiang Yafei","year":"2024","unstructured":"Yafei Xiang, Shuning Huo, Yichao Wu, Yulu Gong, and Mengran Zhu. 2024. Integrating AI for Enhanced Exploration of Video Recommendation Algorithm via Improved Collaborative Filtering. Journal of Theory and Practice of Engineering Science, Vol. 4, 02 (2024), 83-90.","journal-title":"Journal of Theory and Practice of Engineering Science"},{"key":"e_1_3_2_2_38_1","unstructured":"Shentao Yang Haichuan Yang Linna Du Adithya Ganesh Bo Peng Boying Liu Serena Li and Ji Liu. 2024. SWaT: Statistical Modeling of Video Watch Time through User Behavior Analysis. arXiv preprint arXiv:2408.07759(2024)."},{"key":"e_1_3_2_2_39_1","unstructured":"Penghang Yin Jiancheng Lyu Shuai Zhang Stanley Osher Yingyong Qi and Jack Xin. 2019. Understanding straight-through estimator in training activation quantized neural nets. arXiv preprint arXiv:1903.05662(2019)."},{"key":"e_1_3_2_2_40_1","doi-asserted-by":"publisher","DOI":"10.1145\/3613904.3642433"},{"key":"e_1_3_2_2_41_1","volume-title":"Anygpt: Unified multimodal llm with discrete sequence modeling. arXiv preprint arXiv:2402.12226(2024).","author":"Zhan Jun","year":"2024","unstructured":"Jun Zhan, Junqi Dai, Jiasheng Ye, Yunhua Zhou, Dong Zhang, Zhigeng Liu, Xin Zhang, Ruibin Yuan, Ge Zhang, Linyang Li, et al., 2024. Anygpt: Unified multimodal llm with discrete sequence modeling. arXiv preprint arXiv:2402.12226(2024)."},{"key":"e_1_3_2_2_42_1","doi-asserted-by":"crossref","unstructured":"Ruohan Zhan Changhua Pei Qiang Su Jianfeng Wen Xueliang Wang Guanyu Mu Dong Zheng and Peng Jiang. 2022a. Deconfounding Duration Bias in Watch-time Prediction for Video Recommendation. arXiv:2206.06003 [cs.IR] https:\/\/arxiv.org\/abs\/2206.06003","DOI":"10.1145\/3534678.3539092"},{"key":"e_1_3_2_2_43_1","doi-asserted-by":"publisher","DOI":"10.1145\/3534678.3539092"},{"key":"e_1_3_2_2_44_1","volume-title":"Ninerec: A benchmark dataset suite for evaluating transferable recommendation","author":"Zhang Jiaqi","year":"2024","unstructured":"Jiaqi Zhang, Yu Cheng, Yongxin Ni, Yunzhu Pan, Zheng Yuan, Junchen Fu, Youhua Li, Jie Wang, and Fajie Yuan. 2024. Ninerec: A benchmark dataset suite for evaluating transferable recommendation. IEEE Transactions on Pattern Analysis and Machine Intelligence(2024)."},{"key":"e_1_3_2_2_45_1","doi-asserted-by":"publisher","DOI":"10.1016\/j.fmre.2021.11.015"},{"key":"e_1_3_2_2_46_1","doi-asserted-by":"publisher","DOI":"10.1145\/3637528.3671817"},{"key":"e_1_3_2_2_47_1","doi-asserted-by":"publisher","DOI":"10.1145\/3604915.3608797"},{"key":"e_1_3_2_2_48_1","doi-asserted-by":"publisher","DOI":"10.1109\/ICCV51070.2023.02084"},{"key":"e_1_3_2_2_49_1","doi-asserted-by":"publisher","DOI":"10.1145\/3503161.3548428"}],"event":{"name":"KDD '25: The 31st ACM SIGKDD Conference on Knowledge Discovery and Data Mining","location":"Toronto ON Canada","acronym":"KDD '25","sponsor":["SIGKDD ACM Special Interest Group on Knowledge Discovery in Data","SIGMOD ACM Special Interest Group on Management of Data"]},"container-title":["Proceedings of the 31st ACM SIGKDD Conference on Knowledge Discovery and Data Mining V.2"],"original-title":[],"link":[{"URL":"https:\/\/dl.acm.org\/doi\/pdf\/10.1145\/3711896.3737276","content-type":"unspecified","content-version":"vor","intended-application":"similarity-checking"}],"deposited":{"date-parts":[[2026,4,30]],"date-time":"2026-04-30T18:01:31Z","timestamp":1777572091000},"score":1,"resource":{"primary":{"URL":"https:\/\/dl.acm.org\/doi\/10.1145\/3711896.3737276"}},"subtitle":[],"short-title":[],"issued":{"date-parts":[[2025,8,3]]},"references-count":49,"alternative-id":["10.1145\/3711896.3737276","10.1145\/3711896"],"URL":"https:\/\/doi.org\/10.1145\/3711896.3737276","relation":{},"subject":[],"published":{"date-parts":[[2025,8,3]]},"assertion":[{"value":"2025-08-03","order":3,"name":"published","label":"Published","group":{"name":"publication_history","label":"Publication History"}}]}}