{"status":"ok","message-type":"work","message-version":"1.0.0","message":{"indexed":{"date-parts":[[2025,6,19]],"date-time":"2025-06-19T05:01:28Z","timestamp":1750309288846,"version":"3.41.0"},"publisher-location":"New York, NY, USA","reference-count":35,"publisher":"ACM","license":[{"start":{"date-parts":[[2024,10,1]],"date-time":"2024-10-01T00:00:00Z","timestamp":1727740800000},"content-version":"vor","delay-in-days":0,"URL":"https:\/\/www.acm.org\/publications\/policies\/copyright_policy#Background"}],"funder":[{"name":"National Key R&D Program of China","award":["2023YFB4502400"],"award-info":[{"award-number":["2023YFB4502400"]}]},{"name":"China NSF grant","award":["62322206","62132018","U2268204","62025204","62272307","62372296"],"award-info":[{"award-number":["62322206","62132018","U2268204","62025204","62272307","62372296"]}]}],"content-domain":{"domain":["dl.acm.org"],"crossmark-restriction":true},"short-container-title":[],"published-print":{"date-parts":[[2024,10,14]]},"DOI":"10.1145\/3641512.3686360","type":"proceedings-article","created":{"date-parts":[[2024,10,1]],"date-time":"2024-10-01T21:11:22Z","timestamp":1727817082000},"page":"51-60","update-policy":"https:\/\/doi.org\/10.1145\/crossmark-policy","source":"Crossref","is-referenced-by-count":0,"title":["On the Analysis of Two-Stage Stochastic Bandit"],"prefix":"10.1145","author":[{"ORCID":"https:\/\/orcid.org\/0009-0000-0068-8624","authenticated-orcid":false,"given":"Yumou","family":"Liu","sequence":"first","affiliation":[{"name":"The Chinese University of Hong Kong, Shenzhen, Shenzhen, China"}]},{"ORCID":"https:\/\/orcid.org\/0009-0009-8221-0717","authenticated-orcid":false,"given":"Haoming","family":"Li","sequence":"additional","affiliation":[{"name":"Shanghai Jiao Tong University, Shanghai, China"}]},{"ORCID":"https:\/\/orcid.org\/0000-0002-5094-5331","authenticated-orcid":false,"given":"Zhenzhe","family":"Zheng","sequence":"additional","affiliation":[{"name":"Shanghai Jiao Tong University, Shanghai, China"}]},{"ORCID":"https:\/\/orcid.org\/0000-0003-0965-9058","authenticated-orcid":false,"given":"Fan","family":"Wu","sequence":"additional","affiliation":[{"name":"Shanghai Jiao Tong University, Shanghai, China"}]},{"ORCID":"https:\/\/orcid.org\/0000-0002-6934-1685","authenticated-orcid":false,"given":"Guihai","family":"Chen","sequence":"additional","affiliation":[{"name":"Shanghai Jiao Tong University, Shanghai, China"}]}],"member":"320","published-online":{"date-parts":[[2024,10]]},"reference":[{"doi-asserted-by":"publisher","key":"e_1_3_2_1_1_1","DOI":"10.1145\/3383313.3412217"},{"doi-asserted-by":"publisher","key":"e_1_3_2_1_2_1","DOI":"10.1145\/2939672.2939718"},{"key":"e_1_3_2_1_3_1","volume-title":"An empirical evaluation of thompson sampling. Advances in neural information processing systems 24","author":"Chapelle O.","year":"2011","unstructured":"Chapelle, O., and Li, L. An empirical evaluation of thompson sampling. Advances in neural information processing systems 24 (2011)."},{"doi-asserted-by":"publisher","key":"e_1_3_2_1_4_1","DOI":"10.1145\/2959100.2959190"},{"doi-asserted-by":"publisher","key":"e_1_3_2_1_5_1","DOI":"10.1145\/1242572.1242610"},{"key":"e_1_3_2_1_6_1","volume-title":"Syndicated bandits: A framework for auto tuning hyper-parameters in contextual bandit algorithms. Advances in Neural Information Processing Systems","author":"Ding Q.","year":"2022","unstructured":"Ding, Q., Kang, Y., Liu, Y.-W., Lee, T. C. M., Hsieh, C.-J., and Sharpnack, J. Syndicated bandits: A framework for auto tuning hyper-parameters in contextual bandit algorithms. Advances in Neural Information Processing Systems (2022), 1170--1181."},{"doi-asserted-by":"publisher","key":"e_1_3_2_1_7_1","DOI":"10.1145\/3240323.3240387"},{"doi-asserted-by":"publisher","key":"e_1_3_2_1_8_1","DOI":"10.1145\/3511808.3557065"},{"doi-asserted-by":"publisher","key":"e_1_3_2_1_9_1","DOI":"10.1145\/3340531.3412700"},{"doi-asserted-by":"publisher","key":"e_1_3_2_1_10_1","DOI":"10.1145\/3383313.3412214"},{"doi-asserted-by":"publisher","key":"e_1_3_2_1_11_1","DOI":"10.1145\/3523227.3551468"},{"doi-asserted-by":"publisher","key":"e_1_3_2_1_12_1","DOI":"10.1145\/3097983.3098184"},{"key":"e_1_3_2_1_13_1","volume-title":"On component interactions in two-stage recommender systems. Advances in neural information processing systems 34","author":"Hron J.","year":"2021","unstructured":"Hron, J., Krauth, K., Jordan, M., and Kilbertus, N. On component interactions in two-stage recommender systems. Advances in neural information processing systems 34 (2021), 2744--2757."},{"key":"e_1_3_2_1_14_1","volume-title":"Exploration in two-stage recommender systems. arXiv preprint arXiv:2009.08956","author":"Hron J.","year":"2020","unstructured":"Hron, J., Krauth, K., Jordan, M. I., and Kilbertus, N. Exploration in two-stage recommender systems. arXiv preprint arXiv:2009.08956 (2020)."},{"key":"e_1_3_2_1_15_1","volume-title":"Towards a theoretical understanding of two-stage recommender systems","author":"Jaiswal A. K.","year":"2024","unstructured":"Jaiswal, A. K. Towards a theoretical understanding of two-stage recommender systems, 2024."},{"key":"e_1_3_2_1_16_1","first-page":"1215","volume-title":"International Conference on Machine Learning","author":"Katariya S.","year":"2016","unstructured":"Katariya, S., Kveton, B., Szepesvari, C., and Wen, Z. Dcm bandits: Learning to rank with multiple clicks. In International Conference on Machine Learning (2016), pp. 1215--1224."},{"key":"e_1_3_2_1_17_1","first-page":"767","volume-title":"International Conference on Machine Learning","author":"Kveton B.","year":"2015","unstructured":"Kveton, B., Szepesvari, C., Wen, Z., and Ashkan, A. Cascading bandits: Learning to rank in the cascade model. In International Conference on Machine Learning (2015), pp. 767--776."},{"doi-asserted-by":"publisher","key":"e_1_3_2_1_18_1","DOI":"10.1017\/9781108571401"},{"key":"e_1_3_2_1_19_1","volume-title":"WWW","author":"Li L.","year":"2010","unstructured":"Li, L., Chu, W., Langford, J., and Schapire, R. E. A contextual-bandit approach to personalized news article recommendation. In WWW (2010)."},{"doi-asserted-by":"publisher","key":"e_1_3_2_1_20_1","DOI":"10.1145\/3041021.3054202"},{"doi-asserted-by":"publisher","key":"e_1_3_2_1_21_1","DOI":"10.1145\/3523227.3547396"},{"doi-asserted-by":"publisher","key":"e_1_3_2_1_22_1","DOI":"10.1145\/3404835.3462979"},{"doi-asserted-by":"publisher","key":"e_1_3_2_1_23_1","DOI":"10.1145\/3209978.3210104"},{"doi-asserted-by":"publisher","key":"e_1_3_2_1_24_1","DOI":"10.1145\/3240323.3240354"},{"key":"e_1_3_2_1_25_1","volume-title":"Probabilistic matrix factorization. Advances in Neural Information Processing Systems","author":"Mnih A.","year":"2007","unstructured":"Mnih, A., and Salakhutdinov, R. R. Probabilistic matrix factorization. Advances in Neural Information Processing Systems (2007), 1257--1264."},{"doi-asserted-by":"publisher","key":"e_1_3_2_1_26_1","DOI":"10.1145\/3372224.3419188"},{"doi-asserted-by":"publisher","key":"e_1_3_2_1_27_1","DOI":"10.5555\/1768197.1768209"},{"doi-asserted-by":"publisher","key":"e_1_3_2_1_28_1","DOI":"10.1145\/3219819.3219869"},{"key":"e_1_3_2_1_29_1","volume-title":"Cold: Towards the next generation of pre-ranking system. arXiv preprint arXiv:2007.16122","author":"Wang Z.","year":"2020","unstructured":"Wang, Z., Zhao, L., Jiang, B., Zhou, G., Zhu, X., and Gai, K. Cold: Towards the next generation of pre-ranking system. arXiv preprint arXiv:2007.16122 (2020)."},{"doi-asserted-by":"publisher","key":"e_1_3_2_1_30_1","DOI":"10.1145\/3534678.3539181"},{"doi-asserted-by":"publisher","key":"e_1_3_2_1_31_1","DOI":"10.1145\/3447548.3467097"},{"key":"e_1_3_2_1_32_1","volume-title":"On-device recommender systems: A comprehensive survey. arXiv preprint arXiv:2401.11441","author":"Yin H.","year":"2024","unstructured":"Yin, H., Qu, L., Chen, T., Yuan, W., Zheng, R., Long, J., Xia, X., Shi, Y., and Zhang, C. On-device recommender systems: A comprehensive survey. arXiv preprint arXiv:2401.11441 (2024)."},{"doi-asserted-by":"publisher","key":"e_1_3_2_1_33_1","DOI":"10.1609\/aaai.v32i1.11601"},{"doi-asserted-by":"publisher","key":"e_1_3_2_1_34_1","DOI":"10.1145\/3219819.3219823"},{"key":"e_1_3_2_1_35_1","first-page":"4199","volume-title":"International Conference on Machine Learning","author":"Zoghi M.","year":"2017","unstructured":"Zoghi, M., Tunys, T., Ghavamzadeh, M., Kveton, B., Szepesvari, C., and Wen, Z. Online learning to rank in stochastic click models. In International Conference on Machine Learning (2017), pp. 4199--4208."}],"event":{"sponsor":["SIGMOBILE ACM Special Interest Group on Mobility of Systems, Users, Data and Computing"],"acronym":"MobiHoc '24","name":"MobiHoc '24: Twenty-fifth International Symposium on Theory, Algorithmic Foundations, and Protocol Design for Mobile Networks and Mobile Computing","location":"Athens Greece"},"container-title":["Proceedings of the Twenty-fifth International Symposium on Theory, Algorithmic Foundations, and Protocol Design for Mobile Networks and Mobile Computing"],"original-title":[],"link":[{"URL":"https:\/\/dl.acm.org\/doi\/10.1145\/3641512.3686360","content-type":"unspecified","content-version":"vor","intended-application":"text-mining"},{"URL":"https:\/\/dl.acm.org\/doi\/pdf\/10.1145\/3641512.3686360","content-type":"unspecified","content-version":"vor","intended-application":"similarity-checking"}],"deposited":{"date-parts":[[2025,6,19]],"date-time":"2025-06-19T00:03:22Z","timestamp":1750291402000},"score":1,"resource":{"primary":{"URL":"https:\/\/dl.acm.org\/doi\/10.1145\/3641512.3686360"}},"subtitle":[],"short-title":[],"issued":{"date-parts":[[2024,10]]},"references-count":35,"alternative-id":["10.1145\/3641512.3686360","10.1145\/3641512"],"URL":"https:\/\/doi.org\/10.1145\/3641512.3686360","relation":{},"subject":[],"published":{"date-parts":[[2024,10]]},"assertion":[{"value":"2024-10-01","order":3,"name":"published","label":"Published","group":{"name":"publication_history","label":"Publication History"}}]}}