{"status":"ok","message-type":"work","message-version":"1.0.0","message":{"indexed":{"date-parts":[[2026,4,10]],"date-time":"2026-04-10T10:08:39Z","timestamp":1775815719310,"version":"3.50.1"},"publisher-location":"New York, NY, USA","reference-count":33,"publisher":"ACM","license":[{"start":{"date-parts":[[2018,10,17]],"date-time":"2018-10-17T00:00:00Z","timestamp":1539734400000},"content-version":"vor","delay-in-days":0,"URL":"https:\/\/www.acm.org\/publications\/policies\/copyright_policy#Background"}],"content-domain":{"domain":["dl.acm.org"],"crossmark-restriction":true},"short-container-title":[],"published-print":{"date-parts":[[2018,10,17]]},"DOI":"10.1145\/3269206.3271748","type":"proceedings-article","created":{"date-parts":[[2018,10,22]],"date-time":"2018-10-22T12:08:27Z","timestamp":1540210107000},"page":"1443-1451","update-policy":"https:\/\/doi.org\/10.1145\/crossmark-policy","source":"Crossref","is-referenced-by-count":83,"title":["Budget Constrained Bidding by Model-free Reinforcement Learning in Display Advertising"],"prefix":"10.1145","author":[{"given":"Di","family":"Wu","sequence":"first","affiliation":[{"name":"Alibaba Group, Beijing, China"}]},{"given":"Xiujun","family":"Chen","sequence":"additional","affiliation":[{"name":"Alibaba Group, Beijing, China"}]},{"given":"Xun","family":"Yang","sequence":"additional","affiliation":[{"name":"Alibaba Group, Beijing, China"}]},{"given":"Hao","family":"Wang","sequence":"additional","affiliation":[{"name":"Alibaba Group, Beijing, China"}]},{"given":"Qing","family":"Tan","sequence":"additional","affiliation":[{"name":"Alibaba Group, Beijing, China"}]},{"given":"Xiaoxun","family":"Zhang","sequence":"additional","affiliation":[{"name":"Alibaba Group, Beijing, China"}]},{"given":"Jian","family":"Xu","sequence":"additional","affiliation":[{"name":"Alibaba Group, Beijing, China"}]},{"given":"Kun","family":"Gai","sequence":"additional","affiliation":[{"name":"Alibaba Group, Beijing, China"}]}],"member":"320","published-online":{"date-parts":[[2018,10,17]]},"reference":[{"key":"e_1_3_2_1_1_1","unstructured":"2017. IAB internet advertising revenue report. https:\/\/www.iab.com\/wp-content\/uploads\/2017\/12\/IAB-Internet-Ad-Revenue-Report-Half-Year-2017-REPORT. pdf.  2017. IAB internet advertising revenue report. https:\/\/www.iab.com\/wp-content\/uploads\/2017\/12\/IAB-Internet-Ad-Revenue-Report-Half-Year-2017-REPORT. pdf."},{"key":"e_1_3_2_1_2_1","doi-asserted-by":"publisher","DOI":"10.1145\/1250910.1250950"},{"key":"e_1_3_2_1_3_1","doi-asserted-by":"crossref","volume-title":"Constrained Markov decision processes","author":"Altman Eitan","DOI":"10.1201\/9781315140223"},{"key":"e_1_3_2_1_4_1","volume-title":"Budget optimization for sponsored search: Censored learning in MDPs. arXiv preprint arXiv:1210.4847","author":"Amin Kareem","year":"2012"},{"key":"e_1_3_2_1_5_1","doi-asserted-by":"crossref","unstructured":"Santiago Balseiro and Yonatan Gur. 2017. Learning in repeated auctions with budgets: Regret minimization and equilibrium. (2017).  Santiago Balseiro and Yonatan Gur. 2017. Learning in repeated auctions with budgets: Regret minimization and equilibrium. (2017).","DOI":"10.1145\/3033274.3084088"},{"key":"e_1_3_2_1_6_1","doi-asserted-by":"publisher","DOI":"10.1145\/3038912.3052682"},{"key":"e_1_3_2_1_7_1","doi-asserted-by":"publisher","DOI":"10.1145\/1242572.1242644"},{"key":"e_1_3_2_1_8_1","doi-asserted-by":"publisher","DOI":"10.1145\/3018661.3018702"},{"key":"e_1_3_2_1_9_1","volume-title":"Stier-Moses","author":"Conitzer Vincent","year":"2017"},{"key":"e_1_3_2_1_10_1","doi-asserted-by":"publisher","DOI":"10.1287\/opre.5.2.266"},{"key":"e_1_3_2_1_11_1","doi-asserted-by":"publisher","DOI":"10.1007\/978-3-319-69179-4_50"},{"key":"e_1_3_2_1_12_1","volume-title":"Internet advertising and the generalized second-price auction: Selling billions of dollars worth of keywords. American economic review 97, 1","author":"Edelman Benjamin","year":"2007"},{"key":"e_1_3_2_1_13_1","doi-asserted-by":"publisher","DOI":"10.1145\/1526709.1526744"},{"key":"e_1_3_2_1_14_1","doi-asserted-by":"publisher","DOI":"10.1137\/120874679"},{"key":"e_1_3_2_1_15_1","unstructured":"John Hegeman Rong Yan and Gregory Joseph Badros. 2011. Budget-based advertisment bidding. US Patent 20130124308A1.  John Hegeman Rong Yan and Gregory Joseph Badros. 2011. Budget-based advertisment bidding. US Patent 20130124308A1."},{"key":"e_1_3_2_1_16_1","doi-asserted-by":"publisher","DOI":"10.1016\/j.orl.2013.12.009"},{"key":"e_1_3_2_1_17_1","volume-title":"Auction theory","author":"Krishna Vijay"},{"key":"e_1_3_2_1_18_1","doi-asserted-by":"publisher","DOI":"10.1109\/TC.2001.970573"},{"key":"e_1_3_2_1_19_1","doi-asserted-by":"publisher","DOI":"10.1145\/2501040.2501979"},{"key":"e_1_3_2_1_20_1","doi-asserted-by":"publisher","DOI":"10.1145\/2339530.2339651"},{"key":"e_1_3_2_1_21_1","doi-asserted-by":"publisher","DOI":"10.1145\/2983323.2983656"},{"key":"e_1_3_2_1_22_1","doi-asserted-by":"publisher","DOI":"10.1145\/2487575.2488200"},{"key":"e_1_3_2_1_23_1","doi-asserted-by":"publisher","DOI":"10.1145\/1284320.1284321"},{"key":"e_1_3_2_1_24_1","doi-asserted-by":"crossref","unstructured":"Volodymyr Mnih Koray Kavukcuoglu David Silver Andrei A. Rusu Joel Veness Marc G. Bellemare Alex Graves Martin Riedmiller Andreas K. Fidjeland Georg Ostrovski etal 2015. Human-level control through deep reinforcement learning. Nature 518 7540 (2015) 529--533.  Volodymyr Mnih Koray Kavukcuoglu David Silver Andrei A. Rusu Joel Veness Marc G. Bellemare Alex Graves Martin Riedmiller Andreas K. Fidjeland Georg Ostrovski et al. 2015. Human-level control through deep reinforcement learning. Nature 518 7540 (2015) 529--533.","DOI":"10.1038\/nature14236"},{"key":"e_1_3_2_1_25_1","volume-title":"Vazirani","author":"Nisan Noam","year":"2007"},{"key":"e_1_3_2_1_26_1","doi-asserted-by":"publisher","DOI":"10.1145\/2339530.2339655"},{"key":"e_1_3_2_1_27_1","volume-title":"Barto","author":"Sutton Richard S.","year":"1998"},{"key":"e_1_3_2_1_28_1","doi-asserted-by":"publisher","DOI":"10.1145\/2684822.2697041"},{"key":"e_1_3_2_1_29_1","doi-asserted-by":"publisher","DOI":"10.1145\/2396761.2396828"},{"key":"e_1_3_2_1_30_1","doi-asserted-by":"publisher","DOI":"10.1145\/2501040.2501980"},{"key":"e_1_3_2_1_31_1","volume-title":"Optimal real-time bidding frameworks discussion. arXiv preprint arXiv:1602.01007","author":"Zhang Weinan","year":"2016"},{"key":"e_1_3_2_1_32_1","doi-asserted-by":"publisher","DOI":"10.1145\/2623330.2623633"},{"key":"e_1_3_2_1_33_1","doi-asserted-by":"publisher","DOI":"10.1007\/978-3-540-92185-1_63"}],"event":{"name":"CIKM '18: The 27th ACM International Conference on Information and Knowledge Management","location":"Torino Italy","acronym":"CIKM '18","sponsor":["SIGWEB ACM Special Interest Group on Hypertext, Hypermedia, and Web","SIGIR ACM Special Interest Group on Information Retrieval"]},"container-title":["Proceedings of the 27th ACM International Conference on Information and Knowledge Management"],"original-title":[],"link":[{"URL":"https:\/\/dl.acm.org\/doi\/10.1145\/3269206.3271748","content-type":"unspecified","content-version":"vor","intended-application":"text-mining"},{"URL":"https:\/\/dl.acm.org\/doi\/pdf\/10.1145\/3269206.3271748","content-type":"unspecified","content-version":"vor","intended-application":"similarity-checking"}],"deposited":{"date-parts":[[2025,6,18]],"date-time":"2025-06-18T00:44:29Z","timestamp":1750207469000},"score":1,"resource":{"primary":{"URL":"https:\/\/dl.acm.org\/doi\/10.1145\/3269206.3271748"}},"subtitle":[],"short-title":[],"issued":{"date-parts":[[2018,10,17]]},"references-count":33,"alternative-id":["10.1145\/3269206.3271748","10.1145\/3269206"],"URL":"https:\/\/doi.org\/10.1145\/3269206.3271748","relation":{},"subject":[],"published":{"date-parts":[[2018,10,17]]},"assertion":[{"value":"2018-10-17","order":2,"name":"published","label":"Published","group":{"name":"publication_history","label":"Publication History"}}]}}