{"status":"ok","message-type":"work","message-version":"1.0.0","message":{"indexed":{"date-parts":[[2026,6,1]],"date-time":"2026-06-01T23:19:48Z","timestamp":1780355988343,"version":"3.54.1"},"publisher-location":"New York, NY, USA","reference-count":33,"publisher":"ACM","license":[{"start":{"date-parts":[[2017,2,2]],"date-time":"2017-02-02T00:00:00Z","timestamp":1485993600000},"content-version":"vor","delay-in-days":0,"URL":"https:\/\/www.acm.org\/publications\/policies\/copyright_policy#Background"}],"content-domain":{"domain":["dl.acm.org"],"crossmark-restriction":true},"short-container-title":[],"published-print":{"date-parts":[[2017,2,2]]},"DOI":"10.1145\/3018661.3018702","type":"proceedings-article","created":{"date-parts":[[2017,2,2]],"date-time":"2017-02-02T20:09:48Z","timestamp":1486066188000},"page":"661-670","update-policy":"https:\/\/doi.org\/10.1145\/crossmark-policy","source":"Crossref","is-referenced-by-count":158,"title":["Real-Time Bidding by Reinforcement Learning in Display Advertising"],"prefix":"10.1145","author":[{"given":"Han","family":"Cai","sequence":"first","affiliation":[{"name":"Shanghai Jiao Tong University, Shanghai, China"}],"role":[{"vocabulary":"crossref","role":"author"}]},{"given":"Kan","family":"Ren","sequence":"additional","affiliation":[{"name":"Shanghai Jiao Tong University, Shanghai, China"}],"role":[{"vocabulary":"crossref","role":"author"}]},{"given":"Weinan","family":"Zhang","sequence":"additional","affiliation":[{"name":"Shanghai Jiao Tong University, Shanghai, China"}],"role":[{"vocabulary":"crossref","role":"author"}]},{"given":"Kleanthis","family":"Malialis","sequence":"additional","affiliation":[{"name":"University College London, London, United Kingdom"}],"role":[{"vocabulary":"crossref","role":"author"}]},{"given":"Jun","family":"Wang","sequence":"additional","affiliation":[{"name":"University College London, London, United Kingdom"}],"role":[{"vocabulary":"crossref","role":"author"}]},{"given":"Yong","family":"Yu","sequence":"additional","affiliation":[{"name":"Shanghai Jiao Tong University, Shanghai, China"}],"role":[{"vocabulary":"crossref","role":"author"}]},{"given":"Defeng","family":"Guo","sequence":"additional","affiliation":[{"name":"Vlion Inc., Shanghai, China"}],"role":[{"vocabulary":"crossref","role":"author"}]}],"member":"320","published-online":{"date-parts":[[2017,2,2]]},"reference":[{"key":"e_1_3_2_1_1_1","volume-title":"UAI","author":"Amin K.","year":"2012","unstructured":"K. Amin , M. Kearns , P. Key , and A. Schwaighofer . Budget optimization for sponsored search: Censored learning in mdps . UAI , 2012 . K. Amin, M. Kearns, P. Key, and A. Schwaighofer. Budget optimization for sponsored search: Censored learning in mdps. UAI, 2012."},{"key":"e_1_3_2_1_2_1","first-page":"369","volume-title":"NIPS","author":"Boyan J.","year":"1995","unstructured":"J. Boyan and A. W. Moore . Generalization in reinforcement learning: Safely approximating the value function . NIPS , pages 369 -- 376 , 1995 . J. Boyan and A. W. Moore. Generalization in reinforcement learning: Safely approximating the value function. NIPS, pages 369--376, 1995."},{"key":"e_1_3_2_1_3_1","doi-asserted-by":"publisher","DOI":"10.1145\/2623330.2623634"},{"key":"e_1_3_2_1_4_1","doi-asserted-by":"publisher","DOI":"10.1145\/2020408.2020604"},{"key":"e_1_3_2_1_5_1","doi-asserted-by":"publisher","DOI":"10.1145\/2020408.2020454"},{"key":"e_1_3_2_1_6_1","doi-asserted-by":"publisher","DOI":"10.3386\/w11765"},{"key":"e_1_3_2_1_7_1","volume-title":"The arrival of real-time bidding","year":"2011","unstructured":"Google. The arrival of real-time bidding , 2011 . Google. The arrival of real-time bidding, 2011."},{"key":"e_1_3_2_1_8_1","doi-asserted-by":"publisher","DOI":"10.1016\/B978-1-55860-377-6.50040-2"},{"key":"e_1_3_2_1_9_1","volume-title":"ICML","author":"Graepel T.","year":"2010","unstructured":"T. Graepel , J. Q. Candela , T. Borchert , and R. Herbrich . Web-scale bayesian click-through rate prediction for sponsored search advertising in microsoft's bing search engine . In ICML , 2010 . T. Graepel, J. Q. Candela, T. Borchert, and R. Herbrich. Web-scale bayesian click-through rate prediction for sponsored search advertising in microsoft's bing search engine. In ICML, 2010."},{"key":"e_1_3_2_1_10_1","doi-asserted-by":"publisher","DOI":"10.1145\/2648584.2648589"},{"key":"e_1_3_2_1_11_1","doi-asserted-by":"publisher","DOI":"10.1145\/1386790.1386794"},{"key":"e_1_3_2_1_12_1","volume-title":"Academic press","author":"Krishna V.","year":"2009","unstructured":"V. Krishna . Auction theory. Academic press , 2009 . V. Krishna. Auction theory. Academic press, 2009."},{"key":"e_1_3_2_1_13_1","doi-asserted-by":"publisher","DOI":"10.1145\/2501040.2501979"},{"key":"e_1_3_2_1_14_1","doi-asserted-by":"publisher","DOI":"10.1145\/2339530.2339651"},{"key":"e_1_3_2_1_15_1","doi-asserted-by":"publisher","DOI":"10.1007\/978-3-319-06608-0_37"},{"key":"e_1_3_2_1_16_1","doi-asserted-by":"publisher","DOI":"10.1145\/2487575.2488200"},{"key":"e_1_3_2_1_17_1","doi-asserted-by":"publisher","DOI":"10.1145\/2556195.2556240"},{"key":"e_1_3_2_1_18_1","doi-asserted-by":"publisher","DOI":"10.1145\/2339530.2339655"},{"key":"e_1_3_2_1_19_1","doi-asserted-by":"publisher","DOI":"10.1038\/nature16961"},{"key":"e_1_3_2_1_20_1","doi-asserted-by":"publisher","DOI":"10.1145\/1143844.1143955"},{"key":"e_1_3_2_1_21_1","doi-asserted-by":"publisher","DOI":"10.5555\/551283"},{"key":"e_1_3_2_1_22_1","doi-asserted-by":"publisher","DOI":"10.1145\/1553374.1553504"},{"key":"e_1_3_2_1_23_1","doi-asserted-by":"publisher","DOI":"10.1145\/2684822.2697041"},{"key":"e_1_3_2_1_24_1","volume-title":"Display advertising with real-time bidding (RTB) and behavioural targeting. arXiv preprint arXiv:1610.03013","author":"Wang J.","year":"2016","unstructured":"J. Wang , W. Zhang , and S. Yuan . Display advertising with real-time bidding (RTB) and behavioural targeting. arXiv preprint arXiv:1610.03013 , 2016 . J. Wang, W. Zhang, and S. Yuan. Display advertising with real-time bidding (RTB) and behavioural targeting. arXiv preprint arXiv:1610.03013, 2016."},{"key":"e_1_3_2_1_25_1","doi-asserted-by":"publisher","DOI":"10.1007\/978-3-319-46128-1_8"},{"key":"e_1_3_2_1_26_1","volume-title":"Q-learning. Machine learning, 8(3--4):279--292","author":"Watkins C. J.","year":"1992","unstructured":"C. J. Watkins and P. Dayan . Q-learning. Machine learning, 8(3--4):279--292 , 1992 . C. J. Watkins and P. Dayan. Q-learning. Machine learning, 8(3--4):279--292, 1992."},{"key":"e_1_3_2_1_27_1","doi-asserted-by":"publisher","DOI":"10.1145\/2783258.2783276"},{"key":"e_1_3_2_1_28_1","doi-asserted-by":"publisher","DOI":"10.1145\/2783258.2788615"},{"key":"e_1_3_2_1_29_1","doi-asserted-by":"publisher","DOI":"10.1145\/2396761.2396828"},{"key":"e_1_3_2_1_30_1","doi-asserted-by":"publisher","DOI":"10.1145\/2501040.2501980"},{"key":"e_1_3_2_1_31_1","doi-asserted-by":"publisher","DOI":"10.1145\/2783258.2783269"},{"key":"e_1_3_2_1_32_1","doi-asserted-by":"publisher","DOI":"10.1145\/2623330.2623633"},{"key":"e_1_3_2_1_33_1","doi-asserted-by":"publisher","DOI":"10.1145\/2939672.2939713"}],"event":{"name":"WSDM 2017: Tenth ACM International Conference on Web Search and Data Mining","location":"Cambridge United Kingdom","acronym":"WSDM 2017","sponsor":["SIGMOD ACM Special Interest Group on Management of Data","SIGWEB ACM Special Interest Group on Hypertext, Hypermedia, and Web","SIGKDD ACM Special Interest Group on Knowledge Discovery in Data","SIGIR ACM Special Interest Group on Information Retrieval"]},"container-title":["Proceedings of the Tenth ACM International Conference on Web Search and Data Mining"],"original-title":[],"link":[{"URL":"https:\/\/dl.acm.org\/doi\/10.1145\/3018661.3018702","content-type":"unspecified","content-version":"vor","intended-application":"text-mining"},{"URL":"https:\/\/dl.acm.org\/doi\/pdf\/10.1145\/3018661.3018702","content-type":"unspecified","content-version":"vor","intended-application":"similarity-checking"}],"deposited":{"date-parts":[[2025,6,18]],"date-time":"2025-06-18T04:24:09Z","timestamp":1750220649000},"score":1,"resource":{"primary":{"URL":"https:\/\/dl.acm.org\/doi\/10.1145\/3018661.3018702"}},"subtitle":[],"short-title":[],"issued":{"date-parts":[[2017,2,2]]},"references-count":33,"alternative-id":["10.1145\/3018661.3018702","10.1145\/3018661"],"URL":"https:\/\/doi.org\/10.1145\/3018661.3018702","relation":{},"subject":[],"published":{"date-parts":[[2017,2,2]]},"assertion":[{"value":"2017-02-02","order":2,"name":"published","label":"Published","group":{"name":"publication_history","label":"Publication History"}}]}}