{"status":"ok","message-type":"work","message-version":"1.0.0","message":{"indexed":{"date-parts":[[2025,9,11]],"date-time":"2025-09-11T19:08:38Z","timestamp":1757617718117,"version":"3.44.0"},"publisher-location":"New York, NY, USA","reference-count":47,"publisher":"ACM","content-domain":{"domain":["dl.acm.org"],"crossmark-restriction":true},"short-container-title":[],"published-print":{"date-parts":[[2025,9,22]]},"DOI":"10.1145\/3705328.3759308","type":"proceedings-article","created":{"date-parts":[[2025,9,6]],"date-time":"2025-09-06T10:46:13Z","timestamp":1757155573000},"page":"1228-1233","update-policy":"https:\/\/doi.org\/10.1145\/crossmark-policy","source":"Crossref","is-referenced-by-count":0,"title":["Meta Off-Policy Estimation"],"prefix":"10.1145","author":[{"ORCID":"https:\/\/orcid.org\/0000-0001-6256-5814","authenticated-orcid":false,"given":"Olivier","family":"Jeunen","sequence":"first","affiliation":[{"name":"Aampe, Antwerp, Belgium"}]}],"member":"320","published-online":{"date-parts":[[2025,9,7]]},"reference":[{"key":"e_1_3_3_1_2_2","doi-asserted-by":"crossref","unstructured":"Alexander\u00a0C. Aitken. 1936. IV.\u2014On Least Squares and Linear Combination of Observations. Proc. of the Royal Society of Edinburgh 55 (1936) 42\u201348.","DOI":"10.1017\/S0370164600014346"},{"key":"e_1_3_3_1_3_2","doi-asserted-by":"crossref","unstructured":"Leo Breiman. 2001. Random Forests. Machine Learning 45 1 (2001) 5\u201332.","DOI":"10.1023\/A:1010933404324"},{"key":"e_1_3_3_1_4_2","volume-title":"Advances in Neural Information Processing Systems","author":"Chapelle Olivier","year":"2011","unstructured":"Olivier Chapelle and Lihong Li. 2011. An Empirical Evaluation of Thompson Sampling. In Advances in Neural Information Processing Systems , Vol.\u00a024. Curran Associates, Inc."},{"key":"e_1_3_3_1_5_2","doi-asserted-by":"publisher","DOI":"10.1145\/3289600.3290999"},{"key":"e_1_3_3_1_6_2","doi-asserted-by":"publisher","DOI":"10.7758\/9781610448864"},{"key":"e_1_3_3_1_7_2","doi-asserted-by":"crossref","unstructured":"Olaf\u00a0M Dekkers. 2018. Meta-analysis: Key features potentials and misunderstandings. Res Pract Thromb Haemost 2 4 (Oct. 2018) 658\u2013663.","DOI":"10.1002\/rth2.12153"},{"key":"e_1_3_3_1_8_2","doi-asserted-by":"crossref","unstructured":"Miroslav Dud\u00edk Dumitru Erhan John Langford and Lihong Li. 2014. Doubly Robust Policy Evaluation and Optimization. Statist. Sci. 29 4 (2014) 485\u2013511.","DOI":"10.1214\/14-STS500"},{"key":"e_1_3_3_1_9_2","doi-asserted-by":"crossref","unstructured":"V\u00edctor Elvira Luca Martino and Christian\u00a0P. Robert. 2022. Rethinking the Effective Sample Size. International Statistical Review 90 3 (2022) 525\u2013550.","DOI":"10.1111\/insr.12500"},{"key":"e_1_3_3_1_10_2","series-title":"Proc. of Machine Learning Research","first-page":"1447","volume-title":"Proc. of the 35th International Conference on Machine Learning","volume":"80","author":"Farajtabar Mehrdad","year":"2018","unstructured":"Mehrdad Farajtabar, Yinlam Chow, and Mohammad Ghavamzadeh. 2018. More Robust Doubly Robust Off-policy Evaluation. In Proc. of the 35th International Conference on Machine Learning(Proc. of Machine Learning Research, Vol.\u00a080). PMLR, 1447\u20131456. https:\/\/proceedings.mlr.press\/v80\/farajtabar18a.html"},{"key":"e_1_3_3_1_11_2","unstructured":"Nicol\u00f2 Felicioni Michael Benigni and Maurizio\u00a0Ferrari Dacrema. 2024. Automated Off-Policy Estimator Selection via Supervised Learning. arxiv:https:\/\/arXiv.org\/abs\/2406.18022\u00a0[cs.LG]"},{"key":"e_1_3_3_1_12_2","series-title":"Proc. of Machine Learning Research","first-page":"1050","volume-title":"Proc. of The 33rd International Conference on Machine Learning","volume":"48","author":"Gal Yarin","year":"2016","unstructured":"Yarin Gal and Zoubin Ghahramani. 2016. Dropout as a Bayesian Approximation: Representing Model Uncertainty in Deep Learning. In Proc. of The 33rd International Conference on Machine Learning(Proc. of Machine Learning Research, Vol.\u00a048). PMLR, 1050\u20131059."},{"key":"e_1_3_3_1_13_2","doi-asserted-by":"publisher","DOI":"10.1145\/2645710.2645745"},{"key":"e_1_3_3_1_14_2","doi-asserted-by":"publisher","DOI":"10.1145\/3159652.3159687"},{"key":"e_1_3_3_1_15_2","doi-asserted-by":"publisher","DOI":"10.1145\/3289600.3291027"},{"key":"e_1_3_3_1_16_2","doi-asserted-by":"publisher","DOI":"10.1145\/3616855.3636451"},{"key":"e_1_3_3_1_17_2","doi-asserted-by":"publisher","DOI":"10.1145\/3640457.3688105"},{"key":"e_1_3_3_1_18_2","doi-asserted-by":"crossref","unstructured":"Daniel\u00a0G. Horvitz and Donovan\u00a0J. Thompson. 1952. A Generalization of Sampling Without Replacement From a Finite Universe. J. Amer. Statist. Assoc. 47 260 (1952) 663\u2013685. http:\/\/www.jstor.org\/stable\/2280784","DOI":"10.1080\/01621459.1952.10483446"},{"key":"e_1_3_3_1_19_2","doi-asserted-by":"crossref","unstructured":"Edward\u00a0L. Ionides. 2008. Truncated Importance Sampling. Journal of Computational and Graphical Statistics 17 2 (2008) 295\u2013311.","DOI":"10.1198\/106186008X320456"},{"key":"e_1_3_3_1_20_2","unstructured":"Olivier Jeunen. 2021. Offline Approaches to Recommendation with Online Success. Ph.\u00a0D. Dissertation. University of Antwerp."},{"key":"e_1_3_3_1_21_2","doi-asserted-by":"publisher","DOI":"10.1145\/3604915.3608777"},{"key":"e_1_3_3_1_22_2","doi-asserted-by":"crossref","unstructured":"Olivier Jeunen. 2025. Counterfactual Inference under Thompson Sampling. arxiv:https:\/\/arXiv.org\/abs\/2504.08773\u00a0[cs.IR]","DOI":"10.1145\/3705328.3748011"},{"key":"e_1_3_3_1_23_2","series-title":"(REVEAL \u201920)","volume-title":"REVEAL Workshop at ACM RecSys \u201920","author":"Jeunen Olivier","year":"2020","unstructured":"Olivier Jeunen and Bart Goethals. 2020. An Empirical Evaluation of Doubly Robust Learning for Recommendation. In REVEAL Workshop at ACM RecSys \u201920(REVEAL \u201920)."},{"key":"e_1_3_3_1_24_2","doi-asserted-by":"publisher","DOI":"10.1145\/3460231.3474247"},{"key":"e_1_3_3_1_25_2","doi-asserted-by":"crossref","unstructured":"Olivier Jeunen and Bart Goethals. 2023. Pessimistic Decision-Making for Recommender Systems. ACM Trans. Recomm. Syst. 1 1 Article 4 (feb 2023) 27\u00a0pages.","DOI":"10.1145\/3568029"},{"key":"e_1_3_3_1_26_2","doi-asserted-by":"publisher","DOI":"10.1145\/3640457.3688132"},{"key":"e_1_3_3_1_27_2","doi-asserted-by":"publisher","DOI":"10.1145\/3580305.3599877"},{"key":"e_1_3_3_1_28_2","doi-asserted-by":"publisher","DOI":"10.1145\/3637528.3671687"},{"key":"e_1_3_3_1_29_2","doi-asserted-by":"publisher","DOI":"10.1145\/3640457.3688162"},{"key":"e_1_3_3_1_30_2","series-title":"(REVEAL \u201918)","volume-title":"Workshop on Offline Evaluation for Recommender Systems at RecSys \u201918","author":"Jeunen Olivier","year":"2018","unstructured":"Olivier Jeunen, Koen Verstrepen, and Bart Goethals. 2018. Fair Offline Evaluation Methodologies for Implicit-Feedback Recommender Systems with MNAR Data. In Workshop on Offline Evaluation for Recommender Systems at RecSys \u201918(REVEAL \u201918)."},{"key":"e_1_3_3_1_31_2","doi-asserted-by":"crossref","unstructured":"Thorsten Joachims Ben London Yi Su Adith Swaminathan and Lequn Wang. 2021. Recommendations as Treatments. AI Magazine 42 3 (Nov. 2021) 19\u201330.","DOI":"10.1609\/aimag.v42i3.18141"},{"key":"e_1_3_3_1_32_2","volume-title":"NIPS What If Workshop on Inference and Learning of Hypothetical and Counterfactual Interventions in Complex Systems","author":"Lefortier Damien","year":"2016","unstructured":"Damien Lefortier, Adith Swaminathan, Xiaotao Gu, Thorsten Joachims, and Maarten de Rijke. 2016. Large-scale Validation of Counterfactual Learning Methods: A Test-Bed. In NIPS What If Workshop on Inference and Learning of Hypothetical and Counterfactual Interventions in Complex Systems. arxiv:https:\/\/arXiv.org\/abs\/1612.00367\u00a0[cs.LG]"},{"key":"e_1_3_3_1_33_2","series-title":"(CONSEQUENCES \u201923)","volume-title":"CONSEQUENCES Workshop at ACM RecSys \u201923","author":"Lichtenberg Jan\u00a0Malte","year":"2023","unstructured":"Jan\u00a0Malte Lichtenberg, Alexander Buchholz, Giuseppe\u00a0Di Benedetto, Matteo Ruffini, and Ben London. 2023. Double Clipping: Less-Biased Variance Reduction in Off-Policy Evaluation. In CONSEQUENCES Workshop at ACM RecSys \u201923(CONSEQUENCES \u201923). arxiv:https:\/\/arXiv.org\/abs\/2309.01120\u00a0[cs.LG]"},{"key":"e_1_3_3_1_34_2","series-title":"(CONSEQUENCES \u201923)","volume-title":"CONSEQUENCES Workshop at ACM RecSys \u201923","author":"London Ben","year":"2023","unstructured":"Ben London, Alexander Buchholz, Giuseppe Di\u00a0Benedetto, Jan\u00a0Malte Lichtenberg, Yannik Stein, and Thorsten Joachims. 2023. Self-Normalized Off-Policy Estimators for Ranking. In CONSEQUENCES Workshop at ACM RecSys \u201923(CONSEQUENCES \u201923)."},{"key":"e_1_3_3_1_35_2","first-page":"103652","volume-title":"Advances in Neural Information Processing Systems","author":"Nie Allen","year":"2024","unstructured":"Allen Nie, Yash Chandak, Christina\u00a0J. Yuan, Anirudhan Badrinath, Yannis Flet-Berliac, and Emma Brunskill. 2024. OPERA: Automatic Offline Policy Evaluation with Re-weighted Aggregates of Multiple Estimators. In Advances in Neural Information Processing Systems , A.\u00a0Globerson, L.\u00a0Mackey, D.\u00a0Belgrave, A.\u00a0Fan, U.\u00a0Paquet, J.\u00a0Tomczak, and C.\u00a0Zhang (Eds.), Vol.\u00a037. Curran Associates, Inc., 103652\u2013103680."},{"key":"e_1_3_3_1_36_2","volume-title":"Monte Carlo theory, methods and examples","author":"Owen Art\u00a0B.","year":"2013","unstructured":"Art\u00a0B. Owen. 2013. Monte Carlo theory, methods and examples."},{"key":"e_1_3_3_1_37_2","doi-asserted-by":"publisher","unstructured":"Karl Pearson. 1904. Report on Certain Enteric Fever Inoculation Statistics. BMJ 2 2288 (1904) 1243\u20131246. 10.1136\/bmj.2.2288.1243","DOI":"10.1136\/bmj.2.2288.1243"},{"key":"e_1_3_3_1_38_2","unstructured":"Fabian Pedregosa Ga\u00ebl Varoquaux Alexandre Gramfort Vincent Michel Bertrand Thirion Olivier Grisel Mathieu Blondel Peter Prettenhofer Ron Weiss Vincent Dubourg Jake Vanderplas Alexandre Passos David Cournapeau Matthieu Brucher Matthieu Perrot and \u00c9douard Duchesnay. 2011. Scikit-learn: Machine Learning in Python. Journal of Machine Learning Research 12 85 (2011) 2825\u20132830. http:\/\/jmlr.org\/papers\/v12\/pedregosa11a.html"},{"key":"e_1_3_3_1_39_2","volume-title":"RecSys REVEAL Workshop on Offline Evaluation for Recommender Systems","author":"Rohde David","year":"2018","unstructured":"David Rohde, Stephen Bonner, Travis Dunlop, Flavian Vasile, and Alexandros Karatzoglou. 2018. RecoGym: A Reinforcement Learning Environment for the problem of Product Recommendation in Online Advertising. In RecSys REVEAL Workshop on Offline Evaluation for Recommender Systems."},{"key":"e_1_3_3_1_40_2","doi-asserted-by":"publisher","DOI":"10.1145\/2959100.2959176"},{"key":"e_1_3_3_1_41_2","doi-asserted-by":"publisher","DOI":"10.1145\/3616855.3635846"},{"key":"e_1_3_3_1_42_2","volume-title":"Proc. of the Neural Information Processing Systems Track on Datasets and Benchmarks","author":"Saito Yuta","year":"2021","unstructured":"Yuta Saito, Shunsuke Aihara, Megumi Matsutani, and Yusuke Narita. 2021. Open Bandit Dataset and Pipeline: Towards Realistic and Reproducible Off-Policy Evaluation. In Proc. of the Neural Information Processing Systems Track on Datasets and Benchmarks , Vol.\u00a01."},{"key":"e_1_3_3_1_43_2","doi-asserted-by":"publisher","DOI":"10.1145\/3460231.3473320"},{"key":"e_1_3_3_1_44_2","series-title":"Proc. of Machine Learning Research","first-page":"9167","volume-title":"Proc. of the 37th International Conference on Machine Learning","volume":"119","author":"Su Yi","year":"2020","unstructured":"Yi Su, Maria Dimakopoulou, Akshay Krishnamurthy, and Miroslav Dudik. 2020. Doubly robust off-policy evaluation with shrinkage. In Proc. of the 37th International Conference on Machine Learning(Proc. of Machine Learning Research, Vol.\u00a0119). PMLR, 9167\u20139176. https:\/\/proceedings.mlr.press\/v119\/su20a.html"},{"key":"e_1_3_3_1_45_2","series-title":"Proc. of Machine Learning Research","first-page":"6005","volume-title":"Proc. of the 36th International Conference on Machine Learning","volume":"97","author":"Su Yi","year":"2019","unstructured":"Yi Su, Lequn Wang, Michele Santacatterina, and Thorsten Joachims. 2019. CAB: Continuous Adaptive Blending for Policy Evaluation and Learning. In Proc. of the 36th International Conference on Machine Learning(Proc. of Machine Learning Research, Vol.\u00a097). PMLR, 6005\u20136014."},{"key":"e_1_3_3_1_46_2","volume-title":"Advances in Neural Information Processing Systems","author":"Swaminathan Adith","year":"2015","unstructured":"Adith Swaminathan and Thorsten Joachims. 2015. The Self-Normalized Estimator for Counterfactual Learning. In Advances in Neural Information Processing Systems , Vol.\u00a028. Curran Associates, Inc."},{"key":"e_1_3_3_1_47_2","doi-asserted-by":"crossref","unstructured":"Takuma Udagawa Haruka Kiyohara Yusuke Narita Yuta Saito and Kei Tateno. 2023. Policy-Adaptive Estimator Selection for Off-Policy Evaluation. Proc. of the AAAI Conference on Artificial Intelligence 37 8 (Jun. 2023) 10025\u201310033.","DOI":"10.1609\/aaai.v37i8.26195"},{"key":"e_1_3_3_1_48_2","doi-asserted-by":"publisher","DOI":"10.1145\/3340631.3398666"}],"event":{"name":"RecSys '25: Nineteenth ACM Conference on Recommender Systems","sponsor":["SIGCHI ACM Special Interest Group on Computer-Human Interaction","SIGAI ACM Special Interest Group on Artificial Intelligence","SIGIR ACM Special Interest Group on Information Retrieval","SIGKDD ACM Special Interest Group on Knowledge Discovery in Data","SIGWEB ACM Special Interest Group on Hypertext, Hypermedia, and Web"],"location":"Prague Czech Republic","acronym":"RecSys '25"},"container-title":["Proceedings of the Nineteenth ACM Conference on Recommender Systems"],"original-title":[],"link":[{"URL":"https:\/\/dl.acm.org\/doi\/pdf\/10.1145\/3705328.3759308","content-type":"unspecified","content-version":"vor","intended-application":"similarity-checking"}],"deposited":{"date-parts":[[2025,9,6]],"date-time":"2025-09-06T11:43:11Z","timestamp":1757158991000},"score":1,"resource":{"primary":{"URL":"https:\/\/dl.acm.org\/doi\/10.1145\/3705328.3759308"}},"subtitle":[],"short-title":[],"issued":{"date-parts":[[2025,9,7]]},"references-count":47,"alternative-id":["10.1145\/3705328.3759308","10.1145\/3705328"],"URL":"https:\/\/doi.org\/10.1145\/3705328.3759308","relation":{},"subject":[],"published":{"date-parts":[[2025,9,7]]},"assertion":[{"value":"2025-09-07","order":3,"name":"published","label":"Published","group":{"name":"publication_history","label":"Publication History"}}]}}