{"status":"ok","message-type":"work","message-version":"1.0.0","message":{"indexed":{"date-parts":[[2026,4,14]],"date-time":"2026-04-14T00:05:21Z","timestamp":1776125121990,"version":"3.50.1"},"publisher-location":"New York, NY, USA","reference-count":32,"publisher":"ACM","license":[{"start":{"date-parts":[[2023,8,4]],"date-time":"2023-08-04T00:00:00Z","timestamp":1691107200000},"content-version":"vor","delay-in-days":0,"URL":"https:\/\/creativecommons.org\/licenses\/by\/4.0\/"}],"content-domain":{"domain":["dl.acm.org"],"crossmark-restriction":true},"short-container-title":[],"published-print":{"date-parts":[[2023,8,6]]},"DOI":"10.1145\/3580305.3599933","type":"proceedings-article","created":{"date-parts":[[2023,8,4]],"date-time":"2023-08-04T18:13:58Z","timestamp":1691172838000},"page":"4068-4077","update-policy":"https:\/\/doi.org\/10.1145\/crossmark-policy","source":"Crossref","is-referenced-by-count":12,"title":["Yggdrasil Decision Forests: A Fast and Extensible Decision Forests Library"],"prefix":"10.1145","author":[{"ORCID":"https:\/\/orcid.org\/0009-0004-2736-2869","authenticated-orcid":false,"given":"Mathieu","family":"Guillame-Bert","sequence":"first","affiliation":[{"name":"Google, Zurich, Switzerland"}]},{"ORCID":"https:\/\/orcid.org\/0000-0002-2469-8242","authenticated-orcid":false,"given":"Sebastian","family":"Bruch","sequence":"additional","affiliation":[{"name":"Pinecone, New York, USA"}]},{"ORCID":"https:\/\/orcid.org\/0009-0003-2663-9371","authenticated-orcid":false,"given":"Richard","family":"Stotz","sequence":"additional","affiliation":[{"name":"Google, Zurich, Switzerland"}]},{"ORCID":"https:\/\/orcid.org\/0009-0006-0403-3119","authenticated-orcid":false,"given":"Jan","family":"Pfeifer","sequence":"additional","affiliation":[{"name":"Google, Zurich, Switzerland"}]}],"member":"320","published-online":{"date-parts":[[2023,8,4]]},"reference":[{"key":"e_1_3_2_2_1_1","volume-title":"Tensorflow: A system for large-scale machine learning. In 12th {USENIX} Symposium on Operating Systems Design and Implementation ({OSDI} 16). 265--283.","author":"Abadi Mart\u00edn","year":"2016","unstructured":"Mart\u00edn Abadi, Paul Barham, Jianmin Chen, Zhifeng Chen, Andy Davis, Jeffrey Dean, Matthieu Devin, Sanjay Ghemawat, Geoffrey Irving, Michael Isard, et al. 2016. Tensorflow: A system for large-scale machine learning. In 12th {USENIX} Symposium on Operating Systems Design and Implementation ({OSDI} 16). 265--283."},{"key":"e_1_3_2_2_2_1","doi-asserted-by":"publisher","DOI":"10.1109\/TKDE.2013.73"},{"key":"e_1_3_2_2_3_1","volume-title":"Machine Learning","volume":"45","author":"Breiman L","year":"2001","unstructured":"L Breiman. 2001. Random Forests. Machine Learning , Vol. 45 (10 2001), 5--32."},{"key":"e_1_3_2_2_4_1","volume-title":"Classification and regression trees","author":"Breiman Leo","unstructured":"Leo Breiman, Jerome H Friedman, Richard A Olshen, and Charles J Stone. 1984. Classification and regression trees. Routledge."},{"key":"e_1_3_2_2_5_1","unstructured":"Sebastian Bruch Jan Pfeifer and Mathieu Guillame-bert. 2020. Learning Representations for Axis-Aligned Decision Forests through Input Perturbation."},{"key":"e_1_3_2_2_6_1","volume-title":"ECML PKDD Workshop: Languages for Data Mining and Machine Learning. 108--122","author":"Buitinck Lars","year":"2013","unstructured":"Lars Buitinck, Gilles Louppe, Mathieu Blondel, Fabian Pedregosa, Andreas Mueller, Olivier Grisel, Vlad Niculae, Peter Prettenhofer, Alexandre Gramfort, Jaques Grobler, Robert Layton, Jake VanderPlas, Arnaud Joly, Brian Holt, and Ga\u00ebl Varoquaux. 2013. API design for machine learning software: experiences from the scikit-learn project. In ECML PKDD Workshop: Languages for Data Mining and Machine Learning. 108--122."},{"key":"e_1_3_2_2_7_1","doi-asserted-by":"publisher","DOI":"10.1145\/2939672.2939785"},{"key":"e_1_3_2_2_8_1","doi-asserted-by":"publisher","DOI":"10.1080\/01621459.1958.10501479"},{"key":"e_1_3_2_2_9_1","doi-asserted-by":"publisher","DOI":"10.1214\/aos\/1013203451"},{"key":"e_1_3_2_2_10_1","doi-asserted-by":"publisher","unstructured":"Mathieu Guillame-Bert Sebastian Bruch Petr Mitrichev Petr Mikheev and Jan Pfeifer. 2020. Modeling Text with Decision Forests using Categorical-Set Splits. https:\/\/doi.org\/10.48550\/ARXIV.2009.09991","DOI":"10.48550\/ARXIV.2009.09991"},{"key":"e_1_3_2_2_11_1","volume-title":"Exact Distributed Training: Random Forest with Billions of Examples. CoRR","author":"Guillame-Bert Mathieu","year":"2018","unstructured":"Mathieu Guillame-Bert and Olivier Teytaud. 2018. Exact Distributed Training: Random Forest with Billions of Examples. CoRR, Vol. abs\/1804.06755 (2018).[arXiv]1804.06755"},{"key":"e_1_3_2_2_12_1","doi-asserted-by":"publisher","DOI":"10.1038\/s41586-020-2649-2"},{"key":"e_1_3_2_2_13_1","volume-title":"Lightgbm: A highly efficient gradient boosting decision tree. Advances in neural information processing systems","author":"Ke Guolin","year":"2017","unstructured":"Guolin Ke, Qi Meng, Thomas Finley, Taifeng Wang, Wei Chen, Weidong Ma, Qiwei Ye, and Tie-Yan Liu. 2017. Lightgbm: A highly efficient gradient boosting decision tree. Advances in neural information processing systems, Vol. 30 (2017), 3146--3154."},{"key":"e_1_3_2_2_14_1","doi-asserted-by":"publisher","DOI":"10.1145\/3292500.3330858"},{"key":"e_1_3_2_2_15_1","volume-title":"Jerome Friedman.","author":"Charles J.","year":"1984","unstructured":"Charles J. Stone R.A. Olshen Leo Breiman, Jerome Friedman. 1984. Classification and Regression Trees. Chapman and Hall\/CRC."},{"key":"e_1_3_2_2_16_1","doi-asserted-by":"crossref","unstructured":"Pan Li Zhen Qin Xuanhui Wang and Don Metzler. 2019. Combining Decision Trees and Neural Networks for Learning-to-Rank in Personal Search.","DOI":"10.1145\/3292500.3330676"},{"key":"e_1_3_2_2_17_1","first-page":"18","article-title":"Classification and Regression by randomForest","volume":"2","author":"Liaw Andy","year":"2002","unstructured":"Andy Liaw and Matthew Wiener. 2002. Classification and Regression by randomForest. R News, Vol. 2, 3 (2002), 18--22.","journal-title":"R News"},{"key":"e_1_3_2_2_18_1","doi-asserted-by":"publisher","DOI":"10.1145\/2766462.2767733"},{"key":"e_1_3_2_2_19_1","volume-title":"Bazel build tool. https:\/\/bazel.build. [Online","author":"L\u00fctkebohle Ingo","year":"2022","unstructured":"Ingo L\u00fctkebohle. 2015. Bazel build tool. https:\/\/bazel.build. [Online; accessed 12-September-2022]."},{"key":"e_1_3_2_2_20_1","unstructured":"Richard Stotz Luiz GUStavo Martins Ashley Oldacre Jocelyn Becker Glenn Cameron Mathieu Guillame-Bert Jan Pfeifer. [n. d.]. Simple ML for Sheets. ([n. d.]). https:\/\/simplemlforsheets.com\/"},{"key":"e_1_3_2_2_21_1","doi-asserted-by":"publisher","DOI":"10.1007\/978-3-319-71273-4_44"},{"key":"e_1_3_2_2_22_1","volume-title":"Neural oblivious decision ensembles for deep learning on tabular data. arXiv preprint arXiv:1909.06312","author":"Popov Sergei","year":"2019","unstructured":"Sergei Popov, Stanislav Morozov, and Artem Babenko. 2019. Neural oblivious decision ensembles for deep learning on tabular data. arXiv preprint arXiv:1909.06312 (2019)."},{"key":"e_1_3_2_2_23_1","unstructured":"John Quinlan. 1994. C4. 5: Programs for machine learning."},{"key":"e_1_3_2_2_24_1","volume-title":"R: A Language and Environment for Statistical Computing","author":"Team R Core","year":"2022","unstructured":"R Core Team. 2022. R: A Language and Environment for Statistical Computing. R Foundation for Statistical Computing, Vienna, Austria. https:\/\/www.R-project.org\/"},{"key":"e_1_3_2_2_25_1","volume-title":"Empirical inference","author":"Schapire Robert E","unstructured":"Robert E Schapire. 2013. Explaining adaboost. In Empirical inference. Springer, 37--52."},{"key":"e_1_3_2_2_26_1","unstructured":"Haijia Shi. 2007. Best-first Decision Tree Learning."},{"key":"e_1_3_2_2_27_1","doi-asserted-by":"publisher","DOI":"10.1145\/503271.503224"},{"key":"e_1_3_2_2_28_1","unstructured":"Beth Atkinson Terry Therneau and Brian Ripley. [n. d.]. rpart: Recursive Partitioning and Regression Trees. ( [n. d.]). https:\/\/CRAN.R-project.org\/package=rpart"},{"key":"e_1_3_2_2_29_1","article-title":"Sparse Projection Oblique Randomer Forests","volume":"21","author":"Tomita Tyler M.","year":"2020","unstructured":"Tyler M. Tomita, James Browne, Cencheng Shen, Jaewon Chung, Jesse L. Patsolic, Benjamin Falk, Carey E. Priebe, Jason Yim, Randal Burns, Mauro Maggioni, and Joshua T. Vogelstein. 2020. Sparse Projection Oblique Randomer Forests. J. Mach. Learn. Res., Vol. 21, 1, Article 104 (jan 2020), 39 pages.","journal-title":"J. Mach. Learn. Res."},{"key":"e_1_3_2_2_30_1","doi-asserted-by":"publisher","DOI":"10.1145\/2641190.2641198"},{"key":"e_1_3_2_2_31_1","doi-asserted-by":"publisher","DOI":"10.25080\/Majora-92bf1922-00a"},{"key":"e_1_3_2_2_32_1","doi-asserted-by":"publisher","DOI":"10.18637\/jss.v077.i01"}],"event":{"name":"KDD '23: The 29th ACM SIGKDD Conference on Knowledge Discovery and Data Mining","location":"Long Beach CA USA","acronym":"KDD '23","sponsor":["SIGMOD ACM Special Interest Group on Management of Data","SIGKDD ACM Special Interest Group on Knowledge Discovery in Data"]},"container-title":["Proceedings of the 29th ACM SIGKDD Conference on Knowledge Discovery and Data Mining"],"original-title":[],"link":[{"URL":"https:\/\/dl.acm.org\/doi\/10.1145\/3580305.3599933","content-type":"unspecified","content-version":"vor","intended-application":"text-mining"},{"URL":"https:\/\/dl.acm.org\/doi\/pdf\/10.1145\/3580305.3599933","content-type":"unspecified","content-version":"vor","intended-application":"similarity-checking"}],"deposited":{"date-parts":[[2025,6,17]],"date-time":"2025-06-17T16:37:42Z","timestamp":1750178262000},"score":1,"resource":{"primary":{"URL":"https:\/\/dl.acm.org\/doi\/10.1145\/3580305.3599933"}},"subtitle":[],"short-title":[],"issued":{"date-parts":[[2023,8,4]]},"references-count":32,"alternative-id":["10.1145\/3580305.3599933","10.1145\/3580305"],"URL":"https:\/\/doi.org\/10.1145\/3580305.3599933","relation":{},"subject":[],"published":{"date-parts":[[2023,8,4]]},"assertion":[{"value":"2023-08-04","order":2,"name":"published","label":"Published","group":{"name":"publication_history","label":"Publication History"}}]}}