{"status":"ok","message-type":"work","message-version":"1.0.0","message":{"indexed":{"date-parts":[[2026,4,10]],"date-time":"2026-04-10T21:58:35Z","timestamp":1775858315015,"version":"3.50.1"},"publisher-location":"New York, NY, USA","reference-count":53,"publisher":"ACM","license":[{"start":{"date-parts":[[2019,7,25]],"date-time":"2019-07-25T00:00:00Z","timestamp":1564012800000},"content-version":"vor","delay-in-days":0,"URL":"https:\/\/www.acm.org\/publications\/policies\/copyright_policy#Background"}],"content-domain":{"domain":["dl.acm.org"],"crossmark-restriction":true},"short-container-title":[],"published-print":{"date-parts":[[2019,7,25]]},"DOI":"10.1145\/3292500.3330858","type":"proceedings-article","created":{"date-parts":[[2019,7,26]],"date-time":"2019-07-26T13:17:26Z","timestamp":1564147046000},"page":"384-394","update-policy":"https:\/\/doi.org\/10.1145\/crossmark-policy","source":"Crossref","is-referenced-by-count":118,"title":["DeepGBM"],"prefix":"10.1145","author":[{"given":"Guolin","family":"Ke","sequence":"first","affiliation":[{"name":"Microsoft Research, Beijing, China"}]},{"given":"Zhenhui","family":"Xu","sequence":"additional","affiliation":[{"name":"Peking University, Beijing, China"}]},{"given":"Jia","family":"Zhang","sequence":"additional","affiliation":[{"name":"Microsoft Research, Beijing, China"}]},{"given":"Jiang","family":"Bian","sequence":"additional","affiliation":[{"name":"Microsoft Research, Beijing, China"}]},{"given":"Tie-Yan","family":"Liu","sequence":"additional","affiliation":[{"name":"Microsoft Research, Beijing, China"}]}],"member":"320","published-online":{"date-parts":[[2019,7,25]]},"reference":[{"key":"e_1_3_2_1_1_1","doi-asserted-by":"publisher","DOI":"10.1145\/1148170.1148177"},{"key":"e_1_3_2_1_2_1","volume-title":"Initializing neural networks using decision trees. Computational learning theory and natural learning systems","author":"Banerjee Arunava","year":"1997"},{"key":"e_1_3_2_1_3_1","doi-asserted-by":"publisher","DOI":"10.1109\/34.709601"},{"key":"e_1_3_2_1_4_1","doi-asserted-by":"publisher","DOI":"10.5555\/1756006.1756034"},{"key":"e_1_3_2_1_5_1","volume-title":"Neural random forests. Sankhya A","author":"Biau G\u00e9rard","year":"2016"},{"key":"e_1_3_2_1_6_1","first-page":"23","article-title":"From ranknet to lambdarank to lambdamart: An overview","volume":"11","author":"Burges Christopher JC","year":"2010","journal-title":"Learning"},{"key":"e_1_3_2_1_7_1","doi-asserted-by":"publisher","DOI":"10.1145\/1273496.1273513"},{"key":"e_1_3_2_1_8_1","doi-asserted-by":"publisher","DOI":"10.1145\/2939672.2939785"},{"key":"e_1_3_2_1_9_1","doi-asserted-by":"publisher","DOI":"10.1145\/2988450.2988454"},{"key":"e_1_3_2_1_10_1","doi-asserted-by":"publisher","DOI":"10.1145\/2959100.2959190"},{"key":"e_1_3_2_1_11_1","doi-asserted-by":"publisher","DOI":"10.1145\/347090.347107"},{"key":"e_1_3_2_1_12_1","volume-title":"CatBoost: gradient boosting with categorical features support. arXiv preprint arXiv:1810.11363","author":"Dorogush Anna Veronika","year":"2018"},{"key":"e_1_3_2_1_13_1","doi-asserted-by":"publisher","DOI":"10.5555\/3091622.3091646"},{"key":"e_1_3_2_1_14_1","volume-title":"Multi-Layered Gradient Boosting Decision Trees. arXiv preprint arXiv:1806.00007","author":"Feng Ji","year":"2018"},{"key":"e_1_3_2_1_15_1","doi-asserted-by":"publisher","DOI":"10.5555\/2627435.2697065"},{"key":"e_1_3_2_1_16_1","volume-title":"The elements of statistical learning","author":"Friedman Jerome"},{"key":"e_1_3_2_1_17_1","volume-title":"Greedy function approximation: a gradient boosting machine. Annals of statistics","author":"Friedman Jerome H","year":"2001"},{"key":"e_1_3_2_1_18_1","doi-asserted-by":"publisher","DOI":"10.1145\/1083784.1083789"},{"key":"e_1_3_2_1_19_1","volume-title":"Deep learning","author":"Goodfellow Ian"},{"key":"e_1_3_2_1_20_1","doi-asserted-by":"publisher","DOI":"10.1109\/ICHIS.2005.43"},{"key":"e_1_3_2_1_21_1","volume-title":"Thomas Borchert, and Ralf Herbrich.","author":"Graepel Thore","year":"2010"},{"key":"e_1_3_2_1_22_1","volume-title":"Deepfm: a factorization-machine based neural network for ctr prediction. arXiv preprint arXiv:1703.04247","author":"Guo Huifeng","year":"2017"},{"key":"e_1_3_2_1_23_1","doi-asserted-by":"publisher","DOI":"10.1145\/2648584.2648589"},{"key":"e_1_3_2_1_24_1","volume-title":"Distilling the knowledge in a neural network. arXiv preprint arXiv:1503.02531","author":"Hinton Geoffrey","year":"2015"},{"key":"e_1_3_2_1_25_1","volume-title":"Deep neural network initialization with decision trees. ArXiv e-prints (July","author":"Humbird K. D.","year":"2017"},{"key":"e_1_3_2_1_26_1","volume-title":"Decision forests, convolutional networks and the models in-between. arXiv preprint arXiv:1603.01250","author":"Ioannou Yani","year":"2016"},{"key":"e_1_3_2_1_27_1","volume-title":"Batch normalization: Accelerating deep network training by reducing internal covariate shift. arXiv preprint arXiv:1502.03167","author":"Ioffe Sergey","year":"2015"},{"key":"e_1_3_2_1_28_1","doi-asserted-by":"publisher","DOI":"10.1145\/956750.956821"},{"key":"e_1_3_2_1_29_1","unstructured":"Guolin Ke Qi Meng Thomas Finley Taifeng Wang Wei Chen Weidong Ma Qiwei Ye and Tie-Yan Liu. 2017. LightGBM: A highly efficient gradient boosting decision tree. In Advances in Neural Information Processing Systems. 3146--3154.   Guolin Ke Qi Meng Thomas Finley Taifeng Wang Wei Chen Weidong Ma Qiwei Ye and Tie-Yan Liu. 2017. LightGBM: A highly efficient gradient boosting decision tree. In Advances in Neural Information Processing Systems. 3146--3154."},{"key":"e_1_3_2_1_30_1","doi-asserted-by":"publisher","DOI":"10.1109\/ICCV.2015.172"},{"key":"e_1_3_2_1_31_1","doi-asserted-by":"publisher","DOI":"10.1145\/3219819.3220033"},{"key":"e_1_3_2_1_32_1","volume-title":"xDeepFM: Combining Explicit and Implicit Feature Interactions for Recommender Systems. arXiv preprint arXiv:1803.05170","author":"Lian Jianxun","year":"2018"},{"key":"e_1_3_2_1_33_1","doi-asserted-by":"publisher","DOI":"10.1145\/3041021.3054192"},{"key":"e_1_3_2_1_34_1","unstructured":"Qi Meng Guolin Ke Taifeng Wang Wei Chen Qiwei Ye Zhi-Ming Ma and Tie-Yan Liu. 2016. A communication-efficient parallel algorithm for decision tree. In Advances in Neural Information Processing Systems. 1279--1287.   Qi Meng Guolin Ke Taifeng Wang Wei Chen Qiwei Ye Zhi-Ming Ma and Tie-Yan Liu. 2016. A communication-efficient parallel algorithm for decision tree. In Advances in Neural Information Processing Systems. 1279--1287."},{"key":"e_1_3_2_1_35_1","volume-title":"Efficient estimation of word representations in vector space. arXiv preprint arXiv:1301.3781","author":"Mikolov Tomas","year":"2013"},{"key":"e_1_3_2_1_36_1","doi-asserted-by":"publisher","DOI":"10.1109\/ICDM.2016.0151"},{"key":"e_1_3_2_1_37_1","volume-title":"Guyon Isabelle, Hu Yi-Qi, Li Yu-Feng, Tu Wei-Wei, Yang Qiang, and Yu Yang.","author":"Quanming Yao","year":"2018"},{"key":"e_1_3_2_1_38_1","doi-asserted-by":"publisher","DOI":"10.1109\/ICDM.2010.127"},{"key":"e_1_3_2_1_39_1","volume-title":"Relating cascaded random forests to deep convolutional neural networks for semantic segmentation. arXiv preprint arXiv:1507.07583","author":"Richmond David L","year":"2015"},{"key":"e_1_3_2_1_40_1","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR.2014.18"},{"key":"e_1_3_2_1_41_1","unstructured":"Scikit-learn. 2018. categorical_encoding. https:\/\/github.com\/scikit-learn-contrib\/categorical-encoding .  Scikit-learn. 2018. categorical_encoding. https:\/\/github.com\/scikit-learn-contrib\/categorical-encoding ."},{"key":"e_1_3_2_1_42_1","doi-asserted-by":"publisher","DOI":"10.1109\/5.58346"},{"key":"e_1_3_2_1_43_1","unstructured":"Ira Shavitt and Eran Segal. 2018. Regularization Learning Networks: Deep Learning for Tabular Datasets. In Advances in Neural Information Processing Systems. 1386--1396.   Ira Shavitt and Eran Segal. 2018. Regularization Learning Networks: Deep Learning for Tabular Datasets. In Advances in Neural Information Processing Systems. 1386--1396."},{"key":"e_1_3_2_1_44_1","doi-asserted-by":"publisher","DOI":"10.1109\/ICCV.2015.350"},{"key":"e_1_3_2_1_45_1","volume-title":"Feature selection using decision tree and classification through proximal support vector machine for fault diagnostics of roller bearing. Mechanical systems and signal processing","author":"Sugumaran V","year":"2007"},{"key":"e_1_3_2_1_46_1","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR.2015.7298594"},{"key":"e_1_3_2_1_47_1","doi-asserted-by":"publisher","DOI":"10.1145\/2783258.2783273"},{"key":"e_1_3_2_1_48_1","doi-asserted-by":"publisher","DOI":"10.1137\/1.9781611974973.1"},{"key":"e_1_3_2_1_49_1","doi-asserted-by":"publisher","DOI":"10.1145\/3219819.3219900"},{"key":"e_1_3_2_1_50_1","volume-title":"Irene Garcia Morillo, and Timothy M Hospedales","author":"Yang Yongxin","year":"2018"},{"key":"e_1_3_2_1_51_1","doi-asserted-by":"publisher","DOI":"10.1007\/978-3-319-30671-1_4"},{"key":"e_1_3_2_1_52_1","volume-title":"Deep forest: Towards an alternative to deep neural networks. arXiv preprint arXiv:1702.08835","author":"Zhou Zhi-Hua","year":"2017"},{"key":"e_1_3_2_1_53_1","doi-asserted-by":"publisher","DOI":"10.1145\/3097983.3098059"}],"event":{"name":"KDD '19: The 25th ACM SIGKDD Conference on Knowledge Discovery and Data Mining","location":"Anchorage AK USA","acronym":"KDD '19","sponsor":["SIGMOD ACM Special Interest Group on Management of Data","SIGKDD ACM Special Interest Group on Knowledge Discovery in Data"]},"container-title":["Proceedings of the 25th ACM SIGKDD International Conference on Knowledge Discovery &amp; Data Mining"],"original-title":[],"link":[{"URL":"https:\/\/dl.acm.org\/doi\/10.1145\/3292500.3330858","content-type":"unspecified","content-version":"vor","intended-application":"text-mining"},{"URL":"https:\/\/dl.acm.org\/doi\/pdf\/10.1145\/3292500.3330858","content-type":"unspecified","content-version":"vor","intended-application":"similarity-checking"}],"deposited":{"date-parts":[[2025,6,18]],"date-time":"2025-06-18T00:26:02Z","timestamp":1750206362000},"score":1,"resource":{"primary":{"URL":"https:\/\/dl.acm.org\/doi\/10.1145\/3292500.3330858"}},"subtitle":["A Deep Learning Framework Distilled by GBDT for Online Prediction Tasks"],"short-title":[],"issued":{"date-parts":[[2019,7,25]]},"references-count":53,"alternative-id":["10.1145\/3292500.3330858","10.1145\/3292500"],"URL":"https:\/\/doi.org\/10.1145\/3292500.3330858","relation":{},"subject":[],"published":{"date-parts":[[2019,7,25]]},"assertion":[{"value":"2019-07-25","order":2,"name":"published","label":"Published","group":{"name":"publication_history","label":"Publication History"}}]}}