{"status":"ok","message-type":"work","message-version":"1.0.0","message":{"indexed":{"date-parts":[[2025,12,12]],"date-time":"2025-12-12T13:45:39Z","timestamp":1765547139005,"version":"3.44.0"},"publisher-location":"New York, NY, USA","reference-count":41,"publisher":"ACM","license":[{"start":{"date-parts":[[2023,7,10]],"date-time":"2023-07-10T00:00:00Z","timestamp":1688947200000},"content-version":"vor","delay-in-days":0,"URL":"https:\/\/creativecommons.org\/licenses\/by\/4.0\/"}],"content-domain":{"domain":["dl.acm.org"],"crossmark-restriction":true},"short-container-title":[],"published-print":{"date-parts":[[2023,7,10]]},"DOI":"10.1145\/3603719.3603744","type":"proceedings-article","created":{"date-parts":[[2023,8,27]],"date-time":"2023-08-27T06:09:45Z","timestamp":1693116585000},"page":"1-16","update-policy":"https:\/\/doi.org\/10.1145\/crossmark-policy","source":"Crossref","is-referenced-by-count":3,"title":["Data Driven Dimensionality Reduction to Improve Modeling Performance\u2731"],"prefix":"10.1145","author":[{"ORCID":"https:\/\/orcid.org\/0009-0005-3293-3758","authenticated-orcid":false,"given":"Joshua","family":"Chung","sequence":"first","affiliation":[{"name":"Lawrence Berkeley National Laboratory, USA"}]},{"ORCID":"https:\/\/orcid.org\/0000-0002-4107-3797","authenticated-orcid":false,"given":"Marcos Lopez","family":"De Prado","sequence":"additional","affiliation":[{"name":"Lawrence Berkeley National Laboratory, USA"}]},{"ORCID":"https:\/\/orcid.org\/0000-0003-0832-3720","authenticated-orcid":false,"given":"Horst","family":"Simon","sequence":"additional","affiliation":[{"name":"ADIA Lab, United Arab Emirates"}]},{"ORCID":"https:\/\/orcid.org\/0000-0002-6907-3393","authenticated-orcid":false,"given":"Kesheng","family":"Wu","sequence":"additional","affiliation":[{"name":"Berkeley Lab, USA"}]}],"member":"320","published-online":{"date-parts":[[2023,8,27]]},"reference":[{"key":"e_1_3_2_1_1_1","doi-asserted-by":"publisher","DOI":"10.1145\/3292500.3330701"},{"key":"e_1_3_2_1_2_1","doi-asserted-by":"publisher","DOI":"10.1016\/j.rser.2017.04.095"},{"key":"e_1_3_2_1_3_1","doi-asserted-by":"publisher","DOI":"10.1016\/j.cosrev.2021.100378"},{"key":"e_1_3_2_1_4_1","doi-asserted-by":"publisher","DOI":"10.1145\/2628071.2628092"},{"key":"e_1_3_2_1_5_1","doi-asserted-by":"publisher","DOI":"10.1090\/noti1105"},{"key":"e_1_3_2_1_6_1","doi-asserted-by":"publisher","DOI":"10.1002\/widm.1484"},{"volume-title":"Advances in financial machine learning","author":"de Prado Marcos\u00a0Lopez","key":"e_1_3_2_1_7_1","unstructured":"Marcos\u00a0Lopez de Prado. 2018. Advances in financial machine learning. John Wiley & Sons."},{"key":"e_1_3_2_1_8_1","doi-asserted-by":"publisher","unstructured":"Marcos\u00a0Lopez de Prado. 2020. Clustered feature importance (presentation slides). https:\/\/doi.org\/10.2139\/ssrn.3517595","DOI":"10.2139\/ssrn.3517595"},{"key":"e_1_3_2_1_9_1","doi-asserted-by":"publisher","DOI":"10.1016\/j.jspi.2011.09.016"},{"key":"e_1_3_2_1_10_1","volume-title":"Random walks in stock market prices. Financial analysts journal 51, 1","author":"Fama F","year":"1995","unstructured":"Eugene\u00a0F Fama. 1995. Random walks in stock market prices. Financial analysts journal 51, 1 (1995), 75\u201380."},{"key":"e_1_3_2_1_11_1","doi-asserted-by":"publisher","DOI":"10.1109\/ICSESS.2016.7883053"},{"key":"e_1_3_2_1_12_1","doi-asserted-by":"publisher","DOI":"10.1142\/S0218001419500174"},{"key":"e_1_3_2_1_13_1","doi-asserted-by":"publisher","DOI":"10.1007\/s40747-021-00637-x"},{"key":"e_1_3_2_1_14_1","doi-asserted-by":"publisher","DOI":"10.1007\/978-3-030-01659-3_8"},{"key":"e_1_3_2_1_15_1","doi-asserted-by":"publisher","DOI":"10.1504\/IJBDI.2018.10008133"},{"key":"e_1_3_2_1_16_1","doi-asserted-by":"publisher","DOI":"10.5555\/3122009.3242042"},{"key":"e_1_3_2_1_17_1","doi-asserted-by":"publisher","DOI":"10.1007\/978-3-642-01970-8_89"},{"key":"e_1_3_2_1_18_1","first-page":"I","article-title":"A Unified Approach to Interpreting Model Predictions","volume":"30","author":"Lundberg M","year":"2017","unstructured":"Scott\u00a0M Lundberg and Su-In Lee. 2017. A Unified Approach to Interpreting Model Predictions. In Advances in Neural Information Processing Systems 30, I.\u00a0Guyon, U.\u00a0V. Luxburg, S.\u00a0Bengio, H.\u00a0Wallach, R.\u00a0Fergus, S.\u00a0Vishwanathan, and R.\u00a0Garnett (Eds.). Curran Associates, Inc., 4765\u20134774. http:\/\/papers.nips.cc\/paper\/7062-a-unified-approach-to-interpreting-model-predictions.pdf","journal-title":"Advances in Neural Information Processing Systems"},{"key":"e_1_3_2_1_19_1","doi-asserted-by":"publisher","DOI":"10.1038\/s41597-022-01257-x"},{"key":"e_1_3_2_1_20_1","first-page":"66","article-title":"Dimensionality Reduction: a Comparative Review","volume":"10","author":"Van\u00a0Der Maaten Laurens","year":"2009","unstructured":"Laurens Van\u00a0Der Maaten, Eric Postma, Jaap\u00a0Van den Herik, 2009. Dimensionality Reduction: a Comparative Review. J Mach Learn Res 10, 66\u201371 (2009), 13.","journal-title":"J Mach Learn Res"},{"key":"e_1_3_2_1_21_1","doi-asserted-by":"publisher","DOI":"10.1016\/0098-3004(93)90090-R"},{"key":"e_1_3_2_1_22_1","doi-asserted-by":"publisher","DOI":"10.1080\/00031305.1982.10482818"},{"key":"e_1_3_2_1_23_1","volume-title":"UMAP: Uniform Manifold Approximation and Projection for Dimension Reduction. arXiv","author":"McInnes Leland","year":"2020","unstructured":"Leland McInnes and James Melville\u00a0John Healy. 2020. UMAP: Uniform Manifold Approximation and Projection for Dimension Reduction. arXiv (2020)."},{"key":"e_1_3_2_1_24_1","volume-title":"Evidence Contrary to the Statistical View of Boosting.Journal of Machine Learning Research 9, 2","author":"Mease David","year":"2008","unstructured":"David Mease and Abraham Wyner. 2008. Evidence Contrary to the Statistical View of Boosting.Journal of Machine Learning Research 9, 2 (2008)."},{"key":"e_1_3_2_1_25_1","volume-title":"How To Break Anonymity of the Netflix Prize Dataset. CoRR abs\/cs\/0610105","author":"Narayanan Arvind","year":"2006","unstructured":"Arvind Narayanan and Vitaly Shmatikov. 2006. How To Break Anonymity of the Netflix Prize Dataset. CoRR abs\/cs\/0610105 (2006). arxiv:cs\/0610105http:\/\/arxiv.org\/abs\/cs\/0610105"},{"key":"e_1_3_2_1_26_1","doi-asserted-by":"publisher","DOI":"10.1371\/journal.pcbi.1006907"},{"key":"e_1_3_2_1_27_1","unstructured":"Numerai. [n. d.]. Numerai Tournament Overview. https:\/\/docs.numer.ai\/tournament\/learn Accessed: 2021-09-21."},{"key":"e_1_3_2_1_28_1","doi-asserted-by":"publisher","DOI":"10.1109\/TKDE.2019.2959988"},{"key":"e_1_3_2_1_29_1","doi-asserted-by":"publisher","DOI":"10.1145\/3035918.3054782"},{"key":"e_1_3_2_1_30_1","doi-asserted-by":"publisher","DOI":"10.1038\/s41591-018-0272-7"},{"key":"e_1_3_2_1_31_1","doi-asserted-by":"publisher","DOI":"10.1007\/s10462-020-09928-0"},{"key":"e_1_3_2_1_32_1","doi-asserted-by":"publisher","DOI":"10.1109\/ACCESS.2020.2980942"},{"key":"e_1_3_2_1_33_1","doi-asserted-by":"publisher","DOI":"10.1126\/science.290.5500.2323"},{"volume-title":"Artificial Neural Networks \u2014 ICANN\u201997, Wulfram Gerstner, Alain Germond, Martin Hasler, and Jean-Daniel Nicoud (Eds.)","author":"Sch\u00f6lkopf Bernhard","key":"e_1_3_2_1_34_1","unstructured":"Bernhard Sch\u00f6lkopf, Alexander Smola, and Klaus-Robert M\u00fcller. 1997. Kernel principal component analysis. In Artificial Neural Networks \u2014 ICANN\u201997, Wulfram Gerstner, Alain Germond, Martin Hasler, and Jean-Daniel Nicoud (Eds.). Springer Berlin Heidelberg, Berlin, Heidelberg, 583\u2013588."},{"key":"e_1_3_2_1_35_1","doi-asserted-by":"publisher","DOI":"10.1126\/science.290.5500.2319"},{"key":"e_1_3_2_1_36_1","doi-asserted-by":"publisher","DOI":"10.1080\/01973533.2016.1277529"},{"key":"e_1_3_2_1_37_1","doi-asserted-by":"publisher","DOI":"10.1016\/S0169-2070(03)00012-8"},{"key":"e_1_3_2_1_38_1","doi-asserted-by":"publisher","DOI":"10.11578\/dc.20210521.74"},{"key":"e_1_3_2_1_39_1","doi-asserted-by":"publisher","DOI":"10.1016\/j.neucom.2020.07.061"},{"key":"e_1_3_2_1_40_1","doi-asserted-by":"publisher","DOI":"10.1016\/j.neucom.2010.05.007"},{"key":"e_1_3_2_1_41_1","doi-asserted-by":"publisher","DOI":"10.38094\/jastt1224"}],"event":{"name":"SSDBM 2023: 35th International Conference on Scientific and Statistical Database Management","acronym":"SSDBM 2023","location":"Los Angeles CA USA"},"container-title":["35th International Conference on Scientific and Statistical Database Management"],"original-title":[],"link":[{"URL":"https:\/\/dl.acm.org\/doi\/10.1145\/3603719.3603744","content-type":"unspecified","content-version":"vor","intended-application":"text-mining"},{"URL":"https:\/\/dl.acm.org\/doi\/pdf\/10.1145\/3603719.3603744","content-type":"unspecified","content-version":"vor","intended-application":"similarity-checking"}],"deposited":{"date-parts":[[2025,8,22]],"date-time":"2025-08-22T19:07:30Z","timestamp":1755889650000},"score":1,"resource":{"primary":{"URL":"https:\/\/dl.acm.org\/doi\/10.1145\/3603719.3603744"}},"subtitle":[],"short-title":[],"issued":{"date-parts":[[2023,7,10]]},"references-count":41,"alternative-id":["10.1145\/3603719.3603744","10.1145\/3603719"],"URL":"https:\/\/doi.org\/10.1145\/3603719.3603744","relation":{},"subject":[],"published":{"date-parts":[[2023,7,10]]},"assertion":[{"value":"2023-08-27","order":3,"name":"published","label":"Published","group":{"name":"publication_history","label":"Publication History"}}]}}