{"status":"ok","message-type":"work","message-version":"1.0.0","message":{"indexed":{"date-parts":[[2026,2,8]],"date-time":"2026-02-08T10:16:00Z","timestamp":1770545760905,"version":"3.49.0"},"publisher-location":"New York, NY, USA","reference-count":46,"publisher":"ACM","license":[{"start":{"date-parts":[[2016,6,14]],"date-time":"2016-06-14T00:00:00Z","timestamp":1465862400000},"content-version":"vor","delay-in-days":0,"URL":"https:\/\/www.acm.org\/publications\/policies\/copyright_policy#Background"}],"funder":[{"name":"Microsoft Jim Gray Systems Lab"}],"content-domain":{"domain":["dl.acm.org"],"crossmark-restriction":true},"short-container-title":[],"published-print":{"date-parts":[[2016,6,14]]},"DOI":"10.1145\/2882903.2882952","type":"proceedings-article","created":{"date-parts":[[2016,6,16]],"date-time":"2016-06-16T19:01:52Z","timestamp":1466103712000},"page":"19-34","update-policy":"https:\/\/doi.org\/10.1145\/crossmark-policy","source":"Crossref","is-referenced-by-count":72,"title":["To Join or Not to Join?"],"prefix":"10.1145","author":[{"given":"Arun","family":"Kumar","sequence":"first","affiliation":[{"name":"University of Wisconsin-Madison, Madison, WI, USA"}]},{"given":"Jeffrey","family":"Naughton","sequence":"additional","affiliation":[{"name":"University of Wisconsin-Madison, Madison, WI, USA"}]},{"given":"Jignesh M.","family":"Patel","sequence":"additional","affiliation":[{"name":"University of Wisconsin-Madison, Madison, WI, USA"}]},{"given":"Xiaojin","family":"Zhu","sequence":"additional","affiliation":[{"name":"University of Wisconsin-Madison, Madison, WI, USA"}]}],"member":"320","published-online":{"date-parts":[[2016,6,14]]},"reference":[{"key":"e_1_3_2_1_1_1","unstructured":"Feature Selection and Dimension Reduction Techniques in SAS. nesug.org\/Proceedings\/nesug11\/sa\/sa08.pdf.  Feature Selection and Dimension Reduction Techniques in SAS. nesug.org\/Proceedings\/nesug11\/sa\/sa08.pdf."},{"key":"e_1_3_2_1_2_1","unstructured":"Gartner Report on Analytics. gartner.com\/it\/page.jsp?id=1971516.  Gartner Report on Analytics. gartner.com\/it\/page.jsp?id=1971516."},{"key":"e_1_3_2_1_3_1","unstructured":"Oracle R Enterprise.  Oracle R Enterprise."},{"key":"e_1_3_2_1_4_1","unstructured":"SAS Report on Analytics. sas.com\/reg\/wp\/corp\/23876.  SAS Report on Analytics. sas.com\/reg\/wp\/corp\/23876."},{"key":"e_1_3_2_1_5_1","doi-asserted-by":"publisher","DOI":"10.5555\/551350"},{"key":"e_1_3_2_1_6_1","doi-asserted-by":"publisher","DOI":"10.5555\/891073"},{"key":"e_1_3_2_1_7_1","volume-title":"CIDR","author":"Anderson M.","year":"2013","unstructured":"M. Anderson : A Data System for Feature Engineering . In CIDR , 2013 . M. Anderson et al. Brainwash: A Data System for Feature Engineering. In CIDR, 2013."},{"key":"e_1_3_2_1_8_1","doi-asserted-by":"publisher","DOI":"10.1145\/320064.320066"},{"key":"e_1_3_2_1_9_1","doi-asserted-by":"publisher","DOI":"10.1145\/2463676.2465283"},{"key":"e_1_3_2_1_10_1","volume-title":"NIPS","author":"Daniely A.","year":"2012","unstructured":"A. Daniely Multiclass Learning Approaches: A Theoretical Comparison with Implications . In NIPS , 2012 . A. Daniely et al. Multiclass Learning Approaches: A Theoretical Comparison with Implications. In NIPS, 2012."},{"key":"e_1_3_2_1_11_1","volume-title":"ICML","author":"Domingos P.","year":"2000","unstructured":"P. Domingos . A Unified Bias-Variance Decomposition and its Applications . In ICML , 2000 . P. Domingos. A Unified Bias-Variance Decomposition and its Applications. In ICML, 2000."},{"key":"e_1_3_2_1_12_1","doi-asserted-by":"publisher","DOI":"10.1145\/2347736.2347755"},{"key":"e_1_3_2_1_13_1","doi-asserted-by":"publisher","DOI":"10.1023\/A:1007413511361"},{"key":"e_1_3_2_1_14_1","doi-asserted-by":"publisher","DOI":"10.18637\/jss.v033.i01"},{"key":"e_1_3_2_1_15_1","doi-asserted-by":"publisher","DOI":"10.1023\/A:1007465528199"},{"key":"e_1_3_2_1_16_1","doi-asserted-by":"publisher","DOI":"10.1109\/ICDE.2011.5767930"},{"key":"e_1_3_2_1_17_1","volume-title":"Feature Extraction: Foundations and Applications","author":"Guyon I.","year":"2001","unstructured":"I. Guyon , S. Gunn , M. Nikravesh , and L. A. Zadeh . Feature Extraction: Foundations and Applications . New York : Springer-Verlag , 2001 . I. Guyon, S. Gunn, M. Nikravesh, and L. A. Zadeh. Feature Extraction: Foundations and Applications. New York: Springer-Verlag, 2001."},{"key":"e_1_3_2_1_18_1","doi-asserted-by":"publisher","DOI":"10.1007\/978-0-387-21606-5"},{"key":"e_1_3_2_1_19_1","doi-asserted-by":"publisher","DOI":"10.14778\/2367502.2367510"},{"key":"e_1_3_2_1_20_1","doi-asserted-by":"publisher","DOI":"10.1109\/TVCG.2012.219"},{"key":"e_1_3_2_1_21_1","doi-asserted-by":"publisher","DOI":"10.1016\/S0004-3702(97)00043-X"},{"key":"e_1_3_2_1_22_1","volume-title":"ICML","author":"Koller D.","year":"1995","unstructured":"D. Koller and M. Sahami . Toward Optimal Feature Selection . In ICML , 1995 . D. Koller and M. Sahami. Toward Optimal Feature Selection. In ICML, 1995."},{"key":"e_1_3_2_1_23_1","doi-asserted-by":"publisher","DOI":"10.14778\/2536274.2536302"},{"key":"e_1_3_2_1_24_1","doi-asserted-by":"publisher","DOI":"10.1109\/MC.2009.263"},{"key":"e_1_3_2_1_25_1","volume-title":"CIDR","author":"Kraska T.","year":"2013","unstructured":"T. Kraska : A Distributed Machine-learning System . In CIDR , 2013 . T. Kraska et al. MLbase: A Distributed Machine-learning System. In CIDR, 2013."},{"key":"e_1_3_2_1_26_1","doi-asserted-by":"publisher","DOI":"10.1145\/2428556.2428570"},{"key":"e_1_3_2_1_27_1","doi-asserted-by":"publisher","DOI":"10.1145\/2935694.2935698"},{"key":"e_1_3_2_1_29_1","doi-asserted-by":"publisher","DOI":"10.1145\/2723372.2723713"},{"key":"e_1_3_2_1_30_1","doi-asserted-by":"publisher","DOI":"10.5555\/1394399"},{"key":"e_1_3_2_1_31_1","doi-asserted-by":"publisher","DOI":"10.5555\/541177"},{"key":"e_1_3_2_1_32_1","doi-asserted-by":"publisher","DOI":"10.1145\/2213836.2213844"},{"key":"e_1_3_2_1_33_1","doi-asserted-by":"publisher","DOI":"10.5555\/52121"},{"key":"e_1_3_2_1_34_1","volume-title":"AAAI","author":"Pearl J.","year":"1987","unstructured":"J. Pearl and T. Verma . The Logic of Representing Dependencies by Directed Graphs . In AAAI , 1987 . J. Pearl and T. Verma. The Logic of Representing Dependencies by Directed Graphs. In AAAI, 1987."},{"key":"e_1_3_2_1_35_1","volume-title":"Database Management Systems","author":"Ramakrishnan R.","year":"2003","unstructured":"R. Ramakrishnan and J. Gehrke . Database Management Systems . McGraw-Hill, Inc. , New York, NY, USA , 2003 . R. Ramakrishnan and J. Gehrke. Database Management Systems. McGraw-Hill, Inc., New York, NY, USA, 2003."},{"key":"e_1_3_2_1_36_1","volume-title":"Data Engineering Bulletin","author":"R\u00e9 C.","year":"2014","unstructured":"C. R\u00e9 Feature Engineering for Knowledge Base Construction . Data Engineering Bulletin , 2014 . C. R\u00e9 et al. Feature Engineering for Knowledge Base Construction. Data Engineering Bulletin, 2014."},{"key":"e_1_3_2_1_37_1","volume-title":"Introducing CloudLab: Scientific Infrastructure for Advancing Cloud Architectures and Applications. ;login:, 39(6)","author":"Ricci R.","year":"2014","unstructured":"R. Ricci , E. Eide , and the CloudLab Team. Introducing CloudLab: Scientific Infrastructure for Advancing Cloud Architectures and Applications. ;login:, 39(6) , 2014 . R. Ricci, E. Eide, and the CloudLab Team. Introducing CloudLab: Scientific Infrastructure for Advancing Cloud Architectures and Applications. ;login:, 39(6), 2014."},{"key":"e_1_3_2_1_38_1","volume-title":"ICML","author":"Rish I.","year":"2001","unstructured":"I. Rish An Analysis of Data Characteristics that Affect Naive Bayes Performance . In ICML , 2001 . I. Rish et al. An Analysis of Data Characteristics that Affect Naive Bayes Performance. In ICML, 2001."},{"key":"e_1_3_2_1_39_1","doi-asserted-by":"publisher","DOI":"10.1145\/564376.564421"},{"key":"e_1_3_2_1_40_1","doi-asserted-by":"publisher","DOI":"10.1017\/CBO9781107298019"},{"key":"e_1_3_2_1_41_1","volume-title":"Database Systems Concepts","author":"Silberschatz A.","year":"2006","unstructured":"A. Silberschatz Database Systems Concepts . McGraw-Hill, Inc. , 2006 . A. Silberschatz et al. Database Systems Concepts. McGraw-Hill, Inc., 2006."},{"key":"e_1_3_2_1_42_1","volume-title":"A Novel Feature Selection Approach: Combining Feature Wrappers and Filters. Information Sciences, 177(2)","author":"Uncu O.","year":"2007","unstructured":"O. Uncu and I. Turksen . A Novel Feature Selection Approach: Combining Feature Wrappers and Filters. Information Sciences, 177(2) , 2007 . O. Uncu and I. Turksen. A Novel Feature Selection Approach: Combining Feature Wrappers and Filters. Information Sciences, 177(2), 2007."},{"key":"e_1_3_2_1_43_1","doi-asserted-by":"publisher","DOI":"10.5555\/211359"},{"key":"e_1_3_2_1_44_1","volume-title":"UAI","author":"S. K.","year":"1995","unstructured":"S. K. M. Wong et al. A Method for Implementing a Probabilistic Model as a Relational Database . In UAI , 1995 . S. K. M. Wong et al. A Method for Implementing a Probabilistic Model as a Relational Database. In UAI, 1995."},{"key":"e_1_3_2_1_45_1","volume-title":"JMLR","author":"Yu L.","year":"2004","unstructured":"L. Yu and H. Liu . Efficient Feature Selection via Analysis of Relevance and Redundancy . JMLR , 5, Dec. 2004 . L. Yu and H. Liu. Efficient Feature Selection via Analysis of Relevance and Redundancy. JMLR, 5, Dec. 2004."},{"key":"e_1_3_2_1_46_1","doi-asserted-by":"publisher","DOI":"10.1145\/2588555.2593678"},{"key":"e_1_3_2_1_47_1","doi-asserted-by":"publisher","DOI":"10.1109\/ICDE.2010.5447819"}],"event":{"name":"SIGMOD\/PODS'16: International Conference on Management of Data","location":"San Francisco California USA","acronym":"SIGMOD\/PODS'16","sponsor":["SIGMOD ACM Special Interest Group on Management of Data"]},"container-title":["Proceedings of the 2016 International Conference on Management of Data"],"original-title":[],"link":[{"URL":"https:\/\/dl.acm.org\/doi\/10.1145\/2882903.2882952","content-type":"unspecified","content-version":"vor","intended-application":"text-mining"},{"URL":"https:\/\/dl.acm.org\/doi\/pdf\/10.1145\/2882903.2882952","content-type":"unspecified","content-version":"vor","intended-application":"similarity-checking"}],"deposited":{"date-parts":[[2025,6,18]],"date-time":"2025-06-18T19:04:29Z","timestamp":1750273469000},"score":1,"resource":{"primary":{"URL":"https:\/\/dl.acm.org\/doi\/10.1145\/2882903.2882952"}},"subtitle":["Thinking Twice about Joins before Feature Selection"],"short-title":[],"issued":{"date-parts":[[2016,6,14]]},"references-count":46,"alternative-id":["10.1145\/2882903.2882952","10.1145\/2882903"],"URL":"https:\/\/doi.org\/10.1145\/2882903.2882952","relation":{},"subject":[],"published":{"date-parts":[[2016,6,14]]},"assertion":[{"value":"2016-06-14","order":2,"name":"published","label":"Published","group":{"name":"publication_history","label":"Publication History"}}]}}