{"status":"ok","message-type":"work","message-version":"1.0.0","message":{"indexed":{"date-parts":[[2025,9,9]],"date-time":"2025-09-09T20:47:07Z","timestamp":1757450827265,"version":"3.28.0"},"reference-count":48,"publisher":"IEEE","license":[{"start":{"date-parts":[[2019,12,1]],"date-time":"2019-12-01T00:00:00Z","timestamp":1575158400000},"content-version":"stm-asf","delay-in-days":0,"URL":"https:\/\/doi.org\/10.15223\/policy-029"},{"start":{"date-parts":[[2019,12,1]],"date-time":"2019-12-01T00:00:00Z","timestamp":1575158400000},"content-version":"stm-asf","delay-in-days":0,"URL":"https:\/\/doi.org\/10.15223\/policy-037"}],"content-domain":{"domain":[],"crossmark-restriction":false},"short-container-title":[],"published-print":{"date-parts":[[2019,12]]},"DOI":"10.1109\/bigdata47090.2019.9006440","type":"proceedings-article","created":{"date-parts":[[2020,2,25]],"date-time":"2020-02-25T06:05:34Z","timestamp":1582610734000},"page":"583-592","source":"Crossref","is-referenced-by-count":3,"title":["CS*: Approximate Query Processing on Big Data using Scalable Join Correlated Sample Synopsis"],"prefix":"10.1109","author":[{"given":"Feng","family":"Yu","sequence":"first","affiliation":[{"name":"Youngstown State University,Department of Computer Science and Information Systems,Youngstown,OH,USA"}]},{"given":"Wen-Chi","family":"Hou","sequence":"additional","affiliation":[{"name":"Southern Illinois University,Department of Computer Science,Carbondale,IL,USA"}]}],"member":"263","reference":[{"journal-title":"Sampling Techniques","year":"1977","author":"cochran","key":"ref39"},{"key":"ref38","doi-asserted-by":"publisher","DOI":"10.1145\/304181.304208"},{"key":"ref33","doi-asserted-by":"publisher","DOI":"10.14778\/1687553.1687609"},{"key":"ref32","doi-asserted-by":"publisher","DOI":"10.1109\/ICDE.2006.61"},{"key":"ref31","doi-asserted-by":"publisher","DOI":"10.1145\/233269.233340"},{"key":"ref30","doi-asserted-by":"crossref","first-page":"341","DOI":"10.1145\/141484.130335","article-title":"Sequential Sampling Procedures Query Size","author":"haas","year":"1992","journal-title":"Proc SIGMOD"},{"key":"ref37","doi-asserted-by":"publisher","DOI":"10.1145\/253262.253291"},{"key":"ref36","first-page":"10","article-title":"Spark: Cluster Computing with Working Sets","author":"zaharia","year":"2010","journal-title":"Proc of HotCloud&#x2019;10"},{"key":"ref35","doi-asserted-by":"publisher","DOI":"10.1145\/2723372.2742790"},{"journal-title":"Apache Hadoop","year":"2019","key":"ref34"},{"key":"ref10","first-page":"466","article-title":"Fast Incremental Maintenance of Approximate Histograms","author":"gibbons","year":"1997","journal-title":"Proc of VLDB&#x2019;97"},{"key":"ref40","doi-asserted-by":"publisher","DOI":"10.1145\/1412331.1412335"},{"key":"ref11","first-page":"276","author":"hou","year":"1988","journal-title":"Statistical Estimators for Relational Algebra Expressions"},{"journal-title":"Random Sampling from Databases","year":"1993","author":"olken","key":"ref12"},{"key":"ref13","first-page":"311","article-title":"Sampling-Based Estimation of the Number of Distinct Estimation of Values of an Attribute","author":"haas","year":"1995","journal-title":"Proc of VLDB&#x2019;97"},{"key":"ref14","doi-asserted-by":"publisher","DOI":"10.1145\/2588555.2610513"},{"key":"ref15","doi-asserted-by":"publisher","DOI":"10.1145\/2882903.2882914"},{"key":"ref16","first-page":"13","article-title":"Sketching Streams Through the Net: Distributed Approximate Query Tracking","author":"cormode","year":"2005","journal-title":"Proc of VLDB&#x2019;04"},{"key":"ref17","doi-asserted-by":"publisher","DOI":"10.1145\/1386118.1386121"},{"key":"ref18","doi-asserted-by":"publisher","DOI":"10.1145\/191839.191874"},{"key":"ref19","doi-asserted-by":"publisher","DOI":"10.1145\/304181.304206"},{"key":"ref28","first-page":"5","article-title":"Approximate query answering using histograms","volume":"22","author":"poosala","year":"1999","journal-title":"IEEE Data Eng Bull"},{"key":"ref4","first-page":"240","article-title":"Selectivity Estimation and Query Optimization in Large Databases with Highly Skewed Distributions of Column Values","author":"lynch","year":"1988","journal-title":"Proc VLDB&#x2019;83"},{"journal-title":"Database Systems The Complete Book","year":"2008","author":"garcia-molina","key":"ref27"},{"key":"ref3","doi-asserted-by":"publisher","DOI":"10.1007\/s41019-018-0074-4"},{"key":"ref6","doi-asserted-by":"publisher","DOI":"10.1145\/582095.582099"},{"key":"ref29","first-page":"541","article-title":"Distinct Sampling for HighlyAccurate Answers to Distinct Values Queries and Event Reports","author":"gibbons","year":"2001","journal-title":"Proc VLDB&#x2019;1994"},{"key":"ref5","first-page":"1","article-title":"An Introduction to MCMC for Machine Learning","volume":"50","author":"andrieu","year":"2002","journal-title":"Machine Learning"},{"key":"ref8","doi-asserted-by":"crossref","first-page":"28","DOI":"10.1145\/971701.50205","article-title":"Equi-Depth Histograms For Estimating Selectivity Factors For Multi-Dimensional Queries","author":"muralikrishna","year":"1988","journal-title":"Proc SIGMOD"},{"key":"ref7","doi-asserted-by":"publisher","DOI":"10.1145\/234313.234367"},{"key":"ref2","doi-asserted-by":"publisher","DOI":"10.1145\/3035918.3056097"},{"key":"ref9","doi-asserted-by":"publisher","DOI":"10.1145\/304181.304200"},{"key":"ref1","doi-asserted-by":"publisher","DOI":"10.1561\/1900000004"},{"key":"ref46","doi-asserted-by":"publisher","DOI":"10.1145\/2588555.2594532"},{"key":"ref20","doi-asserted-by":"publisher","DOI":"10.1145\/3035918.3035921"},{"key":"ref45","doi-asserted-by":"publisher","DOI":"10.14778\/2336664.2336675"},{"key":"ref48","doi-asserted-by":"publisher","DOI":"10.1145\/3267809.3267834"},{"key":"ref22","doi-asserted-by":"publisher","DOI":"10.1145\/2882903.2915235"},{"key":"ref47","doi-asserted-by":"publisher","DOI":"10.1145\/3284551"},{"key":"ref21","doi-asserted-by":"publisher","DOI":"10.14778\/2824032.2824051"},{"key":"ref42","doi-asserted-by":"publisher","DOI":"10.1145\/3183713.3196905"},{"key":"ref24","doi-asserted-by":"publisher","DOI":"10.1145\/2463676.2463701"},{"key":"ref41","doi-asserted-by":"publisher","DOI":"10.1145\/2465351.2465355"},{"key":"ref23","doi-asserted-by":"publisher","DOI":"10.1145\/304182.304207"},{"key":"ref44","article-title":"Cardinality Estimation Done Right: Index-Based Join Sampling","author":"leis","year":"2017","journal-title":"CIDR"},{"key":"ref26","doi-asserted-by":"publisher","DOI":"10.1007\/978-3-642-23091-2_35"},{"key":"ref43","doi-asserted-by":"publisher","DOI":"10.1145\/3183713.3183739"},{"key":"ref25","doi-asserted-by":"publisher","DOI":"10.1145\/3147.3165"}],"event":{"name":"2019 IEEE International Conference on Big Data (Big Data)","start":{"date-parts":[[2019,12,9]]},"location":"Los Angeles, CA, USA","end":{"date-parts":[[2019,12,12]]}},"container-title":["2019 IEEE International Conference on Big Data (Big Data)"],"original-title":[],"link":[{"URL":"http:\/\/xplorestaging.ieee.org\/ielx7\/8986695\/9005444\/09006440.pdf?arnumber=9006440","content-type":"unspecified","content-version":"vor","intended-application":"similarity-checking"}],"deposited":{"date-parts":[[2023,1,23]],"date-time":"2023-01-23T20:11:47Z","timestamp":1674504707000},"score":1,"resource":{"primary":{"URL":"https:\/\/ieeexplore.ieee.org\/document\/9006440\/"}},"subtitle":[],"short-title":[],"issued":{"date-parts":[[2019,12]]},"references-count":48,"URL":"https:\/\/doi.org\/10.1109\/bigdata47090.2019.9006440","relation":{},"subject":[],"published":{"date-parts":[[2019,12]]}}}