{"status":"ok","message-type":"work","message-version":"1.0.0","message":{"indexed":{"date-parts":[[2025,7,30]],"date-time":"2025-07-30T15:32:32Z","timestamp":1753889552884},"reference-count":30,"publisher":"IEEE","content-domain":{"domain":[],"crossmark-restriction":false},"short-container-title":[],"published-print":{"date-parts":[[2017,12]]},"DOI":"10.1109\/bigdata.2017.8257934","type":"proceedings-article","created":{"date-parts":[[2018,1,15]],"date-time":"2018-01-15T22:47:28Z","timestamp":1516056448000},"page":"263-272","source":"Crossref","is-referenced-by-count":8,"title":["Sanzu: A data science benchmark"],"prefix":"10.1109","author":[{"given":"Alex","family":"Watson","sequence":"first","affiliation":[]},{"given":"Deepigha Shree Vittal","family":"Babu","sequence":"additional","affiliation":[]},{"given":"Suprio","family":"Ray","sequence":"additional","affiliation":[]}],"member":"263","reference":[{"journal-title":"The Transaction Processing Performance Council","year":"0","key":"ref30"},{"journal-title":"Apache Hadoop","year":"0","key":"ref10"},{"key":"ref11","doi-asserted-by":"publisher","DOI":"10.14778\/2367502.2367510"},{"journal-title":"The Fourth Paradigm Data-Intensive Scientific Discovery","year":"2009","author":"hey","key":"ref12"},{"journal-title":"Hockey stats","year":"0","key":"ref13"},{"key":"ref14","doi-asserted-by":"publisher","DOI":"10.1145\/2611567"},{"key":"ref15","doi-asserted-by":"publisher","DOI":"10.1145\/3004295"},{"journal-title":"Matplotlib","year":"0","key":"ref16"},{"key":"ref17","doi-asserted-by":"publisher","DOI":"10.14778\/3137628.3137634"},{"journal-title":"NB Power","year":"0","key":"ref18"},{"journal-title":"Numpy scientific computing with Python","year":"0","key":"ref19"},{"journal-title":"Apache SPARK","year":"0","key":"ref28"},{"key":"ref4","doi-asserted-by":"publisher","DOI":"10.1145\/5666.5673"},{"journal-title":"Scikit-learn Machine Learning in Python","year":"0","key":"ref27"},{"key":"ref3","doi-asserted-by":"publisher","DOI":"10.1109\/BigData.2016.7840934"},{"key":"ref6","doi-asserted-by":"publisher","DOI":"10.1145\/2463676.2463712"},{"key":"ref29","doi-asserted-by":"publisher","DOI":"10.1145\/2588555.2595633"},{"key":"ref5","doi-asserted-by":"publisher","DOI":"10.1109\/ICDE.2017.167"},{"journal-title":"Graysort benchmark","year":"0","key":"ref8"},{"journal-title":"Historical Climate Data","year":"0","key":"ref7"},{"journal-title":"Dask","year":"0","key":"ref2"},{"key":"ref9","article-title":"Data Science from Scratch","author":"grus","year":"2015","journal-title":"O'Reilly Media Inc"},{"key":"ref1","first-page":"143","article-title":"Benchmarking Cloud Serving Systems with YCS B","author":"cooper","year":"2010","journal-title":"SOCC"},{"journal-title":"NYTimes article","year":"0","key":"ref20"},{"journal-title":"PostgreSQL","year":"0","key":"ref22"},{"journal-title":"Pandas Python Data Analysis Library","year":"0","key":"ref21"},{"journal-title":"The R Project for Statistical Computing","year":"0","key":"ref24"},{"journal-title":"Anaconda","year":"0","key":"ref23"},{"journal-title":"Doing Data Science Straight Talk from the Frontline","year":"2013","author":"schutt","key":"ref26"},{"key":"ref25","doi-asserted-by":"publisher","DOI":"10.1109\/ICDE.2011.5767929"}],"event":{"name":"2017 IEEE International Conference on Big Data (Big Data)","start":{"date-parts":[[2017,12,11]]},"location":"Boston, MA","end":{"date-parts":[[2017,12,14]]}},"container-title":["2017 IEEE International Conference on Big Data (Big Data)"],"original-title":[],"link":[{"URL":"http:\/\/xplorestaging.ieee.org\/ielx7\/8241556\/8257893\/08257934.pdf?arnumber=8257934","content-type":"unspecified","content-version":"vor","intended-application":"similarity-checking"}],"deposited":{"date-parts":[[2018,2,28]],"date-time":"2018-02-28T21:53:31Z","timestamp":1519854811000},"score":1,"resource":{"primary":{"URL":"http:\/\/ieeexplore.ieee.org\/document\/8257934\/"}},"subtitle":[],"short-title":[],"issued":{"date-parts":[[2017,12]]},"references-count":30,"URL":"https:\/\/doi.org\/10.1109\/bigdata.2017.8257934","relation":{},"subject":[],"published":{"date-parts":[[2017,12]]}}}