{"status":"ok","message-type":"work","message-version":"1.0.0","message":{"indexed":{"date-parts":[[2025,2,21]],"date-time":"2025-02-21T22:25:22Z","timestamp":1740176722652,"version":"3.37.3"},"reference-count":22,"publisher":"Springer Science and Business Media LLC","issue":"3","license":[{"start":{"date-parts":[[2019,6,25]],"date-time":"2019-06-25T00:00:00Z","timestamp":1561420800000},"content-version":"tdm","delay-in-days":0,"URL":"http:\/\/www.springer.com\/tdm"},{"start":{"date-parts":[[2019,6,25]],"date-time":"2019-06-25T00:00:00Z","timestamp":1561420800000},"content-version":"vor","delay-in-days":0,"URL":"http:\/\/www.springer.com\/tdm"}],"funder":[{"name":"National Key R&D Program of China","award":["2018YFB1003404"],"award-info":[{"award-number":["2018YFB1003404"]}]},{"DOI":"10.13039\/501100001809","name":"National Natural Science Foundation of China","doi-asserted-by":"publisher","award":["61672141"],"award-info":[{"award-number":["61672141"]}],"id":[{"id":"10.13039\/501100001809","id-type":"DOI","asserted-by":"publisher"}]},{"DOI":"10.13039\/501100012226","name":"Fundamental Research Funds for the Central Universities","doi-asserted-by":"publisher","award":["N181605017"],"award-info":[{"award-number":["N181605017"]}],"id":[{"id":"10.13039\/501100012226","id-type":"DOI","asserted-by":"publisher"}]}],"content-domain":{"domain":["link.springer.com"],"crossmark-restriction":false},"short-container-title":["Int J Data Sci Anal"],"published-print":{"date-parts":[[2020,4]]},"DOI":"10.1007\/s41060-019-00192-2","type":"journal-article","created":{"date-parts":[[2019,6,25]],"date-time":"2019-06-25T13:12:50Z","timestamp":1561468370000},"page":"273-284","update-policy":"https:\/\/doi.org\/10.1007\/springer_crossmark_policy","source":"Crossref","is-referenced-by-count":0,"title":["PowerHash: a hybrid grouping scheme by leveraging power-law properties of data"],"prefix":"10.1007","volume":"9","author":[{"given":"Xun","family":"Wei","sequence":"first","affiliation":[]},{"given":"Xiaowang","family":"Kong","sequence":"additional","affiliation":[]},{"given":"Yanfeng","family":"Zhang","sequence":"additional","affiliation":[]},{"given":"Ge","family":"Yu","sequence":"additional","affiliation":[]}],"member":"297","published-online":{"date-parts":[[2019,6,25]]},"reference":[{"key":"192_CR1","doi-asserted-by":"crossref","unstructured":"Adamic, L.: The nature of markets in the world wide web. Quarterly J. Electron. Commer. 1(1) (2000)","DOI":"10.2139\/ssrn.166108"},{"key":"192_CR2","doi-asserted-by":"crossref","unstructured":"Agrawal, S., Chaudhuri, S., Kollar, L., Marathe, A., Narasayya, V., Syamala, M.: Database tuning advisor for microsoft SQL server 2005: demo. In: ACM SIGMOD International Conference on Management of Data (SIGMOD 2005), pp. 930\u2013932. ACM (2005)","DOI":"10.1145\/1066157.1066292"},{"issue":"10","key":"192_CR3","first-page":"2014","volume":"7","author":"D Bartholomew","year":"2012","unstructured":"Bartholomew, D.: Mariadb vs. MYSQL. Dostopano 7(10), 2014 (2012)","journal-title":"Dostopano"},{"key":"192_CR4","doi-asserted-by":"crossref","unstructured":"Boicea, A., Radulescu, F., Agapin, L.I.: Mongodb vs oracle-database comparison. In: EIDWT 2012, pp. 330\u2013335 (2012)","DOI":"10.1109\/EIDWT.2012.32"},{"key":"192_CR5","first-page":"323","volume":"1984","author":"K Bratbergsengen","year":"1984","unstructured":"Bratbergsengen, K.: Hashing methods and relational algebra operations. VLDB 1984, 323\u2013333 (1984)","journal-title":"VLDB"},{"issue":"1","key":"192_CR6","first-page":"64","volume":"29","author":"G Cormode","year":"2009","unstructured":"Cormode, G.: Count-min sketch. Encycl. Algorithms 29(1), 64\u201369 (2009)","journal-title":"Encycl. Algorithms"},{"key":"192_CR7","doi-asserted-by":"publisher","first-page":"29","DOI":"10.1007\/978-3-540-24698-5_7","volume-title":"LATIN 2004: Theoretical Informatics","author":"G Cormode","year":"2004","unstructured":"Cormode, G., Muthukrishnan, S.: An improved data stream summary: the count-min sketch and its applications. In: Farach-Colton, M. (ed.) LATIN 2004: Theoretical Informatics, pp. 29\u201338. Springer, Berlin (2004)"},{"issue":"1","key":"192_CR8","doi-asserted-by":"publisher","first-page":"107","DOI":"10.1145\/1327452.1327492","volume":"51","author":"J Dean","year":"2008","unstructured":"Dean, J., Ghemawat, S.: Mapreduce: simplified data processing on large clusters. Commun. ACM 51(1), 107\u2013113 (2008)","journal-title":"Commun. ACM"},{"key":"192_CR9","unstructured":"Freedman, C.: Hash aggregate (2006). \nhttps:\/\/blogs.msdn.microsoft.com\/craigfr\/2006\/09\/20\/hash-aggregate\/\n\n. Accessed 2018"},{"key":"192_CR10","volume-title":"Human Behavior and the Principle of Least Effort: An Introduction to Human Ecology","author":"K George","year":"1949","unstructured":"George, K., George, K.: Human Behavior and the Principle of Least Effort: An Introduction to Human Ecology. Addison-Wesley Press, Boston (1949)"},{"issue":"1","key":"192_CR11","doi-asserted-by":"publisher","first-page":"29","DOI":"10.1023\/A:1009726021843","volume":"1","author":"J Gray","year":"1997","unstructured":"Gray, J., Chaudhuri, S., Bosworth, A., Layman, A., Reichart, D., Venkatrao, M., Pellow, F., Pirahesh, H.: Data cube: a relational aggregation operator generalizing group-by, cross-tab, and sub-totals. Data Min. Knowl. Discov. 1(1), 29\u201353 (1997)","journal-title":"Data Min. Knowl. Discov."},{"key":"192_CR12","first-page":"1","volume":"1","author":"R Khattree","year":"2018","unstructured":"Khattree, R., Bahuguna, M.: An alternative data analytic approach to measure the univariate and multivariate skewness. Int. J. Data Sci. Anal. 1, 1\u201316 (2018)","journal-title":"Int. J. Data Sci. Anal."},{"key":"192_CR13","doi-asserted-by":"crossref","unstructured":"Li, B., Mazur, E., Diao, Y., Mcgregor, A., Shenoy, P.: A platform for scalable one-pass analytics using mapreduce. In: ACM SIGMOD International Conference on Management of Data (SIGMOD 2011), pp. 985\u2013996 (2011)","DOI":"10.1145\/1989323.1989426"},{"key":"192_CR14","first-page":"1318","volume":"2011","author":"L Lin","year":"2011","unstructured":"Lin, L., Lychagina, V., Liu, W., Kwon, Y., Mittal, S., Wong, M.: Tenzing a SQL implementation on the mapreduce framework. PVLDB 2011, 1318\u20131327 (2011)","journal-title":"PVLDB"},{"key":"192_CR15","volume-title":"PostgreSQL: Introduction and Concepts","author":"B Momjian","year":"2001","unstructured":"Momjian, B.: PostgreSQL: Introduction and Concepts, vol. 192. Addison-Wesley, New York (2001)"},{"key":"192_CR16","unstructured":"MySQL, A.: Mysql 5.1 reference manual, 2006 (2009). \nhttp:\/\/dev.mysql.com\/doc\n\n. Accessed 2018"},{"key":"192_CR17","doi-asserted-by":"crossref","unstructured":"Nasir, M.A.U., Morales, G.D.F., Garc\u00eda-Soriano, D., Kourtellis, N., Serafini, M.: The power of both choices: Practical load balancing for distributed stream processing engines. In: IEEE 31st International Conference on Data Engineering (ICDE 2015), pp. 137\u2013148. IEEE (2015)","DOI":"10.1109\/ICDE.2015.7113279"},{"issue":"5","key":"192_CR18","doi-asserted-by":"publisher","first-page":"323","DOI":"10.1080\/00107510500052444","volume":"46","author":"M Newman","year":"2005","unstructured":"Newman, M.: Power laws, pareto distributions and zipf\u2019s law. Contemp. Phys. 46(5), 323\u2013351 (2005)","journal-title":"Contemp. Phys."},{"key":"192_CR19","doi-asserted-by":"crossref","unstructured":"Shvachko, K., Kuang, H., Radia, S., Chansler, R.: The hadoop distributed file system. In: IEEE Symposium on Mass storage systems and technologies (MSST 2010), pp. 1\u201310. IEEE (2010)","DOI":"10.1109\/MSST.2010.5496972"},{"issue":"1","key":"192_CR20","first-page":"D675","volume":"33","author":"SM Stephens","year":"2005","unstructured":"Stephens, S.M., Chen, J.Y., Davidson, M.G., Thomas, S., Trute, B.M.: Oracle database 10g: a platform for blast search and regular expression pattern matching in life sciences. Nucleic Acids Res. 33(1), D675\u2013D679 (2005)","journal-title":"Nucleic Acids Res."},{"key":"192_CR21","doi-asserted-by":"publisher","unstructured":"Teffer, D., Srinivasan, R., Ghosh, J.: Adahash: hashing-based scalable, adaptive hierarchical clustering of streaming data on mapreduce frameworks. Int. J. Data Sci. Anal. 1\u201311, (2018). \nhttps:\/\/doi.org\/10.1007\/s41060-018-0145-7","DOI":"10.1007\/s41060-018-0145-7"},{"key":"192_CR22","doi-asserted-by":"crossref","unstructured":"Yu, Y., Gunda, P.K., Isard, M.: Distributed aggregation for data-parallel computing: interfaces and implementations. In: ACM SIGOPS 22nd Symposium on Operating Systems Principles (SOSP 2009), pp. 247\u2013260. ACM (2009)","DOI":"10.1145\/1629575.1629600"}],"container-title":["International Journal of Data Science and Analytics"],"original-title":[],"language":"en","link":[{"URL":"http:\/\/link.springer.com\/content\/pdf\/10.1007\/s41060-019-00192-2.pdf","content-type":"application\/pdf","content-version":"vor","intended-application":"text-mining"},{"URL":"http:\/\/link.springer.com\/article\/10.1007\/s41060-019-00192-2\/fulltext.html","content-type":"text\/html","content-version":"vor","intended-application":"text-mining"},{"URL":"http:\/\/link.springer.com\/content\/pdf\/10.1007\/s41060-019-00192-2.pdf","content-type":"application\/pdf","content-version":"vor","intended-application":"similarity-checking"}],"deposited":{"date-parts":[[2020,6,23]],"date-time":"2020-06-23T23:06:41Z","timestamp":1592953601000},"score":1,"resource":{"primary":{"URL":"http:\/\/link.springer.com\/10.1007\/s41060-019-00192-2"}},"subtitle":[],"short-title":[],"issued":{"date-parts":[[2019,6,25]]},"references-count":22,"journal-issue":{"issue":"3","published-print":{"date-parts":[[2020,4]]}},"alternative-id":["192"],"URL":"https:\/\/doi.org\/10.1007\/s41060-019-00192-2","relation":{},"ISSN":["2364-415X","2364-4168"],"issn-type":[{"type":"print","value":"2364-415X"},{"type":"electronic","value":"2364-4168"}],"subject":[],"published":{"date-parts":[[2019,6,25]]},"assertion":[{"value":"20 January 2019","order":1,"name":"received","label":"Received","group":{"name":"ArticleHistory","label":"Article History"}},{"value":"12 June 2019","order":2,"name":"accepted","label":"Accepted","group":{"name":"ArticleHistory","label":"Article History"}},{"value":"25 June 2019","order":3,"name":"first_online","label":"First Online","group":{"name":"ArticleHistory","label":"Article History"}}]}}