{"status":"ok","message-type":"work","message-version":"1.0.0","message":{"indexed":{"date-parts":[[2026,3,24]],"date-time":"2026-03-24T02:51:34Z","timestamp":1774320694872,"version":"3.50.1"},"reference-count":36,"publisher":"Springer Science and Business Media LLC","issue":"1","license":[{"start":{"date-parts":[[2019,5,6]],"date-time":"2019-05-06T00:00:00Z","timestamp":1557100800000},"content-version":"tdm","delay-in-days":0,"URL":"https:\/\/creativecommons.org\/licenses\/by\/4.0"}],"funder":[{"DOI":"10.13039\/501100001871","name":"Funda\u00e7\u00e3o para a Ci\u00eancia e a Tecnologia","doi-asserted-by":"publisher","award":["UID\/CEC\/00319\/2013"],"award-info":[{"award-number":["UID\/CEC\/00319\/2013"]}],"id":[{"id":"10.13039\/501100001871","id-type":"DOI","asserted-by":"publisher"}]},{"DOI":"10.13039\/501100001871","name":"Funda\u00e7\u00e3o para a Ci\u00eancia e a Tecnologia","doi-asserted-by":"publisher","award":["Funding Reference: POCI-01- 0247-FEDER-002814"],"award-info":[{"award-number":["Funding Reference: POCI-01- 0247-FEDER-002814"]}],"id":[{"id":"10.13039\/501100001871","id-type":"DOI","asserted-by":"publisher"}]}],"content-domain":{"domain":["link.springer.com"],"crossmark-restriction":false},"short-container-title":["J Big Data"],"published-print":{"date-parts":[[2019,12]]},"DOI":"10.1186\/s40537-019-0196-1","type":"journal-article","created":{"date-parts":[[2019,5,7]],"date-time":"2019-05-07T16:58:47Z","timestamp":1557248327000},"update-policy":"https:\/\/doi.org\/10.1007\/springer_crossmark_policy","source":"Crossref","is-referenced-by-count":25,"title":["Evaluating partitioning and bucketing strategies for Hive-based Big Data Warehousing systems"],"prefix":"10.1186","volume":"6","author":[{"given":"Eduarda","family":"Costa","sequence":"first","affiliation":[]},{"given":"Carlos","family":"Costa","sequence":"additional","affiliation":[]},{"ORCID":"https:\/\/orcid.org\/0000-0002-3249-6229","authenticated-orcid":false,"given":"Maribel Yasmina","family":"Santos","sequence":"additional","affiliation":[]}],"member":"297","published-online":{"date-parts":[[2019,5,6]]},"reference":[{"key":"196_CR1","unstructured":"Apache (2014) Apache Hadoop. \n                    http:\/\/hadoop.apache.org\/\n                    \n                  ."},{"key":"196_CR2","unstructured":"Capriolo E, Wampler D, Rutherglen J. Programming Hive. O\u2019Reilly Media, Inc. 2012."},{"key":"196_CR3","doi-asserted-by":"crossref","unstructured":"Cassavia N, Dicosta P, Masciari E, Sacc\u00e0 D. Data preparation for tourist Data Big Data Warehousing. In: Proceedings of 3rd international conference on data management technologies and applications (DATA). SciTePress, 2014. p. 419\u201326.","DOI":"10.5220\/0005144004190426"},{"key":"196_CR4","unstructured":"Chavalier M, El Malki M, Kopliku A, et al. Document-Oriented Data Warehouses: models and extended cuboids. In: 10th international conference on research challenges in information science (RCIS). IEEE, 2016. P. 1\u201311."},{"key":"196_CR5","doi-asserted-by":"publisher","first-page":"79","DOI":"10.1007\/978-3-319-23135-8_6","volume-title":"Advances in Databases and Information Systems","author":"Max Chevalier","year":"2015","unstructured":"Chevalier M, El Malki M, Kopliku A, et al. Implementation of multidimensional databases in column-oriented NoSQL systems. In: East European conference on advances in databases and information systems. 2015. p. 79\u201391."},{"key":"196_CR6","doi-asserted-by":"crossref","unstructured":"Costa C, Santos MY. The SusCity big data warehousing approach for smart cities. In: Proceedings of the 21st international database engineering & applications symposium. 2017. p. 264\u201373.","DOI":"10.1145\/3105831.3105841"},{"key":"196_CR7","unstructured":"Costa C, Santos MY. Evaluating Several Design Patterns and Trends in Big Data Warehousing Systems. In J. Krogstie & H. A. Reijers (Eds.), Advanced Information Systems Engineering (Vol. 10816, pp. 459\u2013473). In: Proceedings of the 30th international conference on advanced information systems engineering (CAiSE\u20192018). Cham: Springer International Publishing; 2018."},{"key":"196_CR8","unstructured":"Costa E (2018) SSB Scripts. \n                    https:\/\/github.com\/EduardaCosta\/ScriptsSSB\n                    \n                  . Accessed 19 Dec 2018."},{"key":"196_CR9","first-page":"3","volume-title":"14th European, Mediterranean, and Middle Eastern Conference (EMCIS)","author":"E Costa","year":"2017","unstructured":"Costa E, Costa C, Santos MY. Efficient Big Data Modelling and Organization for Hadoop Hive-Based Data Warehouses. In: Themistocleous M, Morabito V, editors. 14th European, Mediterranean, and Middle Eastern Conference (EMCIS). Coimbra: Springer International Publishing; 2017. p. 3\u201316."},{"key":"196_CR10","doi-asserted-by":"crossref","unstructured":"Costa E, Costa C, Santos MY (2018) Partitioning and Bucketing in Hive-Based Big Data Warehouses. In: WorldCIST\u201918 - World Conference on Information Systems and Technologies. Springer International Publishing, pp 764\u2013774.","DOI":"10.1007\/978-3-319-77712-2_72"},{"key":"196_CR11","doi-asserted-by":"crossref","unstructured":"De Mauro A, Greco M, Grimaldi M. What is Big Data? A Consensual Definition and a Review of Key Research Topics. In: AIP conference proceedings. AIP Publishing; 2015. p. 97\u2013104.","DOI":"10.1063\/1.4907823"},{"key":"196_CR12","unstructured":"Dere J (2017) Apache Hive. \n                    https:\/\/cwiki.apache.org\/confluence\/display\/Hive\/Home\n                    \n                  ."},{"key":"196_CR13","doi-asserted-by":"publisher","first-page":"15","DOI":"10.4018\/IJDWM.2018010102","volume":"14","author":"F Di Tria","year":"2018","unstructured":"Di Tria F, Lefons E, Tangorra F. A framework for evaluating design methodologies for Big Data Warehouses: measurement of the design process. Int J Data Warehous Min. 2018;14:15\u201339. \n                    https:\/\/doi.org\/10.4018\/IJDWM.2018010102\n                    \n                  .","journal-title":"Int J Data Warehous Min"},{"key":"196_CR14","doi-asserted-by":"crossref","unstructured":"Di Tria F, Lefons E, Tangorra F. Design process for Big Data Warehouses. In: IEEE 2014 International conference on data science and advanced analytics (DSAA). 2014. p. 512\u201318.","DOI":"10.1109\/DSAA.2014.7058120"},{"key":"196_CR15","unstructured":"Du D. Apache Hive Essentials. Packt Publishing Ltd. 2015."},{"key":"196_CR16","unstructured":"Hortonworks I (2017) Hortonworks. \n                    https:\/\/hortonworks.com\n                    \n                  . Accessed 22 Oct 2017."},{"key":"196_CR17","unstructured":"Kimball R, Ross M. The Data Warehouse Toolkit: The Definitive Guide to Dimensional Modeling, 3 edn. New York: Wiley; 2013."},{"key":"196_CR18","doi-asserted-by":"crossref","unstructured":"Krishnan K (2013) Data Warehousing in the Age of Big Data. Elsevier Inc.","DOI":"10.1016\/B978-0-12-405891-0.00006-4"},{"key":"196_CR19","doi-asserted-by":"crossref","unstructured":"Kumar AS (2016) Performance analysis of MySQL Partition, Hive Partition-Bucketing and Apache Pig. In: Information Processing (IICIP), 2016 1st India International Conference. IEEE, p. 1\u20136.","DOI":"10.1109\/IICIP.2016.7975328"},{"key":"196_CR20","doi-asserted-by":"publisher","first-page":"237","DOI":"10.1007\/978-3-319-49944-4_18","volume-title":"International conference on research and practical issues of enterprise information systems","author":"B Martinho","year":"2016","unstructured":"Martinho B, Santos MY. An architecture for Data Warehousing in Big Data environments. International conference on research and practical issues of enterprise information systems. Cham: Springer; 2016. p. 237\u201350."},{"key":"196_CR21","doi-asserted-by":"publisher","DOI":"10.1007\/978-1-4302-4873-6","volume-title":"Big data imperatives: enterprise Big Data Warehouse, BI implementations and analytics","author":"S Mohanty","year":"2013","unstructured":"Mohanty S, Jagadeesh M, Srivatsa H. Big data imperatives: enterprise Big Data Warehouse, BI implementations and analytics. New York: Apress; 2013."},{"key":"196_CR22","unstructured":"O\u2019Neil P, O\u2019Neil B, Chen X. The star schema benchmark (SSB). 2007."},{"key":"196_CR23","doi-asserted-by":"publisher","first-page":"314","DOI":"10.1016\/j.ins.2014.01.015","volume":"275","author":"CL Philip Chen","year":"2014","unstructured":"Philip Chen CL, Zhang CY. Data-intensive applications, challenges, techniques and technologies: a survey on Big Data. Inf Sci. 2014;275:314\u201347. \n                    https:\/\/doi.org\/10.1016\/j.ins.2014.01.015\n                    \n                  .","journal-title":"Inf Sci"},{"key":"196_CR24","doi-asserted-by":"crossref","unstructured":"Pti\u010dek M, Vrdoljak B. Big Data and New Data Warehousing Approaches. In: Proceedings of the 2017 International Conference on Cloud and Big Data Computing. ACM, 2017. p. 6\u201310.","DOI":"10.1145\/3141128.3141139"},{"key":"196_CR25","unstructured":"Russom P. Evolving Data Warehouse Architectures in the Age of Big Data. 2014."},{"key":"196_CR26","doi-asserted-by":"crossref","unstructured":"Sandoval LJ. Design of business intelligence applications using big data technology. In: Central American and Panama Convention (CONCAPAN XXXV), 2015 IEEE Thirty Fifth. Institute of Electrical and Electronics Engineers Inc., 2016. p. 1\u20136.","DOI":"10.1109\/CONCAPAN.2015.7428454"},{"key":"196_CR27","doi-asserted-by":"crossref","unstructured":"Santos MY, Costa C (2016a) Data Warehousing in Big Data: from multidimensional to tabular data models. In: C3S2E\u201916\u2014Ninth international C* conference on computer science & software engineering. p. 10.","DOI":"10.1145\/2948992.2949024"},{"key":"196_CR28","doi-asserted-by":"crossref","first-page":"475","DOI":"10.1007\/978-3-319-40973-3_48","volume-title":"International Conference on Data Mining and Big Data","author":"MY Santos","year":"2016","unstructured":"Santos MY, Costa C. Data models in NoSQL databases for Big Data contexts. In: Tan Y, Shi Y, editors. International Conference on Data Mining and Big Data. Cham: Springer International Publishing; 2016. p. 475\u201385."},{"key":"196_CR29","doi-asserted-by":"crossref","unstructured":"Santos MY, Costa C, Galv\u00e3o J, et al. Evaluating SQL-on-Hadoop for Big Data Warehousing on not-so-good hardware. In: Proceedings of the 21st international database engineering & applications symposium. ACM, New York, NY, USA. 2017. p. 242\u201352.","DOI":"10.1145\/3105831.3105842"},{"key":"196_CR30","doi-asserted-by":"publisher","DOI":"10.1007\/978-1-4842-0271-5","volume-title":"Practical Hive: a guide to Hadoop\u2019s Data Warehouse System","author":"S Shaw","year":"2016","unstructured":"Shaw S, Vermeulen AF, Gupta A, Kjerrumgaard D. Practical Hive: a guide to Hadoop\u2019s Data Warehouse System. New York: Apress; 2016."},{"issue":"2","key":"196_CR31","doi-asserted-by":"publisher","first-page":"1626","DOI":"10.14778\/1687553.1687609","volume":"2","author":"Ashish Thusoo","year":"2009","unstructured":"Thusoo A, Sarma J Sen, Jain N, et al. Hive\u2014a Warehousing solution over a map-reduce framework. In: Proceedings of the VLDB endowment. 2009. p. 1626\u20139.","journal-title":"Proceedings of the VLDB Endowment"},{"key":"196_CR32","doi-asserted-by":"crossref","unstructured":"Thusoo A, Sen Sarma J, Jain N, et al. Hive\u2014a Petabyte Scale Data Warehouse using Hadoop. In: 2010 IEEE 26th international conference on Data Engineering (ICDE), 2010. p. 996\u20131005.","DOI":"10.1109\/ICDE.2010.5447738"},{"key":"196_CR33","unstructured":"TPC (2017a) TPC. \n                    http:\/\/www.tpc.org\/tpch\/\n                    \n                  ."},{"key":"196_CR34","unstructured":"TPC (2017b) TPC-H\u2014Homepage. \n                    http:\/\/www.tpc.org\/tpch\/\n                    \n                  . Accessed 16 Aug 2017."},{"key":"196_CR35","doi-asserted-by":"publisher","first-page":"255","DOI":"10.1016\/j.procs.2016.08.138","volume":"96","author":"R Yangui","year":"2016","unstructured":"Yangui R, Nabli A, Gargouri F. Automatic transformation of data warehouse schema to NoSQL data base: comparative study. Procedia Comput Sci. 2016;96:255\u201364.","journal-title":"Procedia Comput Sci"},{"key":"196_CR36","volume-title":"Understanding Big Data: analytics for enterprise class hadoop and streaming data","author":"P Zikopoulos","year":"2011","unstructured":"Zikopoulos P, Eaton C. Understanding Big Data: analytics for enterprise class hadoop and streaming data. 1st ed. Delhi: McGraw-Hill Osborne Media; 2011.","edition":"1"}],"container-title":["Journal of Big Data"],"original-title":[],"language":"en","link":[{"URL":"http:\/\/link.springer.com\/content\/pdf\/10.1186\/s40537-019-0196-1.pdf","content-type":"application\/pdf","content-version":"vor","intended-application":"text-mining"},{"URL":"http:\/\/link.springer.com\/article\/10.1186\/s40537-019-0196-1\/fulltext.html","content-type":"text\/html","content-version":"vor","intended-application":"text-mining"},{"URL":"http:\/\/link.springer.com\/content\/pdf\/10.1186\/s40537-019-0196-1.pdf","content-type":"application\/pdf","content-version":"vor","intended-application":"similarity-checking"}],"deposited":{"date-parts":[[2020,5,4]],"date-time":"2020-05-04T23:08:14Z","timestamp":1588633694000},"score":1,"resource":{"primary":{"URL":"https:\/\/journalofbigdata.springeropen.com\/articles\/10.1186\/s40537-019-0196-1"}},"subtitle":[],"short-title":[],"issued":{"date-parts":[[2019,5,6]]},"references-count":36,"journal-issue":{"issue":"1","published-print":{"date-parts":[[2019,12]]}},"alternative-id":["196"],"URL":"https:\/\/doi.org\/10.1186\/s40537-019-0196-1","relation":{},"ISSN":["2196-1115"],"issn-type":[{"value":"2196-1115","type":"electronic"}],"subject":[],"published":{"date-parts":[[2019,5,6]]},"assertion":[{"value":"10 January 2019","order":1,"name":"received","label":"Received","group":{"name":"ArticleHistory","label":"Article History"}},{"value":"22 April 2019","order":2,"name":"accepted","label":"Accepted","group":{"name":"ArticleHistory","label":"Article History"}},{"value":"6 May 2019","order":3,"name":"first_online","label":"First Online","group":{"name":"ArticleHistory","label":"Article History"}}],"article-number":"34"}}