{"status":"ok","message-type":"work","message-version":"1.0.0","message":{"indexed":{"date-parts":[[2026,3,24]],"date-time":"2026-03-24T13:15:02Z","timestamp":1774358102082,"version":"3.50.1"},"publisher-location":"Cham","reference-count":50,"publisher":"Springer International Publishing","isbn-type":[{"value":"9783030703691","type":"print"},{"value":"9783030703707","type":"electronic"}],"license":[{"start":{"date-parts":[[2021,1,1]],"date-time":"2021-01-01T00:00:00Z","timestamp":1609459200000},"content-version":"tdm","delay-in-days":0,"URL":"http:\/\/www.springer.com\/tdm"},{"start":{"date-parts":[[2021,1,1]],"date-time":"2021-01-01T00:00:00Z","timestamp":1609459200000},"content-version":"vor","delay-in-days":0,"URL":"http:\/\/www.springer.com\/tdm"}],"content-domain":{"domain":["link.springer.com"],"crossmark-restriction":false},"short-container-title":[],"published-print":{"date-parts":[[2021]]},"DOI":"10.1007\/978-3-030-70370-7_6","type":"book-chapter","created":{"date-parts":[[2021,2,19]],"date-time":"2021-02-19T23:37:06Z","timestamp":1613777826000},"page":"105-117","update-policy":"https:\/\/doi.org\/10.1007\/springer_crossmark_policy","source":"Crossref","is-referenced-by-count":10,"title":["Chapter 6 Big Data and FAIR Data for Data Science"],"prefix":"10.1007","author":[{"given":"Alexei","family":"Gvishiani","sequence":"first","affiliation":[]},{"given":"Michael","family":"Dobrovolsky","sequence":"additional","affiliation":[]},{"given":"Alena","family":"Rybkina","sequence":"additional","affiliation":[]}],"member":"297","published-online":{"date-parts":[[2021,2,20]]},"reference":[{"key":"6_CR1","unstructured":"Lohr, S.: The Origins of \u2018Big Data': An Etymological Detective Story. The New York Times (2013). https:\/\/bits.blogs.nytimes.com\/2013\/02\/01\/the-origins-of-big-data-an-etymological-detective-story\/"},{"key":"6_CR2","first-page":"1","volume":"7","author":"C Snijders","year":"2012","unstructured":"Snijders, C., Matzat, U., Reips, U.-D.: \u201cBig Data\u201d: big gaps of knowledge in the field of internet science. Int. J. Internet Sci. 7, 1\u20135 (2012)","journal-title":"Int. J. Internet Sci."},{"key":"6_CR3","series-title":"Lecture Notes in Business Information Processing","doi-asserted-by":"publisher","first-page":"114","DOI":"10.1007\/978-3-319-58801-8_10","volume-title":"Innovations in Enterprise Information Systems Management and Engineering","author":"N Dedi\u0107","year":"2017","unstructured":"Dedi\u0107, N., Stanier, C.: Towards differentiating business intelligence, big data, data analytics and knowledge discovery. In: Piazolo, F., Geist, V., Brehm, L., Schmidt, R. (eds.) ERP Future 2016. LNBIP, vol. 285, pp. 114\u2013122. Springer, Cham (2017). https:\/\/doi.org\/10.1007\/978-3-319-58801-8_10"},{"key":"6_CR4","doi-asserted-by":"publisher","first-page":"98","DOI":"10.1016\/j.is.2014.07.006","volume":"47","author":"IAT Hashem","year":"2015","unstructured":"Hashem, I.A.T., Yaqoob, I., Anuar, N.B., Mokhtar, S., Gani, A., Khan, S.U.: The rise of \u201cbig data\u201d on cloud computing: review and open research issues. Inf. Syst. 47, 98\u2013115 (2015). https:\/\/doi.org\/10.1016\/j.is.2014.07.006","journal-title":"Inf. Syst."},{"key":"6_CR5","unstructured":"Grimes, S.: Big Data: Avoid \u2018Wanna V\u2019 Confusion. InformationWeek (2013). https:\/\/www.informationweek.com\/big-data\/big-data-analytics\/big-data-avoid-wanna-v-confusion\/d\/d-id\/1111077"},{"key":"6_CR6","doi-asserted-by":"publisher","unstructured":"Fox, C.: Data Science for Transport. Springer Textbooks in Earth Sciences, Geography and Environment. Springer, Cham (2018). doi: https:\/\/doi.org\/10.1007\/978-3-319-72953-4","DOI":"10.1007\/978-3-319-72953-4"},{"key":"6_CR7","doi-asserted-by":"publisher","first-page":"382","DOI":"10.1108\/JFRC-06-2017-0054","volume":"26","author":"C Onay","year":"2018","unstructured":"Onay, C., \u00d6zt\u00fcrk, E.: A review of credit scoring research in the age of Big Data. J. Financ. Regul. Compliance. 26, 382\u2013405 (2018). https:\/\/doi.org\/10.1108\/JFRC-06-2017-0054","journal-title":"J. Financ. Regul. Compliance."},{"issue":"1","key":"6_CR8","doi-asserted-by":"publisher","first-page":"205395171663113","DOI":"10.1177\/2053951716631130","volume":"3","author":"R Kitchin","year":"2016","unstructured":"Kitchin, R., McArdle, G.: What makes Big Data, Big Data? Exploring the ontological characteristics of 26 datasets. Big Data Soc. 3(1), 2053951716631130 (2016). https:\/\/doi.org\/10.1177\/2053951716631130","journal-title":"Big Data Soc."},{"key":"6_CR9","doi-asserted-by":"publisher","unstructured":"NIST Big Data Interoperability Framework, vol. 1, Definitions. Version 3. NIST Special Publication 1500\u20131r2 (2019). https:\/\/doi.org\/10.6028\/NIST.SP.1500-1r2","DOI":"10.6028\/NIST.SP.1500-1r2"},{"key":"6_CR10","first-page":"602","volume":"4","author":"D Usha","year":"2014","unstructured":"Usha, D., Aps, J.A.: A survey of Big Data processing in perspective of Hadoop and MapReduce. Int. J. Curr. Eng. Technol. 4, 602\u2013606 (2014)","journal-title":"Int. J. Curr. Eng. Technol."},{"key":"6_CR11","volume-title":"Hadoop: The Definitive Guide","author":"T White","year":"2012","unstructured":"White, T.: Hadoop: The Definitive Guide. O\u2019Reilly Media Inc., United States (2012)"},{"key":"6_CR12","first-page":"1399","volume":"2","author":"NN Mall","year":"2016","unstructured":"Mall, N.N., Rana, S.: Overview of Big Data and Hadoop. Imperial J. Interdisc. Res. 2, 1399\u20131406 (2016)","journal-title":"Imperial J. Interdisc. Res."},{"key":"6_CR13","doi-asserted-by":"publisher","first-page":"45","DOI":"10.14257\/ijdta.2016.9.1.05","volume":"9","author":"BR Prasad","year":"2016","unstructured":"Prasad, B.R., Agarwal, S.: Comparative study of Big Data computing and storage tools: a review. Int. J. Database Theory Appl. 9, 45\u201366 (2016)","journal-title":"Int. J. Database Theory Appl."},{"key":"6_CR14","volume-title":"HBase in Action","author":"N Dimiduk","year":"2013","unstructured":"Dimiduk, N., Khurana, A., Ryan, M.H., Stack, M.: HBase in Action. Manning, Shelter Island (2013)"},{"issue":"1","key":"6_CR15","doi-asserted-by":"publisher","first-page":"389","DOI":"10.1007\/s11192-016-1945-y","volume":"109","author":"IAT Hashem","year":"2016","unstructured":"Hashem, I.A.T., Anuar, N.B., Gani, A., Yaqoob, I., Xia, F., Khan, S.U.: MapReduce: review and open challenges. Scientometrics 109(1), 389\u2013422 (2016). https:\/\/doi.org\/10.1007\/s11192-016-1945-y","journal-title":"Scientometrics"},{"key":"6_CR16","doi-asserted-by":"crossref","unstructured":"Chen, X., Hu, L., Liu, L., Chang, J., Bone, D.L.: Breaking down Hadoop distributed file systems data analytics tools: apache Hive vs. Apache Pig vs. pivotal HWAQ. In: 2017 IEEE 10th International Conference on Cloud Computing (CLOUD), pp. 794\u2013797. IEEE (2017)","DOI":"10.1109\/CLOUD.2017.117"},{"key":"6_CR17","doi-asserted-by":"publisher","first-page":"271","DOI":"10.14445\/22315381\/IJETT-V50P244","volume":"50","author":"C Swarna","year":"2017","unstructured":"Swarna, C., Ansari, Z.: Apache Pig - a data flow framework based on Hadoop Map Reduce. Int. J. Eng. Trends Technol. 50, 271\u2013275 (2017)","journal-title":"Int. J. Eng. Trends Technol."},{"key":"6_CR18","volume-title":"Programming Pig: Dataflow Scripting with Hadoop","author":"A Gates","year":"2016","unstructured":"Gates, A., Dai, D.: Programming Pig: Dataflow Scripting with Hadoop. O\u2019Reilly Media Inc., United States (2016)"},{"key":"6_CR19","doi-asserted-by":"publisher","unstructured":"Singh, N., Agrawal, S.: A performance analysis of high-level MapReduce query languages in Big Data. In: Proceedings of the International Congress on Information and Communication Technology, pp. 551\u2013558. Springer, Singapore (2016). https:\/\/doi.org\/10.1007\/978-981-10-0767-5_57","DOI":"10.1007\/978-981-10-0767-5_57"},{"key":"6_CR20","doi-asserted-by":"crossref","unstructured":"Camacho-Rodr\u00edguez, J., et al.: Apache Hive: From Mapreduce to enterprise-grade Big Data warehousing. In: Proceedings of the 2019 International Conference on Management of Data, pp. 1773\u20131786 (2019)","DOI":"10.1145\/3299869.3314045"},{"key":"6_CR21","unstructured":"Pen, H.D., Dsilva, P., Mascarnes, S.: Comparing HiveQL and MapReduce methods to process fact data in a data warehouse. In: 2017 2nd International Conference on Communication Systems, Computing and IT Applications (CSCITA), pp. 201\u2013206. IEEE (2017)"},{"key":"6_CR22","doi-asserted-by":"crossref","unstructured":"Vohra, D.: Using apache sqoop. In: Pro Docker, pp. 151\u2013183. Apress, Berkeley, CA (2016)","DOI":"10.1007\/978-1-4842-1830-3_11"},{"key":"6_CR23","first-page":"21","volume":"5","author":"EL Lydia","year":"2016","unstructured":"Lydia, E.L., Swarup, M.B.: Analysis of Big Data through Hadoop ecosystem components like flume mapreduce, pig and hive. Int. J. Comput. Sci. Eng. 5, 21\u201329 (2016)","journal-title":"Int. J. Comput. Sci. Eng."},{"key":"6_CR24","first-page":"557","volume":"5","author":"S Mehta","year":"2016","unstructured":"Mehta, S., Mehta, V.: Hadoop ecosystem: an introduction. IJSR. 5, 557\u2013562 (2016)","journal-title":"Hadoop ecosystem: an introduction. IJSR."},{"key":"6_CR25","volume-title":"Mastering Apache Storm: Real-time Big Data Streaming using Kafka","author":"A Jain","year":"2017","unstructured":"Jain, A.: Mastering Apache Storm: Real-time Big Data Streaming using Kafka. Packt Publishing Ltd., Hbase and Redis (2017)"},{"key":"6_CR26","doi-asserted-by":"publisher","first-page":"56","DOI":"10.1145\/2934664","volume":"59","author":"M Zaharia","year":"2016","unstructured":"Zaharia, M., et al.: Apache Spark: a unified engine for Big Data processing. Commun. ACM 59, 56\u201365 (2016)","journal-title":"Commun. ACM"},{"key":"6_CR27","doi-asserted-by":"crossref","unstructured":"Jayaratne, M., Alahakoon, D., De Silva, D., Yu, X.: Apache Spark based distributed self-organizing map algorithm for sensor data analysis. In: IECON 2017\u201343rd Annual Conference of the IEEE Industrial Electronics Society, pp. 8343\u20138349. IEEE (2017)","DOI":"10.1109\/IECON.2017.8217465"},{"key":"6_CR28","doi-asserted-by":"publisher","DOI":"10.1007\/978-1-4842-3579-9","volume-title":"Beginning Apache Spark 2: With Resilient Distributed Datasets, Spark Sql, Structured Streaming, and Spark Machine Learning Library","author":"H Luu","year":"2018","unstructured":"Luu, H.: Beginning Apache Spark 2: With Resilient Distributed Datasets, Spark Sql, Structured Streaming, and Spark Machine Learning Library. Apress, Berkeley (2018)"},{"key":"6_CR29","doi-asserted-by":"publisher","first-page":"103","DOI":"10.1007\/978-1-4842-2337-6_7","volume-title":"Beginning Apache Pig","author":"B Vaddeman","year":"2016","unstructured":"Vaddeman, B.: HCatalog. In: Beginning Apache Pig, pp. 103\u2013113. Apress, Berkeley, CA (2016). https:\/\/doi.org\/10.1007\/978-1-4842-2337-6_7"},{"key":"6_CR30","volume-title":"Apache Mahout: Beyond MapReduce","author":"D Lyubimov","year":"2016","unstructured":"Lyubimov, D., Palumbo, A.: Apache Mahout: Beyond MapReduce. CreateSpace Independent Publishing Platform, United States (2016)"},{"key":"6_CR31","doi-asserted-by":"publisher","first-page":"1","DOI":"10.1016\/j.bdr.2016.10.002","volume":"8","author":"D Schmidt","year":"2017","unstructured":"Schmidt, D., Chen, W.C., Matheson, M.A., Ostrouchov, G.: Programming with BIG data in R: scaling analytics from one to thousands of nodes. Big Data Res. 8, 1\u20131 (2017)","journal-title":"Big Data Res."},{"key":"6_CR32","doi-asserted-by":"publisher","first-page":"1","DOI":"10.1016\/j.bdr.2018.04.004","volume":"14","author":"R Elshawi","year":"2018","unstructured":"Elshawi, R., Sakr, S., Talia, D., Trunfio, P.: Big data systems meet machine learning challenges: towards Big Data science as a service. Big data Res. 14, 1\u20131 (2018)","journal-title":"Big data Res."},{"key":"6_CR33","volume-title":"Apache Zookeeper Essentials","author":"S Haloi","year":"2015","unstructured":"Haloi, S.: Apache Zookeeper Essentials. Packt Publishing Ltd., United Kingdom (2015)"},{"key":"6_CR34","doi-asserted-by":"publisher","first-page":"303","DOI":"10.1007\/978-1-4842-2199-0_7","volume-title":"Practical Hadoop Ecosystem","author":"D Vohra","year":"2016","unstructured":"Vohra, D.: Apache Avro. In: Practical Hadoop Ecosystem, pp. 303\u2013323. Apress, Berkeley, CA (2016). https:\/\/doi.org\/10.1007\/978-1-4842-2199-0_7"},{"key":"6_CR35","volume-title":"Apache Oozie: The Workflow Scheduler for Hadoop","author":"MK Islam","year":"2015","unstructured":"Islam, M.K., Srinivasan, A.: Apache Oozie: The Workflow Scheduler for Hadoop. O\u2019Reilly Media Inc., United States (2015)"},{"key":"6_CR36","doi-asserted-by":"publisher","first-page":"399","DOI":"10.1007\/978-1-4302-4864-4_20","volume-title":"Pro Apache Hadoop","author":"S Wadkar","year":"2014","unstructured":"Wadkar, S., Siddalingaiah, M.: Apache Ambari. In: Pro Apache Hadoop, pp. 399\u2013401. Apress, Berkeley, CA (2014). https:\/\/doi.org\/10.1007\/978-1-4302-4864-4_20"},{"key":"6_CR37","series-title":"Studies in Big Data","doi-asserted-by":"publisher","first-page":"83","DOI":"10.1007\/978-981-10-8476-8_5","volume-title":"Big Data in Engineering Applications","author":"A Saxena","year":"2018","unstructured":"Saxena, A., Singh, S., Shakya, C.: Concepts of HBase archetypes in Big Data engineering. In: Roy, S.S., Samui, P., Deo, R., Ntalampiras, S. (eds.) Big Data in Engineering Applications. SBD, vol. 44, pp. 83\u2013111. Springer, Singapore (2018). https:\/\/doi.org\/10.1007\/978-981-10-8476-8_5"},{"key":"6_CR38","doi-asserted-by":"crossref","unstructured":"Sirisha, N., Kiran, K.V.D.: Stock exchange analysis using Hadoop user experience (Hue). In: 2017 International Conference on Intelligent Sustainable Systems (ICISS), pp. 1141\u20131144. IEEE (2017)","DOI":"10.1109\/ISS1.2017.8389363"},{"key":"6_CR39","doi-asserted-by":"publisher","first-page":"47","DOI":"10.1089\/big.2014.0064","volume":"4","author":"F Ofli","year":"2016","unstructured":"Ofli, F., et al.: Combining human computing and machine learning to make sense of big (aerial) data for disaster response. Big Data. 4, 47\u201359 (2016). https:\/\/doi.org\/10.1089\/big.2014.0064","journal-title":"Big Data."},{"issue":"5","key":"6_CR40","doi-asserted-by":"publisher","first-page":"651","DOI":"10.1007\/s11036-013-0456-9","volume":"18","author":"D Chen","year":"2013","unstructured":"Chen, D., Liu, Z., Wang, L., Dou, M., Chen, J., Li, H.: Natural disaster monitoring with wireless sensor networks: a case study of data-intensive applications upon low-cost scalable systems. Mob. Netw. Appl. 18(5), 651\u2013663 (2013). https:\/\/doi.org\/10.1007\/s11036-013-0456-9","journal-title":"Mob. Netw. Appl."},{"key":"6_CR41","doi-asserted-by":"publisher","first-page":"1072","DOI":"10.1002\/qj.2396","volume":"141","author":"C MacLachlan","year":"2015","unstructured":"MacLachlan, C., et al.: Global seasonal forecast system version 5 (GloSea5): a high-resolution seasonal forecast system. Q. J. R. Meteorol. Soc. 141, 1072\u20131084 (2015). https:\/\/doi.org\/10.1002\/qj.2396","journal-title":"Q. J. R. Meteorol. Soc."},{"key":"6_CR42","doi-asserted-by":"publisher","first-page":"261","DOI":"10.1007\/978-3-662-45960-7_19","volume-title":"AI Approaches to the Complexity of Legal Systems","author":"M Poblet","year":"2014","unstructured":"Poblet, M., Garc\u00eda-Cuesta, E., Casanovas, P.: Crowdsourcing tools for disaster management: a review of platforms and methods. In: Casanovas, P., Pagallo, U., Palmirani, M., Sartor, G. (eds.) AI Approaches to the Complexity of Legal Systems, pp. 261\u2013274. Springer, Heidelberg (2014)"},{"key":"6_CR43","doi-asserted-by":"publisher","first-page":"75","DOI":"10.1080\/20964471.2017.1404232","volume":"1","author":"S Nativi","year":"2017","unstructured":"Nativi, S., Mazzetti, P., Craglia, M.: A view-based model of data-cube to support big earth data systems interoperability. Big Earth Data. 1, 75\u201399 (2017). https:\/\/doi.org\/10.1080\/20964471.2017.1404232","journal-title":"Big Earth Data."},{"key":"6_CR44","unstructured":"USGS Earth Explorer online portal. https:\/\/earthexplorer.usgs.gov\/"},{"key":"6_CR45","unstructured":"Copernicus Sentinel Hub. https:\/\/scihub.copernicus.eu\/"},{"key":"6_CR46","unstructured":"GEOSS portal. https:\/\/www.geoportal.org\/"},{"issue":"Suppl C","key":"6_CR47","doi-asserted-by":"publisher","first-page":"18","DOI":"10.1016\/j.rse.2017.06.031","volume":"202","author":"N Gorelick","year":"2017","unstructured":"Gorelick, N., Hancher, M., Dixon, M., Ilyushchenko, S., Thau, D., Moore, R.: GoogleEarth engine: planetary-scale geospatial analysis for everyone. Remote Sens. Environ. 202(Suppl C), 18\u201327 (2017). https:\/\/doi.org\/10.1016\/j.rse.2017.06.031","journal-title":"Remote Sens. Environ."},{"key":"6_CR48","doi-asserted-by":"publisher","first-page":"3","DOI":"10.1080\/17538947.2014.1003106","volume":"9","author":"P Baumann","year":"2016","unstructured":"Baumann, P., et al.: Big Data analytics for earth sciences: the earthserver approach. Int. J. Digit. Earth. 9, 3\u201329 (2016). https:\/\/doi.org\/10.1080\/17538947.2014.1003106","journal-title":"Int. J. Digit. Earth."},{"key":"6_CR49","doi-asserted-by":"publisher","first-page":"160018","DOI":"10.1038\/sdata.2016.18","volume":"3","author":"M Wilkinson","year":"2016","unstructured":"Wilkinson, M., Dumontier, M., Aalbersberg, I., et al.: The FAIR Guiding Principles for scientific data management and stewardship. Sci. Data. 3, 160018 (2016). https:\/\/doi.org\/10.1038\/sdata.2016.18","journal-title":"Sci. Data."},{"key":"6_CR50","unstructured":"GO FAIR initiative. https:\/\/www.go-fair.org\/"}],"container-title":["Lecture Notes in Computer Science","Resilience in the Digital Age"],"original-title":[],"language":"en","link":[{"URL":"http:\/\/link.springer.com\/content\/pdf\/10.1007\/978-3-030-70370-7_6","content-type":"unspecified","content-version":"vor","intended-application":"similarity-checking"}],"deposited":{"date-parts":[[2021,2,19]],"date-time":"2021-02-19T23:41:07Z","timestamp":1613778067000},"score":1,"resource":{"primary":{"URL":"http:\/\/link.springer.com\/10.1007\/978-3-030-70370-7_6"}},"subtitle":[],"short-title":[],"issued":{"date-parts":[[2021]]},"ISBN":["9783030703691","9783030703707"],"references-count":50,"URL":"https:\/\/doi.org\/10.1007\/978-3-030-70370-7_6","relation":{},"ISSN":["0302-9743","1611-3349"],"issn-type":[{"value":"0302-9743","type":"print"},{"value":"1611-3349","type":"electronic"}],"subject":[],"published":{"date-parts":[[2021]]},"assertion":[{"value":"20 February 2021","order":1,"name":"first_online","label":"First Online","group":{"name":"ChapterHistory","label":"Chapter History"}}]}}