{"status":"ok","message-type":"work","message-version":"1.0.0","message":{"indexed":{"date-parts":[[2025,3,25]],"date-time":"2025-03-25T16:28:46Z","timestamp":1742920126776,"version":"3.40.3"},"publisher-location":"Cham","reference-count":25,"publisher":"Springer International Publishing","isbn-type":[{"type":"print","value":"9783319999869"},{"type":"electronic","value":"9783319999876"}],"license":[{"start":{"date-parts":[[2018,1,1]],"date-time":"2018-01-01T00:00:00Z","timestamp":1514764800000},"content-version":"unspecified","delay-in-days":0,"URL":"http:\/\/www.springer.com\/tdm"}],"content-domain":{"domain":["link.springer.com"],"crossmark-restriction":false},"short-container-title":[],"published-print":{"date-parts":[[2018]]},"DOI":"10.1007\/978-3-319-99987-6_2","type":"book-chapter","created":{"date-parts":[[2018,8,30]],"date-time":"2018-08-30T05:57:05Z","timestamp":1535608625000},"page":"18-32","update-policy":"https:\/\/doi.org\/10.1007\/springer_crossmark_policy","source":"Crossref","is-referenced-by-count":0,"title":["The Use of Distributed Data Storage and Processing Systems in Bioinformatic Data Analysis"],"prefix":"10.1007","author":[{"given":"Micha\u0142","family":"Bochenek","sequence":"first","affiliation":[]},{"given":"Kamil","family":"Folkert","sequence":"additional","affiliation":[]},{"given":"Roman","family":"Jaksik","sequence":"additional","affiliation":[]},{"given":"Micha\u0142","family":"Krzesiak","sequence":"additional","affiliation":[]},{"given":"Marcin","family":"Michalak","sequence":"additional","affiliation":[]},{"given":"Marek","family":"Sikora","sequence":"additional","affiliation":[]},{"given":"Tomasz","family":"St\u0229clik","sequence":"additional","affiliation":[]},{"given":"\u0141ukasz","family":"Wr\u00f3bel","sequence":"additional","affiliation":[]}],"member":"297","published-online":{"date-parts":[[2018,8,31]]},"reference":[{"key":"2_CR1","unstructured":"Falco repository. https:\/\/github.com\/VCCRI\/Falco\/. Accessed 11 Dec 2017"},{"key":"2_CR2","unstructured":"The Cancer Genome Atlas. https:\/\/cancergenome.nih.gov\/"},{"issue":"1","key":"2_CR3","doi-asserted-by":"publisher","first-page":"25","DOI":"10.1038\/75556","volume":"25","author":"M Ashburner","year":"2000","unstructured":"Ashburner, M., et al.: Gene ontology: tool for the unification of biology. Nat. Genet. 25(1), 25\u201329 (2000)","journal-title":"Nat. Genet."},{"key":"2_CR4","doi-asserted-by":"publisher","first-page":"59","DOI":"10.1038\/nmeth.3176","volume":"12","author":"B Buchfink","year":"2015","unstructured":"Buchfink, B., Xie, C., Huson, D.: Fast and sensitive protein alignment using DIAMOND. Nat. Methods 12, 59\u201360 (2015)","journal-title":"Nat. Methods"},{"issue":"Part B","key":"2_CR5","doi-asserted-by":"publisher","first-page":"172","DOI":"10.1016\/j.compenvurbsys.2014.02.004","volume":"61","author":"S Gao","year":"2017","unstructured":"Gao, S., Li, L., Li, W., Janowicz, K., Zhang, Y.: Constructing gazetteers from volunteered big geo-data based on Hadoop. Comput. Environ. Urban Syst. 61(Part B), 172\u2013186 (2017)","journal-title":"Comput. Environ. Urban Syst."},{"issue":"5","key":"2_CR6","doi-asserted-by":"publisher","first-page":"29","DOI":"10.1145\/1165389.945450","volume":"37","author":"S Ghemawat","year":"2003","unstructured":"Ghemawat, S., Gobioff, H., Leung, S.T.: The Google file system. SIGOPS Oper. Syst. Rev. 37(5), 29\u201343 (2003)","journal-title":"SIGOPS Oper. Syst. Rev."},{"issue":"5","key":"2_CR7","doi-asserted-by":"publisher","first-page":"646","DOI":"10.1016\/j.cell.2011.02.013","volume":"144","author":"D Hanahan","year":"2011","unstructured":"Hanahan, D., Weinberg, R.: Hallmarks of cancer: the next generation. Cell 144(5), 646\u2013674 (2011)","journal-title":"Cell"},{"issue":"3","key":"2_CR8","doi-asserted-by":"publisher","first-page":"439","DOI":"10.1186\/s40880-015-0050-6","volume":"34","author":"TA Knijnenburg","year":"2015","unstructured":"Knijnenburg, T.A., Bismeijer, T., et al.: A multilevel pan-cancer map links gene mutations to cancer hallmarks. Chin. J. Cancer 34(3), 439\u2013449 (2015)","journal-title":"Chin. J. Cancer"},{"issue":"12","key":"2_CR9","doi-asserted-by":"publisher","first-page":"1585","DOI":"10.1093\/bioinformatics\/btg192","volume":"19","author":"KB Li","year":"2003","unstructured":"Li, K.B.: ClustalW-MPI: ClustalW analysis using distributed and parallel computing. Bioinformatics 19(12), 1585\u20131586 (2003)","journal-title":"Bioinformatics"},{"issue":"4","key":"2_CR10","doi-asserted-by":"publisher","first-page":"561","DOI":"10.1007\/s10723-015-9353-8","volume":"13","author":"D Mrozek","year":"2015","unstructured":"Mrozek, D., Gosk, P., Ma\u0142ysiak-Mrozek, B.: Scaling ab initio predictions of 3D protein structures in Microsoft Azure Cloud. J. Grid Comput. 13(4), 561\u2013585 (2015)","journal-title":"J. Grid Comput."},{"key":"2_CR11","series-title":"Lecture Notes in Computer Science (Lecture Notes in Artificial Intelligence)","doi-asserted-by":"publisher","first-page":"723","DOI":"10.1007\/978-3-319-54430-4_69","volume-title":"Intelligent Information and Database Systems","author":"D Mrozek","year":"2017","unstructured":"Mrozek, D., K\u0142apci\u0144ski, A., Ma\u0142ysiak-Mrozek, B.: Orchestrating task execution in Cloud4PSi for scalable processing of macromolecular data of 3D protein structures. In: Nguyen, N.T., Tojo, S., Nguyen, L.M., Trawi\u0144ski, B. (eds.) ACIIDS 2017. LNCS (LNAI), vol. 10192, pp. 723\u2013732. Springer, Cham (2017). https:\/\/doi.org\/10.1007\/978-3-319-54430-4_69"},{"issue":"5","key":"2_CR12","doi-asserted-by":"publisher","first-page":"1194","DOI":"10.1007\/s10766-016-0456-z","volume":"45","author":"P Natesan","year":"2017","unstructured":"Natesan, P., Rajalaxmi, R.R., Gowrison, G., Balasubramanie, P.: Hadoop based parallel binary bat algorithm for network intrusion detection. Int. J. Parallel Program. 45(5), 1194\u20131213 (2017)","journal-title":"Int. J. Parallel Program."},{"issue":"1","key":"2_CR13","doi-asserted-by":"crossref","first-page":"299","DOI":"10.1145\/2492101.1555384","volume":"37","author":"T Sandholm","year":"2009","unstructured":"Sandholm, T., Lai, K.: MapReduce optimization using regulated dynamic prioritization. SIGMETRICS Perform. Eval. Rev. 37(1), 299\u2013310 (2009)","journal-title":"SIGMETRICS Perform. Eval. Rev."},{"key":"2_CR14","doi-asserted-by":"crossref","unstructured":"Sarnovsky, M., Butka, P., Huzvarova, A.: Twitter data analysis and visualizations using the R language on top of the Hadoop platform. In: IEEE 15th International Symposium on Applied Machine Intelligence and Informatics, pp. 327\u2013331 (2017)","DOI":"10.1109\/SAMI.2017.7880327"},{"issue":"Suppl. 1","key":"2_CR15","doi-asserted-by":"publisher","first-page":"D674","DOI":"10.1093\/nar\/gkn653","volume":"37","author":"CF Schaefer","year":"2009","unstructured":"Schaefer, C.F., Anthony, K., et al.: PID: the pathway interaction database. Nucleic Acids Res. 37(Suppl. 1), D674\u2013D679 (2009)","journal-title":"Nucleic Acids Res."},{"issue":"B","key":"2_CR16","doi-asserted-by":"publisher","first-page":"198","DOI":"10.1016\/j.compenvurbsys.2013.12.003","volume":"61","author":"JL Schnase","year":"2017","unstructured":"Schnase, J.L., Duffy, D.Q., et al.: MERRA analytic services: meeting the big data challenges of climate science through cloud-enabled climate analytics-as-a-service. Comput. Environ. Urban Syst. 61(B), 198\u2013211 (2017)","journal-title":"Comput. Environ. Urban Syst."},{"issue":"1","key":"2_CR17","doi-asserted-by":"publisher","first-page":"34","DOI":"10.1186\/1471-2105-6-34","volume":"6","author":"SP Shah","year":"2005","unstructured":"Shah, S.P., Huang, Y., Xu, T., et al.: Atlas-a data warehouse for integrative bioinformatics. BMC Bioinform. 6(1), 34 (2005)","journal-title":"BMC Bioinform."},{"issue":"22","key":"2_CR18","doi-asserted-by":"publisher","first-page":"4673","DOI":"10.1093\/nar\/22.22.4673","volume":"22","author":"JD Thompson","year":"1994","unstructured":"Thompson, J.D., Higgins, D.G., Gibson, T.J.: CLUSTAL W: improving the sensitivity of progressive multiple sequence alignment through sequence weighting, position-specific gap penalties and weight matrix choice. Nucleic Acids Res. 22(22), 4673\u20134680 (1994)","journal-title":"Nucleic Acids Res."},{"issue":"2","key":"2_CR19","first-page":"49","volume":"5","author":"TT Thoralf","year":"2008","unstructured":"Thoralf, T.T., Kormeier, B., Klassen, A., Hofest\u00e4dt, R.: BioDWH: a data warehouse kit for life science data integration. J. Integr. Bioinform. 5(2), 49\u201357 (2008)","journal-title":"J. Integr. Bioinform."},{"issue":"1","key":"2_CR20","doi-asserted-by":"publisher","first-page":"25","DOI":"10.1186\/s13015-017-0116-x","volume":"12","author":"S Wan","year":"2017","unstructured":"Wan, S., Zou, Q.: HAlign-II: efficient ultra-large multiple sequence alignment and phylogenetic tree reconstruction with distributed and parallel computing. Algorithms Mol. Biol. 12(1), 25 (2017)","journal-title":"Algorithms Mol. Biol."},{"key":"2_CR21","volume-title":"The Definitive Guide","author":"T White","year":"2009","unstructured":"White, T.: The Definitive Guide. O\u2019Reilly Media, Newton (2009)"},{"issue":"5","key":"2_CR22","doi-asserted-by":"crossref","first-page":"767","DOI":"10.1093\/bioinformatics\/btw732","volume":"33","author":"A Yang","year":"2017","unstructured":"Yang, A., Troup, M., Lin, P., Ho, J.: Falco: a quick and flexible single-cell RNA-seq processing framework on the cloud. Bioinformatics 33(5), 767\u2013769 (2017)","journal-title":"Bioinformatics"},{"issue":"3","key":"2_CR23","first-page":"1037","volume":"13","author":"M Yang","year":"2017","unstructured":"Yang, M., Mei, H., Huang, D.: An effective detection of satellite images via k-means clustering on Hadoop system. Int. J. Innov. Comput. Inf. Control 13(3), 1037\u20131046 (2017)","journal-title":"Int. J. Innov. Comput. Inf. Control"},{"issue":"Suppl. C","key":"2_CR24","doi-asserted-by":"publisher","first-page":"58","DOI":"10.1016\/j.jbiotec.2017.02.020","volume":"257","author":"J Yu","year":"2017","unstructured":"Yu, J., Blom, J., Sczyrba, A., Goesmann, A.: Rapid protein alignment in the cloud: HAMOND combines fast DIAMOND alignments with Hadoop parallelism. J. Biotechnol. 257(Suppl. C), 58\u201360 (2017)","journal-title":"J. Biotechnol."},{"issue":"15","key":"2_CR25","doi-asserted-by":"publisher","first-page":"2475","DOI":"10.1093\/bioinformatics\/btv177","volume":"31","author":"Q Zou","year":"2015","unstructured":"Zou, Q., Hu, Q., et al.: HAlign: Fast multiple similar DNA\/RNA sequence alignment based on the centre star strategy. Bioinformatics 31(15), 2475\u20132481 (2015)","journal-title":"Bioinformatics"}],"container-title":["Communications in Computer and Information Science","Beyond Databases, Architectures and Structures. Facing the Challenges of Data Proliferation and Growing Variety"],"original-title":[],"language":"en","link":[{"URL":"https:\/\/link.springer.com\/content\/pdf\/10.1007\/978-3-319-99987-6_2","content-type":"unspecified","content-version":"vor","intended-application":"similarity-checking"}],"deposited":{"date-parts":[[2024,3,7]],"date-time":"2024-03-07T14:29:09Z","timestamp":1709821749000},"score":1,"resource":{"primary":{"URL":"https:\/\/link.springer.com\/10.1007\/978-3-319-99987-6_2"}},"subtitle":[],"short-title":[],"issued":{"date-parts":[[2018]]},"ISBN":["9783319999869","9783319999876"],"references-count":25,"URL":"https:\/\/doi.org\/10.1007\/978-3-319-99987-6_2","relation":{},"ISSN":["1865-0929","1865-0937"],"issn-type":[{"type":"print","value":"1865-0929"},{"type":"electronic","value":"1865-0937"}],"subject":[],"published":{"date-parts":[[2018]]},"assertion":[{"value":"31 August 2018","order":1,"name":"first_online","label":"First Online","group":{"name":"ChapterHistory","label":"Chapter History"}},{"value":"BDAS","order":1,"name":"conference_acronym","label":"Conference Acronym","group":{"name":"ConferenceInfo","label":"Conference Information"}},{"value":"International Conference: Beyond Databases, Architectures and Structures","order":2,"name":"conference_name","label":"Conference Name","group":{"name":"ConferenceInfo","label":"Conference Information"}},{"value":"Pozna\u0144","order":3,"name":"conference_city","label":"Conference City","group":{"name":"ConferenceInfo","label":"Conference Information"}},{"value":"Poland","order":4,"name":"conference_country","label":"Conference Country","group":{"name":"ConferenceInfo","label":"Conference Information"}},{"value":"2018","order":5,"name":"conference_year","label":"Conference Year","group":{"name":"ConferenceInfo","label":"Conference Information"}},{"value":"18 September 2018","order":7,"name":"conference_start_date","label":"Conference Start Date","group":{"name":"ConferenceInfo","label":"Conference Information"}},{"value":"20 September 2018","order":8,"name":"conference_end_date","label":"Conference End Date","group":{"name":"ConferenceInfo","label":"Conference Information"}},{"value":"14","order":9,"name":"conference_number","label":"Conference Number","group":{"name":"ConferenceInfo","label":"Conference Information"}},{"value":"bdas2018","order":10,"name":"conference_id","label":"Conference ID","group":{"name":"ConferenceInfo","label":"Conference Information"}},{"value":"http:\/\/bdas.polsl.pl\/","order":11,"name":"conference_url","label":"Conference URL","group":{"name":"ConferenceInfo","label":"Conference Information"}}]}}