{"status":"ok","message-type":"work","message-version":"1.0.0","message":{"indexed":{"date-parts":[[2026,1,30]],"date-time":"2026-01-30T06:36:38Z","timestamp":1769754998655,"version":"3.49.0"},"reference-count":34,"publisher":"Oxford University Press (OUP)","license":[{"start":{"date-parts":[[2019,11,14]],"date-time":"2019-11-14T00:00:00Z","timestamp":1573689600000},"content-version":"vor","delay-in-days":0,"URL":"http:\/\/creativecommons.org\/licenses\/by\/4.0\/"}],"funder":[{"DOI":"10.13039\/501100001700","name":"Ministry of Education, Culture, Sports, Science and Technology","doi-asserted-by":"publisher","award":["JPMJCR1501"],"award-info":[{"award-number":["JPMJCR1501"]}],"id":[{"id":"10.13039\/501100001700","id-type":"DOI","asserted-by":"publisher"}]}],"content-domain":{"domain":[],"crossmark-restriction":false},"short-container-title":[],"abstract":"<jats:title>Abstract<\/jats:title>\n               <jats:p>The Bioinformation and DDBJ Center (https:\/\/www.ddbj.nig.ac.jp) in the National Institute of Genetics (NIG) maintains a primary nucleotide sequence database as a member of the International Nucleotide Sequence Database Collaboration (INSDC) in partnership with the US National Center for Biotechnology Information and the European Bioinformatics Institute. The NIG operates the NIG supercomputer as a computational basis for the construction of DDBJ databases and as a large-scale computational resource for Japanese biologists and medical researchers. In order to accommodate the rapidly growing amount of deoxyribonucleic acid (DNA) nucleotide sequence data, NIG replaced its supercomputer system, which is designed for big data analysis of genome data, in early 2019. The new system is equipped with 30 PB of DNA data archiving storage; large-scale parallel distributed file systems (13.8 PB in total) and 1.1 PFLOPS computation nodes and graphics processing units (GPUs). Moreover, as a starting point of developing multi-cloud infrastructure of bioinformatics, we have also installed an automatic file transfer system that allows users to prevent data lock-in and to achieve cost\/performance balance by exploiting the most suitable environment from among the supercomputer and public clouds for different workloads.<\/jats:p>","DOI":"10.1093\/nar\/gkz982","type":"journal-article","created":{"date-parts":[[2019,10,21]],"date-time":"2019-10-21T15:20:39Z","timestamp":1571671239000},"source":"Crossref","is-referenced-by-count":8,"title":["DDBJ Database updates and computational infrastructure enhancement"],"prefix":"10.1093","author":[{"ORCID":"https:\/\/orcid.org\/0000-0001-6001-3397","authenticated-orcid":false,"given":"Osamu","family":"Ogasawara","sequence":"first","affiliation":[{"name":"The Bioinformation and DDBJ Center, National Institute of Genetics, Mishima, Shizuoka, 411-8540, Japan"}]},{"ORCID":"https:\/\/orcid.org\/0000-0001-7691-9812","authenticated-orcid":false,"given":"Yuichi","family":"Kodama","sequence":"additional","affiliation":[{"name":"The Bioinformation and DDBJ Center, National Institute of Genetics, Mishima, Shizuoka, 411-8540, Japan"}]},{"ORCID":"https:\/\/orcid.org\/0000-0003-4138-1893","authenticated-orcid":false,"given":"Jun","family":"Mashima","sequence":"additional","affiliation":[{"name":"The Bioinformation and DDBJ Center, National Institute of Genetics, Mishima, Shizuoka, 411-8540, Japan"}]},{"given":"Takehide","family":"Kosuge","sequence":"additional","affiliation":[{"name":"The Bioinformation and DDBJ Center, National Institute of Genetics, Mishima, Shizuoka, 411-8540, Japan"}]},{"given":"Takatomo","family":"Fujisawa","sequence":"additional","affiliation":[{"name":"The Bioinformation and DDBJ Center, National Institute of Genetics, Mishima, Shizuoka, 411-8540, Japan"}]}],"member":"286","published-online":{"date-parts":[[2019,11,14]]},"reference":[{"key":"2019111404585535900_B1","doi-asserted-by":"crossref","first-page":"D69","DOI":"10.1093\/nar\/gky1002","article-title":"DDBJ update: the Genomic expression archive (GEA) for functional genomics data","volume":"47","author":"Kodama","year":"2019","journal-title":"Nucleic Acids Res."},{"key":"2019111404585535900_B2","doi-asserted-by":"crossref","first-page":"D94","DOI":"10.1093\/nar\/gky989","article-title":"GenBank","volume":"47","author":"Sayers","year":"2019","journal-title":"Nucleic Acids Res."},{"key":"2019111404585535900_B3","doi-asserted-by":"crossref","first-page":"D84","DOI":"10.1093\/nar\/gky1078","article-title":"The european nucleotide archive in 2018","volume":"47","author":"Harrison","year":"2019","journal-title":"Nucleic Acids Res."},{"key":"2019111404585535900_B4","doi-asserted-by":"crossref","first-page":"D48","DOI":"10.1093\/nar\/gkx1097","article-title":"The international nucleotide sequence database collaboration","volume":"46","author":"Karsch-Mizrachi","year":"2018","journal-title":"Nucleic Acids Res."},{"key":"2019111404585535900_B5","doi-asserted-by":"crossref","first-page":"D54","DOI":"10.1093\/nar\/gkr854","article-title":"The Sequence Read Archive: explosive growth of sequencing data","volume":"40","author":"Kodama","year":"2012","journal-title":"Nucleic Acids Res."},{"key":"2019111404585535900_B6","doi-asserted-by":"crossref","first-page":"1275","DOI":"10.4056\/sigs.4851102","article-title":"Toward richer metadata for microbial sequences: replacing strain-level NCBI taxonomy taxids with BioProject, BioSample and Assembly records","volume":"9","author":"Federhen","year":"2014","journal-title":"Stand. Genomic Sci."},{"key":"2019111404585535900_B7","doi-asserted-by":"crossref","first-page":"1333","DOI":"10.1126\/science.298.5597.1333b","article-title":"Nucleotide sequence database policies","volume":"298","author":"Brunak","year":"2002","journal-title":"Science"},{"key":"2019111404585535900_B8","doi-asserted-by":"crossref","first-page":"93","DOI":"10.1007\/978-1-4939-3578-9_5","article-title":"The gene expression omnibus database","volume":"1418","author":"Clough","year":"2016","journal-title":"Methods Mol. Biol."},{"key":"2019111404585535900_B9","doi-asserted-by":"crossref","first-page":"D1113","DOI":"10.1093\/nar\/gku1057","article-title":"ArrayExpress update-simplifying data submissions","volume":"43","author":"Kolesnikov","year":"2015","journal-title":"Nucleic Acids Res."},{"key":"2019111404585535900_B10","doi-asserted-by":"crossref","first-page":"D18","DOI":"10.1093\/nar\/gku1120","article-title":"The DDBJ Japanese Genotype-phenotype Archive for genetic and phenotypic human data","volume":"43","author":"Kodama","year":"2015","journal-title":"Nucleic Acids Res."},{"key":"2019111404585535900_B11","doi-asserted-by":"crossref","first-page":"D25","DOI":"10.1093\/nar\/gks1152","article-title":"DDBJ new system and service refactoring","volume":"41","author":"Ogasawara","year":"2013","journal-title":"Nucleic Acids Res."},{"key":"2019111404585535900_B12","doi-asserted-by":"crossref","DOI":"10.1101\/700864","article-title":"Functional annotation of human long Non-Coding RNAs via molecular phenotyping","author":"Ramilowski","year":"2019"},{"key":"2019111404585535900_B13","doi-asserted-by":"crossref","DOI":"10.1101\/626754","article-title":"All of gene expression (AOE): an integrated index for public gene expression databases","author":"Bono","year":"2019"},{"key":"2019111404585535900_B14","doi-asserted-by":"crossref","first-page":"D819","DOI":"10.1093\/nar\/gkw1139","article-title":"The dbGaP data browser: a new tool for browsing dbGaP controlled-access genomic data","volume":"45","author":"Wong","year":"2017","journal-title":"Nucleic Acids Res."},{"key":"2019111404585535900_B15","doi-asserted-by":"crossref","first-page":"692","DOI":"10.1038\/ng.3312","article-title":"The European Genome-phenome Archive of human data consented for biomedical research","volume":"47","author":"Lappalainen","year":"2015","journal-title":"Nat. Genet."},{"key":"2019111404585535900_B16","doi-asserted-by":"crossref","first-page":"220","DOI":"10.1038\/s41587-019-0046-x","article-title":"Federated discovery and sharing of genomic data using Beacons","volume":"37","author":"Fiume","year":"2019","journal-title":"Nat. Biotechnol."},{"key":"2019111404585535900_B17","doi-asserted-by":"crossref","first-page":"406","DOI":"10.1038\/nbt.3790","article-title":"Discovering and linking public omics data sets using the omics discovery index","volume":"35","author":"Perez-Riverol","year":"2017","journal-title":"Nat. Biotechnol."},{"key":"2019111404585535900_B18","volume-title":"Computer Architecture: A Quantitative Approach","author":"Hennessy","year":"2017","edition":"6th edn"},{"key":"2019111404585535900_B19","first-page":"105","article-title":"SGI UV2: a fused computation and data analysis machine","volume-title":"Proceedings of the International Conference on High Performance Computing, Networking, Storage and Analysis","author":"Thorson","year":"2012"},{"key":"2019111404585535900_B20","first-page":"3","article-title":"Databases Theory and Applications, 29th Australasian Database Conference","volume-title":"Lecture Notes in Computer Science","author":"Dreseler","year":"2018"},{"key":"2019111404585535900_B21","doi-asserted-by":"crossref","first-page":"491","DOI":"10.1038\/ng.806","article-title":"A framework for variation discovery and genotyping using next-generation DNA sequencing data","volume":"43","author":"DePristo","year":"2011","journal-title":"Nat. Genet."},{"key":"2019111404585535900_B22","doi-asserted-by":"crossref","first-page":"213","DOI":"10.1038\/nbt.2514","article-title":"Sensitive detection of somatic point mutations in impure and heterogeneous cancer samples","volume":"31","author":"Cibulskis","year":"2013","journal-title":"Nat. Biotechnol."},{"key":"2019111404585535900_B23","doi-asserted-by":"crossref","DOI":"10.1109\/ICC.2017.7996843","article-title":"SINET5: A low-latency and high-bandwidth backbone network for SDN\/NFV Era","volume-title":"IEEE International Conference on Communications (ICC)","author":"Kurimoto","year":"2017"},{"key":"2019111404585535900_B24","volume-title":"IBM Spectrum Scale (formerly GPFS)","author":"Quintero","year":"2015"},{"key":"2019111404585535900_B25","volume-title":"IBM Linear Tape File System Enterprise Edition V1.1.1.2 Installation and Configuration Guide","author":"Coyne","year":"2015"},{"key":"2019111404585535900_B26","volume-title":"IBM Elastic Storage Server Implementation guide for Version 5.3: Common Scenarios and Use Cases","author":"Bolinches","year":"2019"},{"key":"2019111404585535900_B27","volume-title":"IBM TS4500 R5 Tape Library Guide","author":"Coyne","year":"2019"},{"key":"2019111404585535900_B28","doi-asserted-by":"crossref","first-page":"e0177459","DOI":"10.1371\/journal.pone.0177459","article-title":"Singularity: Scientific containers for mobility of compute","volume":"12","author":"Kurtzer","year":"2017","journal-title":"PloS one"},{"key":"2019111404585535900_B29","doi-asserted-by":"crossref","first-page":"139","DOI":"10.1109\/IC2E.2019.00028","article-title":"Importance of Application-level resource management in Multi-cloud deployments","volume-title":"2019 IEEE International Conference on Cloud Engineering (IC2E)","author":"Dimitrijevic","year":"2019"},{"key":"2019111404585535900_B30","first-page":"160","volume-title":"Dynamic Framework for Reconfiguring Computing Resources in the Inter-cloud and Its Application to Genome Analysis Workflows. International Conference on Internet and Distributed Computing Systems","author":"Tanjo","year":"2018"},{"key":"2019111404585535900_B31","doi-asserted-by":"crossref","first-page":"137","DOI":"10.1109\/CloudCom2018.2018.00037","article-title":"Optimal and Feasible Cloud Resource Configurations Generation Method for Genomic Analytics Applications","volume-title":"Proceedings of the 2018 IEEE International Conference on Cloud Computing Technology and Science (CloudCom)","author":"Miura","year":"2018"},{"key":"2019111404585535900_B32","doi-asserted-by":"crossref","first-page":"831","DOI":"10.1109\/CLOUD.2018.00115","article-title":"Optimal Cloud Resource Selection Method Considering Hard and Soft Constraints and Multiple Conflicting Objectives","volume-title":"Proceedings of the 2018 IEEE 11th International Conference on Cloud Computing (CLOUD)","author":"Powell","year":"2018"},{"key":"2019111404585535900_B33","first-page":"298","article-title":"Towards a small diverse pareto-optimal solutions set generator for multiobjective optimization problems","volume-title":"Proceedings of the 2018 Genetic and Evolutionary Computation Conference (GECCO)","author":"Powell","year":"2018"},{"key":"2019111404585535900_B34","doi-asserted-by":"crossref","first-page":"giz052","DOI":"10.1093\/gigascience\/giz052","article-title":"Accumulating computational resource usage of genomic data analysis workflow to optimize cloud computing instance selection","volume":"8","author":"Ohta","year":"2019","journal-title":"Gigascience"}],"container-title":["Nucleic Acids Research"],"original-title":[],"language":"en","link":[{"URL":"http:\/\/academic.oup.com\/nar\/advance-article-pdf\/doi\/10.1093\/nar\/gkz982\/30737568\/gkz982.pdf","content-type":"application\/pdf","content-version":"vor","intended-application":"syndication"},{"URL":"http:\/\/academic.oup.com\/nar\/advance-article-pdf\/doi\/10.1093\/nar\/gkz982\/30737568\/gkz982.pdf","content-type":"unspecified","content-version":"vor","intended-application":"similarity-checking"}],"deposited":{"date-parts":[[2019,11,14]],"date-time":"2019-11-14T04:59:46Z","timestamp":1573707586000},"score":1,"resource":{"primary":{"URL":"https:\/\/academic.oup.com\/nar\/advance-article\/doi\/10.1093\/nar\/gkz982\/5625536"}},"subtitle":[],"short-title":[],"issued":{"date-parts":[[2019,11,14]]},"references-count":34,"URL":"https:\/\/doi.org\/10.1093\/nar\/gkz982","relation":{},"ISSN":["0305-1048","1362-4962"],"issn-type":[{"value":"0305-1048","type":"print"},{"value":"1362-4962","type":"electronic"}],"subject":[],"published":{"date-parts":[[2019,11,14]]},"article-number":"gkz982"}}