{"status":"ok","message-type":"work","message-version":"1.0.0","message":{"indexed":{"date-parts":[[2025,7,30]],"date-time":"2025-07-30T11:43:41Z","timestamp":1753875821284,"version":"3.41.2"},"reference-count":27,"publisher":"Oxford University Press (OUP)","issue":"4","license":[{"start":{"date-parts":[[2024,3,19]],"date-time":"2024-03-19T00:00:00Z","timestamp":1710806400000},"content-version":"vor","delay-in-days":0,"URL":"https:\/\/creativecommons.org\/licenses\/by\/4.0\/"}],"funder":[{"name":"DX Fellowship Code","award":["PH8D230001"],"award-info":[{"award-number":["PH8D230001"]}]}],"content-domain":{"domain":[],"crossmark-restriction":false},"short-container-title":[],"published-print":{"date-parts":[[2024,3,29]]},"abstract":"<jats:title>Abstract<\/jats:title>\n               <jats:sec>\n                  <jats:title>Motivation<\/jats:title>\n                  <jats:p>Motivated by the challenges of decentralized genetic data spread across multiple international organizations, GINSA leverages the Global Biodiversity Information Facility infrastructure to automatically retrieve and link small ribosomal subunit sequences with locality information.<\/jats:p>\n               <\/jats:sec>\n               <jats:sec>\n                  <jats:title>Results<\/jats:title>\n                  <jats:p>Testing on taxa from major organism groups demonstrates broad applicability across taxonomic levels and dataset sizes.<\/jats:p>\n               <\/jats:sec>\n               <jats:sec>\n                  <jats:title>Availability and implementation<\/jats:title>\n                  <jats:p>GINSA is a freely accessible Python program under the MIT License and can be installed from PyPI via pip.<\/jats:p>\n               <\/jats:sec>","DOI":"10.1093\/bioinformatics\/btae152","type":"journal-article","created":{"date-parts":[[2024,3,19]],"date-time":"2024-03-19T22:38:50Z","timestamp":1710887930000},"source":"Crossref","is-referenced-by-count":0,"title":["GINSA: an accumulator for paired locality and next-generation small ribosomal subunit sequence data"],"prefix":"10.1093","volume":"40","author":[{"ORCID":"https:\/\/orcid.org\/0000-0002-3141-042X","authenticated-orcid":false,"given":"Eric","family":"Odle","sequence":"first","affiliation":[{"name":"Department of Natural History Sciences, Graduate School of Science, Hokkaido University , Sapporo, Hokkaido 060-0810, Japan"}]},{"ORCID":"https:\/\/orcid.org\/0000-0001-8299-8908","authenticated-orcid":false,"given":"Samuel","family":"Kahng","sequence":"additional","affiliation":[{"name":"Department of Oceanography, University of Hawaii at Manoa , Honolulu, HI 96822, United States"},{"name":"Institute for the Advancement of Higher Education, Hokkaido University , Sapporo, Hokkaido 060-0817, Japan"}]},{"given":"Siratee","family":"Riewluang","sequence":"additional","affiliation":[{"name":"Department of Natural History Sciences, Graduate School of Science, Hokkaido University , Sapporo, Hokkaido 060-0810, Japan"}]},{"given":"Kyoko","family":"Kurihara","sequence":"additional","affiliation":[{"name":"Department of Natural History Sciences, Graduate School of Science, Hokkaido University , Sapporo, Hokkaido 060-0810, Japan"}]},{"given":"Kevin C","family":"Wakeman","sequence":"additional","affiliation":[{"name":"Institute for the Advancement of Higher Education, Hokkaido University , Sapporo, Hokkaido 060-0817, Japan"},{"name":"Graduate School of Science, Hokkaido University , Sapporo, Hokkaido 060-0810, Japan"}]}],"member":"286","published-online":{"date-parts":[[2024,3,19]]},"reference":[{"key":"2024040222425367100_btae152-B1","doi-asserted-by":"crossref","first-page":"4","DOI":"10.1111\/jeu.12691","article-title":"Revisions to the classification, nomenclature, and diversity of eukaryotes","volume":"66","author":"Adl","year":"2019","journal-title":"J Eukaryot Microbiol"},{"key":"2024040222425367100_btae152-B2","doi-asserted-by":"crossref","first-page":"2963","DOI":"10.1093\/nar\/21.13.2963","article-title":"Genbank","volume":"21","author":"Benson","year":"1993","journal-title":"Nucleic Acids Res"},{"key":"2024040222425367100_btae152-B3","doi-asserted-by":"crossref","first-page":"D121","DOI":"10.1093\/nar\/gkac1051","article-title":"The European nucleotide archive in 2022","volume":"51","author":"Burgin","year":"2023","journal-title":"Nucleic Acids Res"},{"key":"2024040222425367100_btae152-B4","doi-asserted-by":"crossref","first-page":"1056","DOI":"10.1007\/s00248-022-02018-4","article-title":"DNA metabarcoding reveals cryptic diversity in Forest soils on the isolated Brazilian Trindade Island, South Atlantic","volume":"85","author":"C\u00e2mara","year":"2023","journal-title":"Microb Ecol"},{"key":"2024040222425367100_btae152-B5","doi-asserted-by":"crossref","first-page":"532","DOI":"10.12688\/f1000research.18676.1","article-title":"pysradb: a python package to query next-generation sequencing metadata and data from NCBI sequence read archive","volume":"8","author":"Choudhary","year":"2019","journal-title":"F1000Res"},{"key":"2024040222425367100_btae152-B6","doi-asserted-by":"crossref","first-page":"122","DOI":"10.1108\/LR-06-2015-0061","article-title":"A formal definition of big data based on its essential features","volume":"65","author":"De Mauro","year":"2016","journal-title":"Library Rev"},{"key":"2024040222425367100_btae152-B7","doi-asserted-by":"crossref","first-page":"btac667","DOI":"10.1093\/bioinformatics\/btac667","article-title":"Metadata retrieval from sequence databases with FFQ","volume":"39","author":"G\u00e1lvez-Merch\u00e1n","year":"2023","journal-title":"Bioinformatics"},{"key":"2024040222425367100_btae152-B8","doi-asserted-by":"crossref","first-page":"13","DOI":"10.1093\/nar\/24.1.13","article-title":"The genome sequence database (GSDB): meeting the challenge of genomic sequencing","volume":"24","author":"Keen","year":"1996","journal-title":"Nucleic Acids Res"},{"key":"2024040222425367100_btae152-B9","doi-asserted-by":"crossref","first-page":"5478","DOI":"10.1073\/pnas.94.10.5478","article-title":"Concordance of gene genealogies reveals reproductive isolation in the pathogenic fungus Coccidioides immitis","volume":"94","author":"Koufopanou","year":"1997","journal-title":"Proc Natl Acad Sci USA"},{"key":"2024040222425367100_btae152-B10","doi-asserted-by":"crossref","first-page":"67","DOI":"10.1016\/j.tplants.2014.11.005","article-title":"Chlorella: 125 years of the green survivalist","volume":"20","author":"Krienitz","year":"2015","journal-title":"Trends Plant Sci"},{"key":"2024040222425367100_btae152-B11","doi-asserted-by":"crossref","first-page":"391","DOI":"10.1093\/sysbio\/syac069","article-title":"Estimating global biodiversity: the role of cryptic insect species","volume":"72","author":"Li","year":"2023","journal-title":"Syst Biol"},{"key":"2024040222425367100_btae152-B12","doi-asserted-by":"crossref","first-page":"49","DOI":"10.1016\/j.ejsobi.2018.03.004","article-title":"Why are we blind to cryptic species? lessons from the eyeless","volume":"86","author":"March\u00e1n","year":"2018","journal-title":"Eur J Soil Biol"},{"key":"2024040222425367100_btae152-B13","doi-asserted-by":"crossref","first-page":"1403","DOI":"10.1007\/s12237-016-0087-z","article-title":"Functional, phylogenetic and host-geographic signatures of Labyrinthula spp. provide for putative species delimitation and a global-scale view of seagrass wasting disease","volume":"39","author":"Martin","year":"2016","journal-title":"Estuaries and Coasts"},{"key":"2024040222425367100_btae152-B14","doi-asserted-by":"crossref","first-page":"76","DOI":"10.3390\/md21020076","article-title":"Cryptic diversity of black band disease cyanobacteria in Siderastrea siderea corals revealed by chemical ecology and comparative genome-resolved metagenomics","volume":"21","author":"Meyer","year":"2023","journal-title":"Mar Drugs"},{"key":"2024040222425367100_btae152-B15","doi-asserted-by":"crossref","first-page":"1231","DOI":"10.1093\/sysbio\/syaa026","article-title":"Repositories for taxonomic data: where we are and what is missing","volume":"69","author":"Miralles","year":"2020","journal-title":"Syst Biol"},{"key":"2024040222425367100_btae152-B16","first-page":"1886","article-title":"Cryptic speciation in the cosmopolitan and clonal human pathogenic fungus Aspergillus fumigatus","volume":"59","author":"Pringle","year":"2005","journal-title":"Evol"},{"key":"2024040222425367100_btae152-B17","doi-asserted-by":"crossref","first-page":"1895","DOI":"10.1038\/s41564-019-0510-x","article-title":"Cryptic inoviruses revealed as pervasive in bacteria and archaea across earth\u2019s biomes","volume":"4","author":"Roux","year":"2019","journal-title":"Nat Microbiol"},{"key":"2024040222425367100_btae152-B18","doi-asserted-by":"crossref","first-page":"207","DOI":"10.1016\/S0932-4739(11)80059-3","article-title":"Protist evolution and phylogeny as discerned from small subunit ribosomal RNA sequence comparisons","volume":"27","author":"Schlegel","year":"1991","journal-title":"Eur J Protistol"},{"key":"2024040222425367100_btae152-B19","doi-asserted-by":"crossref","first-page":"60","DOI":"10.1086\/658657","article-title":"The experimenter\u2019s museum: Genbank, natural history, and the moral economies of biomedicine","volume":"102","author":"Strasser","year":"2011","journal-title":"Isis"},{"key":"2024040222425367100_btae152-B20","doi-asserted-by":"crossref","first-page":"D101","DOI":"10.1093\/nar\/gkac1083","article-title":"DNA data bank of Japan (DDBJ) update report 2022","volume":"51","author":"Tanizawa","year":"2023","journal-title":"Nucleic Acids Res"},{"key":"2024040222425367100_btae152-B21","doi-asserted-by":"crossref","first-page":"3607","DOI":"10.1093\/bioinformatics\/btaa167","article-title":"grabseqs: simple downloading of reads and metadata from multiple next-generation sequencing data repositories","volume":"36","author":"Taylor","year":"2020","journal-title":"Bioinformatics"},{"year":"1995","author":"Van Rossum","key":"2024040222425367100_btae152-B22"},{"key":"2024040222425367100_btae152-B23","doi-asserted-by":"crossref","first-page":"1710","DOI":"10.3390\/plants12081710","article-title":"Population genetic structure and diversity of cryptic species of the plant genus Macrocarpaea (gentianaceae) from the tropical Andes","volume":"12","author":"Vieu","year":"2023","journal-title":"Plants"},{"key":"2024040222425367100_btae152-B24","doi-asserted-by":"crossref","first-page":"514","DOI":"10.1111\/jeu.12059","article-title":"Molecular phylogeny of marine gregarine parasites (apicomplexa) from tube-forming polychaetes (sabellariidae, cirratulidae, and serpulidae), including descriptions of two new species of Selenidium","volume":"60","author":"Wakeman","year":"2013","journal-title":"J Eukaryot Microbiol"},{"year":"2020","author":"Waller","key":"2024040222425367100_btae152-B25"},{"key":"2024040222425367100_btae152-B26","doi-asserted-by":"crossref","first-page":"109","DOI":"10.1146\/annurev-genom-101722-103045","article-title":"Long-read DNA sequencing: recent advances and remaining challenges","volume":"24","author":"Warburton","year":"2023","journal-title":"Annu Rev Genomics Hum Genet"},{"key":"2024040222425367100_btae152-B27","doi-asserted-by":"crossref","first-page":"e16138","DOI":"10.1002\/ajb2.16138","article-title":"An in-depth investigation of cryptic taxonomic diversity in the rare endemic mustard Draba maguirei","volume":"110","author":"Windham","year":"2023","journal-title":"Am J Bot"}],"container-title":["Bioinformatics"],"original-title":[],"language":"en","link":[{"URL":"https:\/\/academic.oup.com\/bioinformatics\/advance-article-pdf\/doi\/10.1093\/bioinformatics\/btae152\/57021598\/btae152.pdf","content-type":"application\/pdf","content-version":"am","intended-application":"syndication"},{"URL":"https:\/\/academic.oup.com\/bioinformatics\/article-pdf\/40\/4\/btae152\/57141367\/btae152.pdf","content-type":"application\/pdf","content-version":"vor","intended-application":"syndication"},{"URL":"https:\/\/academic.oup.com\/bioinformatics\/article-pdf\/40\/4\/btae152\/57141367\/btae152.pdf","content-type":"unspecified","content-version":"vor","intended-application":"similarity-checking"}],"deposited":{"date-parts":[[2024,4,2]],"date-time":"2024-04-02T23:02:57Z","timestamp":1712098977000},"score":1,"resource":{"primary":{"URL":"https:\/\/academic.oup.com\/bioinformatics\/article\/doi\/10.1093\/bioinformatics\/btae152\/7632091"}},"subtitle":[],"editor":[{"given":"Jonathan","family":"Wren","sequence":"additional","affiliation":[]}],"short-title":[],"issued":{"date-parts":[[2024,3,19]]},"references-count":27,"journal-issue":{"issue":"4","published-print":{"date-parts":[[2024,3,29]]}},"URL":"https:\/\/doi.org\/10.1093\/bioinformatics\/btae152","relation":{},"ISSN":["1367-4811"],"issn-type":[{"type":"electronic","value":"1367-4811"}],"subject":[],"published-other":{"date-parts":[[2024,4,1]]},"published":{"date-parts":[[2024,3,19]]},"article-number":"btae152"}}