{"status":"ok","message-type":"work","message-version":"1.0.0","message":{"indexed":{"date-parts":[[2026,1,19]],"date-time":"2026-01-19T10:30:02Z","timestamp":1768818602584,"version":"3.49.0"},"reference-count":100,"publisher":"Springer Science and Business Media LLC","issue":"1","license":[{"start":{"date-parts":[[2024,9,3]],"date-time":"2024-09-03T00:00:00Z","timestamp":1725321600000},"content-version":"tdm","delay-in-days":0,"URL":"https:\/\/creativecommons.org\/licenses\/by-nc-nd\/4.0"},{"start":{"date-parts":[[2024,9,3]],"date-time":"2024-09-03T00:00:00Z","timestamp":1725321600000},"content-version":"vor","delay-in-days":0,"URL":"https:\/\/creativecommons.org\/licenses\/by-nc-nd\/4.0"}],"funder":[{"DOI":"10.13039\/mur","name":"Universit\u00e0 di Parma","doi-asserted-by":"publisher","id":[{"id":"10.13039\/mur","id-type":"DOI","asserted-by":"publisher"}]},{"name":"CINI","award":["InfoLife"],"award-info":[{"award-number":["InfoLife"]}]},{"name":"European Union \u2013 Next Generation EU programme","award":["Project Age-It (Ageing Well in an Ageing Society)"],"award-info":[{"award-number":["Project Age-It (Ageing Well in an Ageing Society)"]}]},{"name":"Ministero dell\u2019Universit\u00e0 e della Ricerca of Italy","award":["ReGAInS"],"award-info":[{"award-number":["ReGAInS"]}]}],"content-domain":{"domain":["link.springer.com"],"crossmark-restriction":false},"short-container-title":["BioData Mining"],"DOI":"10.1186\/s13040-024-00380-2","type":"journal-article","created":{"date-parts":[[2024,9,3]],"date-time":"2024-09-03T10:02:55Z","timestamp":1725357775000},"update-policy":"https:\/\/doi.org\/10.1007\/springer_crossmark_policy","source":"Crossref","is-referenced-by-count":5,"title":["Seven quick tips for gene-focused computational pangenomic analysis"],"prefix":"10.1186","volume":"17","author":[{"ORCID":"https:\/\/orcid.org\/0000-0002-1637-7545","authenticated-orcid":false,"given":"Vincenzo","family":"Bonnici","sequence":"first","affiliation":[]},{"ORCID":"https:\/\/orcid.org\/0000-0002-6279-6660","authenticated-orcid":false,"given":"Davide","family":"Chicco","sequence":"additional","affiliation":[]}],"member":"297","published-online":{"date-parts":[[2024,9,3]]},"reference":[{"key":"380_CR1","doi-asserted-by":"publisher","DOI":"10.1007\/978-3-030-38281-0","volume-title":"The pangenome: Diversity, dynamics and evolution of genomes","author":"H Tettelin","year":"2020","unstructured":"Tettelin H, Medini D. The pangenome: Diversity, dynamics and evolution of genomes. Berlin: Springer Nature; 2020."},{"issue":"39","key":"380_CR2","doi-asserted-by":"publisher","first-page":"13950","DOI":"10.1073\/pnas.0506758102","volume":"102","author":"H Tettelin","year":"2005","unstructured":"Tettelin H, Masignani V, Cieslewicz MJ, Donati C, Medini D, Ward NL, et al. Genome analysis of multiple pathogenic isolates of Streptococcus agalactiae: implications for the microbial \u201cpan-genome\u2019\u2019. Proc Natl Acad Sci. 2005;102(39):13950\u20135.","journal-title":"Proc Natl Acad Sci."},{"key":"380_CR3","volume-title":"Thompson & Thompson genetics in medicine","author":"RL Nussbaum","year":"2015","unstructured":"Nussbaum RL, McInnes RR, Willard HF. Thompson & Thompson genetics in medicine. Amsterdam: Elsevier Health Sciences; 2015."},{"key":"380_CR4","doi-asserted-by":"publisher","first-page":"309","DOI":"10.1146\/annurev.genet.39.073003.114725","volume":"39","author":"EV Koonin","year":"2005","unstructured":"Koonin EV. Orthologs, paralogs, and evolutionary genomics. Annu Rev Genet. 2005;39:309\u201338.","journal-title":"Annu Rev Genet."},{"issue":"8","key":"380_CR5","doi-asserted-by":"publisher","first-page":"472","DOI":"10.1038\/nrg3962","volume":"16","author":"SM Soucy","year":"2015","unstructured":"Soucy SM, Huang J, Gogarten JP. Horizontal gene transfer: building the web of life. Nat Rev Genet. 2015;16(8):472\u201382.","journal-title":"Nat Rev Genet."},{"key":"380_CR6","doi-asserted-by":"crossref","unstructured":"Hiller NL, Janto B, Hogg JS, Boissy R, Yu S, Powell E, et\u00a0al. Comparative genomic analyses of seventeen Streptococcus pneumoniae strains: insights into the pneumococcal supragenome. J Bacteriol. 2007;189(22).","DOI":"10.1128\/JB.00690-07"},{"issue":"10","key":"380_CR7","doi-asserted-by":"publisher","first-page":"1580","DOI":"10.1038\/s41564-022-01208-7","volume":"7","author":"F Rosconi","year":"2022","unstructured":"Rosconi F, Rudmann E, Li J, Surujon D, Anthony J, Frank M, et al. A bacterial pan-genome makes gene essentiality strain-dependent and evolvable. Nat Microbiol. 2022;7(10):1580\u201392.","journal-title":"Nat Microbiol."},{"key":"380_CR8","doi-asserted-by":"crossref","unstructured":"Bonizzoni P, De\u00a0Felice C, Pirola Y, Rizzi R, Zaccagnino R, Zizza R. Can formal languages help pangenomics to represent and analyze multiple genomes? In: Proceedings of DLT\u00a02022 \u2013 the 22nd International Conference on Developments in Language Theory. Berlin: Springer; 2022. pp. 3\u201312.","DOI":"10.1007\/978-3-031-05578-2_1"},{"issue":"1","key":"380_CR9","doi-asserted-by":"publisher","first-page":"81","DOI":"10.1007\/s11047-022-09882-6","volume":"21","author":"JA Baaijens","year":"2022","unstructured":"Baaijens JA, Bonizzoni P, Boucher C, Della Vedova G, Pirola Y, Rizzi R, et al. Computational graph pangenomics: a tutorial on data structures and their applications. Nat Comput. 2022;21(1):81\u2013108.","journal-title":"Nat Comput."},{"issue":"7960","key":"380_CR10","doi-asserted-by":"publisher","first-page":"312","DOI":"10.1038\/s41586-023-05896-x","volume":"617","author":"WW Liao","year":"2023","unstructured":"Liao WW, Asri M, Ebler J, Doerr D, Haukness M, Hickey G, et al. A draft human pangenome reference. Nature. 2023;617(7960):312\u201324.","journal-title":"Nature."},{"key":"380_CR11","doi-asserted-by":"crossref","unstructured":"Ceres KM, Stanhope MJ, Gr\u00f6hn YT. A critical evaluation of Mycobacterium bovis pangenomics, with reference to its utility in outbreak investigation. Microb Genomics. 2022;8(6):1\u20138.","DOI":"10.1099\/mgen.0.000839"},{"issue":"6","key":"380_CR12","doi-asserted-by":"publisher","first-page":"589","DOI":"10.1016\/j.gde.2005.09.006","volume":"15","author":"D Medini","year":"2005","unstructured":"Medini D, Donati C, Tettelin H, Masignani V, Rappuoli R. The microbial pan-genome. Curr Opin Genet Dev. 2005;15(6):589\u201394.","journal-title":"Curr Opin Genet Dev."},{"issue":"5","key":"380_CR13","doi-asserted-by":"publisher","first-page":"472","DOI":"10.1016\/j.mib.2008.09.006","volume":"11","author":"H Tettelin","year":"2008","unstructured":"Tettelin H, Riley D, Cattuto C, Medini D. Comparative genomics: the bacterial pan-genome. Curr Opin Microbiol. 2008;11(5):472\u20137.","journal-title":"Curr Opin Microbiol."},{"issue":"8","key":"380_CR14","doi-asserted-by":"publisher","first-page":"987","DOI":"10.1038\/ng.195","volume":"40","author":"KE Holt","year":"2008","unstructured":"Holt KE, Parkhill J, Mazzoni CJ, Roumagnac P, Weill FX, Goodhead I, et al. High-throughput sequencing provides insights into genome variation and evolution in Salmonella typhi. Nat Genet. 2008;40(8):987\u201393.","journal-title":"Nat Genet."},{"issue":"5","key":"380_CR15","doi-asserted-by":"publisher","first-page":"1","DOI":"10.1038\/nmicrobiol.2016.41","volume":"1","author":"SG Earle","year":"2016","unstructured":"Earle SG, Wu CH, Charlesworth J, Stoesser N, Gordon NC, Walker TM, et al. Identifying lineage effects when controlling for population structure improves power in bacterial association studies. Nat Microbiol. 2016;1(5):1\u20138.","journal-title":"Nat Microbiol."},{"issue":"25\u201326","key":"380_CR16","doi-asserted-by":"publisher","first-page":"3245","DOI":"10.1016\/j.vaccine.2009.01.072","volume":"27","author":"D Serruto","year":"2009","unstructured":"Serruto D, Serino L, Masignani V, Pizza M. Genome-based approaches to develop vaccines against bacterial pathogens. Vaccine. 2009;27(25\u201326):3245\u201350.","journal-title":"Vaccine."},{"issue":"11\u201312","key":"380_CR17","doi-asserted-by":"publisher","first-page":"429","DOI":"10.1016\/j.drudis.2007.04.008","volume":"12","author":"A Muzzi","year":"2007","unstructured":"Muzzi A, Masignani V, Rappuoli R. The pan-genome: towards a knowledge-based discovery of novel targets for vaccines and antibacterials. Drug Discov Today. 2007;12(11\u201312):429\u201339.","journal-title":"Drug Discov Today."},{"key":"380_CR18","doi-asserted-by":"publisher","first-page":"71536","DOI":"10.3389\/fmicb.2014.00110","volume":"5","author":"Y Zhang","year":"2014","unstructured":"Zhang Y, Sievert SM. Pan-genome analyses identify lineage-and niche-specific markers of evolution and adaptation in epsilonproteobacteria. Front Microbiol. 2014;5:71536.","journal-title":"Front Microbiol."},{"key":"380_CR19","doi-asserted-by":"crossref","first-page":"1","DOI":"10.1186\/1471-2164-11-1","volume":"11","author":"G D\u2019Auria","year":"2010","unstructured":"D\u2019Auria G, Jim\u00e9nez-Hern\u00e1ndez N, Peris-Bondia F, Moya A, Latorre A. Legionella pneumophila pangenome reveals strain-specific virulence factors. BMC Genomics. 2010;11:1\u201313.","journal-title":"BMC Genomics."},{"issue":"12","key":"380_CR20","doi-asserted-by":"publisher","first-page":"eadd8911","DOI":"10.1126\/sciadv.add8911","volume":"9","author":"A Rubio","year":"2023","unstructured":"Rubio A, Sprang M, Garz\u00f3n A, Moreno-Rodriguez A, Pach\u00f3n-Ib\u00e1\u00f1ez ME, Pach\u00f3n J, et al. Analysis of bacterial pangenomes reduces CRISPR dark matter and reveals strong association between membranome and CRISPR-Cas systems. Sci Adv. 2023;9(12):eadd8911.","journal-title":"Sci Adv."},{"issue":"1","key":"380_CR21","doi-asserted-by":"publisher","first-page":"24373","DOI":"10.1038\/srep24373","volume":"6","author":"NM Chaudhari","year":"2016","unstructured":"Chaudhari NM, Gupta VK, Dutta C. BPGA-an ultra-fast pan-genome analysis pipeline. Sci Rep. 2016;6(1):24373.","journal-title":"Sci Rep."},{"key":"380_CR22","doi-asserted-by":"publisher","first-page":"e1319","DOI":"10.7717\/peerj.1319","volume":"3","author":"AM Eren","year":"2015","unstructured":"Eren AM, Esen \u00d6C, Quince C, Vineis JH, Morrison HG, Sogin ML, et al. Anvi\u2019o: an advanced analysis and visualization platform for \u2018omics data. PeerJ. 2015;3:e1319.","journal-title":"PeerJ."},{"key":"380_CR23","doi-asserted-by":"publisher","first-page":"265","DOI":"10.12688\/f1000research.2-265.v1","volume":"2","author":"O Lukjancenko","year":"2013","unstructured":"Lukjancenko O, Thomsen MC, Voldby Larsen M, Ussery DW. PanFunPro: pan-genome analysis based on FUNctional PROfiles. F1000Research. 2013;2:265.","journal-title":"F1000Research."},{"issue":"1","key":"380_CR24","doi-asserted-by":"publisher","first-page":"135","DOI":"10.4056\/sigs.38923","volume":"2","author":"L Snipen","year":"2010","unstructured":"Snipen L, Ussery DW. Standard operating procedure for computing pangenome trees. Stand Genomic Sci. 2010;2(1):135\u201341.","journal-title":"Stand Genomic Sci."},{"key":"380_CR25","doi-asserted-by":"publisher","first-page":"1","DOI":"10.1186\/s12859-015-0517-0","volume":"16","author":"L Snipen","year":"2015","unstructured":"Snipen L, Liland KH. micropan: an R-package for microbial pan-genomics. BMC Bioinformatics. 2015;16:1\u20138.","journal-title":"BMC Bioinformatics."},{"issue":"1","key":"380_CR26","doi-asserted-by":"publisher","first-page":"e5","DOI":"10.1093\/nar\/gkx977","volume":"46","author":"W Ding","year":"2018","unstructured":"Ding W, Baumdicker F, Neher RA. panX: pan-genome analysis and exploration. Nucleic Acids Res. 2018;46(1):e5.","journal-title":"Nucleic Acids Res."},{"issue":"8","key":"380_CR27","doi-asserted-by":"publisher","first-page":"e1011319","DOI":"10.1371\/journal.pcbi.1011319","volume":"19","author":"T Lubiana","year":"2023","unstructured":"Lubiana T, Lopes R, Medeiros P, Silva JC, Goncalves ANA, Maracaja-Coutinho V, et al. Ten quick tips for harnessing the power of ChatGPT in computational biology. PLoS Comput Biol. 2023;19(8):e1011319.","journal-title":"PLoS Comput Biol."},{"issue":"12","key":"380_CR28","doi-asserted-by":"publisher","first-page":"e1010669","DOI":"10.1371\/journal.pcbi.1010669","volume":"18","author":"Q Hou","year":"2022","unstructured":"Hou Q, Waury K, Gogishvili D, Feenstra KA. Ten quick tips for sequence-based prediction of protein properties using machine learning. PLoS Comput Biol. 2022;18(12):e1010669.","journal-title":"PLoS Comput Biol."},{"issue":"3","key":"380_CR29","doi-asserted-by":"publisher","first-page":"e1009803","DOI":"10.1371\/journal.pcbi.1009803","volume":"18","author":"BD Lee","year":"2022","unstructured":"Lee BD, Gitter A, Greene CS, Raschka S, Maguire F, Titus AJ, et al. Ten quick tips for deep learning in biology. PLoS Comput Biol. 2022;18(3):e1009803.","journal-title":"PLoS Comput Biol."},{"issue":"5","key":"380_CR30","doi-asserted-by":"publisher","first-page":"e1006906","DOI":"10.1371\/journal.pcbi.1006906","volume":"15","author":"YA Tang","year":"2019","unstructured":"Tang YA, Pichler K, F\u00fcllgrabe A, Lomax J, Malone J, Munoz-Torres MC, et al. Ten quick tips for biocuration. PLoS Comput Biol. 2019;15(5):e1006906.","journal-title":"PLoS Comput Biol."},{"issue":"8","key":"380_CR31","doi-asserted-by":"publisher","first-page":"e1010357","DOI":"10.1371\/journal.pcbi.1010357","volume":"18","author":"R Diaz-Uriarte","year":"2022","unstructured":"Diaz-Uriarte R, G\u00f3mez\u00a0de\u00a0Lope E, Giugno R, Fr\u00f6hlich H, Nazarov PV. Nepomuceno-Chamorro IA, et\u00a0al. Ten quick tips for biomarker discovery and validation analyses using machine learning. PLoS Comput Biol. 2022;18(8):e1010357.","journal-title":"PLoS Comput Biol."},{"issue":"6","key":"380_CR32","doi-asserted-by":"publisher","first-page":"e1006907","DOI":"10.1371\/journal.pcbi.1006907","volume":"15","author":"LH Nguyen","year":"2019","unstructured":"Nguyen LH, Holmes S. Ten quick tips for effective dimensionality reduction. PLoS Comput Biol. 2019;15(6):e1006907.","journal-title":"PLoS Comput Biol."},{"issue":"8","key":"380_CR33","doi-asserted-by":"publisher","first-page":"e1010348","DOI":"10.1371\/journal.pcbi.1010348","volume":"18","author":"D Chicco","year":"2022","unstructured":"Chicco D, Agapito G. Nine quick tips for pathway enrichment analysis. PLoS Comput Biol. 2022;18(8):e1010348.","journal-title":"PLoS Comput Biol."},{"key":"380_CR34","doi-asserted-by":"crossref","unstructured":"Leimbach A, Hacker J, Dobrindt U. E. coli as an all-rounder: the thin line between commensalism and pathogenicity. Between Pathogenicity Commensalism. 2013;358:3\u201332.","DOI":"10.1007\/82_2012_303"},{"issue":"9","key":"380_CR35","doi-asserted-by":"publisher","first-page":"4000","DOI":"10.1111\/1462-2920.15186","volume":"22","author":"WA Overholt","year":"2020","unstructured":"Overholt WA, H\u00f6lzer M, Geesink P, Diezel C, Marz M, K\u00fcsel K. Inclusion of Oxford Nanopore long reads improves all microbial and viral metagenome-assembled genomes from a complex aquifer system. Environ Microbiol. 2020;22(9):4000\u201313.","journal-title":"Environ Microbiol."},{"key":"380_CR36","doi-asserted-by":"crossref","unstructured":"Wick RR, Judd LM, Gorrie CL, Holt KE. Completing bacterial genome assemblies with multiplex MinION sequencing. Microb Genomics. 2017;3(10)3\u201332.","DOI":"10.1099\/mgen.0.000132"},{"issue":"12","key":"380_CR37","doi-asserted-by":"publisher","first-page":"2857","DOI":"10.1128\/JCM.00949-16","volume":"54","author":"AS Gargis","year":"2016","unstructured":"Gargis AS, Kalman L, Lubin IM. Assuring the quality of next-generation sequencing in clinical microbiology and public health laboratories. J Clin Microbiol. 2016;54(12):2857\u201365.","journal-title":"J Clin Microbiol."},{"issue":"1","key":"380_CR38","doi-asserted-by":"publisher","first-page":"662","DOI":"10.1186\/s12864-019-6014-5","volume":"20","author":"TH Smits","year":"2019","unstructured":"Smits TH. The importance of genome sequence quality to microbial comparative genomics. BMC Genomics. 2019;20(1):662.","journal-title":"BMC Genomics."},{"issue":"5626","key":"380_CR39","doi-asserted-by":"publisher","first-page":"1706","DOI":"10.1126\/science.1086292","volume":"300","author":"JA Eisen","year":"2003","unstructured":"Eisen JA, Fraser CM. Phylogenomics: intersection of evolution and genomics. Science. 2003;300(5626):1706\u20137.","journal-title":"Science."},{"issue":"1","key":"380_CR40","doi-asserted-by":"publisher","first-page":"1","DOI":"10.1186\/s12859-020-03657-5","volume":"21","author":"M Gabrielaite","year":"2020","unstructured":"Gabrielaite M, Marvig RL. GenAPI: a tool for gene absence-presence identification in fragmented bacterial genome sequences. BMC Bioinformatics. 2020;21(1):1\u20138.","journal-title":"BMC Bioinformatics."},{"issue":"6","key":"380_CR41","doi-asserted-by":"publisher","first-page":"bbac413","DOI":"10.1093\/bib\/bbac413","volume":"23","author":"T Li","year":"2022","unstructured":"Li T, Yin Y. Critical assessment of pan-genomic analysis of metagenome-assembled genomes. Brief Bioinforma. 2022;23(6):bbac413.","journal-title":"Brief Bioinforma."},{"issue":"6","key":"380_CR42","doi-asserted-by":"publisher","first-page":"905","DOI":"10.1007\/s12551-021-00865-y","volume":"13","author":"JC Setubal","year":"2021","unstructured":"Setubal JC. Metagenome-assembled genomes: concepts, analogies, and challenges. Biophys Rev. 2021;13(6):905\u20139.","journal-title":"Biophys Rev."},{"issue":"8","key":"380_CR43","doi-asserted-by":"publisher","first-page":"725","DOI":"10.1038\/nbt.3893","volume":"35","author":"RM Bowers","year":"2017","unstructured":"Bowers RM, Kyrpides NC, Stepanauskas R, Harmon-Smith M, Doud D, Reddy TBK, et al. Minimum information about a single amplified genome (MISAG) and a metagenome-assembled genome (MIMAG) of bacteria and archaea. Nat Biotechnol. 2017;35(8):725\u201331.","journal-title":"Nat Biotechnol."},{"key":"380_CR44","doi-asserted-by":"publisher","first-page":"104552","DOI":"10.1016\/j.jbi.2023.104552","volume":"148","author":"V Bonnici","year":"2023","unstructured":"Bonnici V, Mengoni C, Mangoni M, Franco G, Giugno R. PanDelos-frags: A methodology for discovering pangenomic content of incomplete microbial assemblies. J Biomed Inform. 2023;148:104552.","journal-title":"J Biomed Inform."},{"issue":"1","key":"380_CR45","doi-asserted-by":"publisher","first-page":"9670","DOI":"10.1038\/s41598-018-27800-8","volume":"8","author":"A Veras","year":"2018","unstructured":"Veras A, Araujo F, Pinheiro K, Guimar\u00e3es L, Azevedo V, Soares S, et al. Pan4Draft: a computational tool to improve the accuracy of pan-genomic analysis using draft genomes. Sci Rep. 2018;8(1):9670.","journal-title":"Sci Rep."},{"key":"380_CR46","doi-asserted-by":"publisher","first-page":"1","DOI":"10.1186\/s13059-020-02090-4","volume":"21","author":"G Tonkin-Hill","year":"2020","unstructured":"Tonkin-Hill G, MacAlasdair N, Ruis C, Weimann A, Horesh G, Lees JA, et al. Producing polished prokaryotic pangenomes with the Panaroo pipeline. Genome Biol. 2020;21:1\u201321.","journal-title":"Genome Biol."},{"issue":"11","key":"380_CR47","doi-asserted-by":"publisher","first-page":"1071","DOI":"10.1089\/cmb.2017.0013","volume":"24","author":"CJ Castro","year":"2017","unstructured":"Castro CJ, Ng TFF. U50: a new metric for measuring assembly output based on non-overlapping, target-specific contigs. J Comput Biol. 2017;24(11):1071\u201380.","journal-title":"J Comput Biol."},{"issue":"8","key":"380_CR48","doi-asserted-by":"publisher","first-page":"2444","DOI":"10.1073\/pnas.85.8.2444","volume":"85","author":"WR Pearson","year":"1988","unstructured":"Pearson WR, Lipman DJ. Improved tools for biological sequence comparison. Proc Natl Acad Sci. 1988;85(8):2444\u20138.","journal-title":"Proc Natl Acad Sci."},{"key":"380_CR49","unstructured":"National Library of Medicine. GenBank Overview. 2023. https:\/\/www.ncbi.nlm.nih.gov\/genbank\/. Accessed 4 Nov 2023."},{"key":"380_CR50","unstructured":"Ensembl. GFF\/GTF File Format - Definition and supported options. 2023. https:\/\/www.ensembl.org\/info\/website\/upload\/gff.html. Accessed 4 Nov 2023."},{"key":"380_CR51","doi-asserted-by":"publisher","first-page":"1","DOI":"10.1186\/1471-2105-11-119","volume":"11","author":"D Hyatt","year":"2010","unstructured":"Hyatt D, Chen GL, LoCascio PF, Land ML, Larimer FW, Hauser LJ. Prodigal: prokaryotic gene recognition and translation initiation site identification. BMC Bioinformatics. 2010;11:1\u201311.","journal-title":"BMC Bioinformatics."},{"issue":"14","key":"380_CR52","doi-asserted-by":"publisher","first-page":"2068","DOI":"10.1093\/bioinformatics\/btu153","volume":"30","author":"T Seemann","year":"2014","unstructured":"Seemann T. Prokka: rapid prokaryotic genome annotation. Bioinformatics. 2014;30(14):2068\u20139.","journal-title":"Bioinformatics."},{"key":"380_CR53","doi-asserted-by":"crossref","unstructured":"Vernikos G. A review of pangenome tools and recent studies. In: The Pangenome: Diversity, Dynamics and Evolution of Genomes, chap 4. Berlin: Springer International Publishing; 2020. pp. 89\u2013112.","DOI":"10.1007\/978-3-030-38281-0_4"},{"key":"380_CR54","doi-asserted-by":"publisher","first-page":"1","DOI":"10.1186\/1471-2105-10-421","volume":"10","author":"C Camacho","year":"2009","unstructured":"Camacho C, Coulouris G, Avagyan V, Ma N, Papadopoulos J, Bealer K, et al. BLAST+: architecture and applications. BMC Bioinformatics. 2009;10:1\u20139.","journal-title":"BMC Bioinformatics."},{"issue":"1","key":"380_CR55","doi-asserted-by":"publisher","first-page":"6","DOI":"10.1038\/s41562-017-0189-z","volume":"2","author":"DJ Benjamin","year":"2018","unstructured":"Benjamin DJ, Berger JO, Johannesson M, Nosek BA, Wagenmakers EJ, Berk R, et al. Redefine statistical significance. Nat Hum Behav. 2018;2(1):6\u201310.","journal-title":"Nat Hum Behav."},{"key":"380_CR56","doi-asserted-by":"publisher","first-page":"1","DOI":"10.1186\/1471-2105-10-154","volume":"10","author":"J Blom","year":"2009","unstructured":"Blom J, Albaum SP, Doppmeier D, P\u00fchler A, Vorh\u00f6lter FJ, Zakrzewski M, et al. EDGAR: a software framework for the comparative analysis of prokaryotic genomes. BMC Bioinformatics. 2009;10:1\u201314.","journal-title":"BMC Bioinformatics."},{"issue":"15","key":"380_CR57","first-page":"47","volume":"19","author":"V Bonnici","year":"2018","unstructured":"Bonnici V, Giugno R, Manca V. PanDelos: a dictionary-based method for pan-genome content discovery. BMC Bioinformatics. 2018;19(15):47\u201359.","journal-title":"BMC Bioinformatics."},{"key":"380_CR58","doi-asserted-by":"publisher","first-page":"117793222093806","DOI":"10.1177\/1177932220938064","volume":"14","author":"SS Costa","year":"2020","unstructured":"Costa SS, Guimar\u00e3es LC, Silva A, Soares SC, Bara\u00fana RA. First steps in the analysis of prokaryotic pan-genomes. Bioinforma Biol Insights. 2020;14:1177932220938064.","journal-title":"Bioinforma Biol Insights."},{"key":"380_CR59","doi-asserted-by":"crossref","unstructured":"Kim M, Oh HS, Park SC, Chun J. Towards a taxonomic coherence between average nucleotide identity and 16S rRNA gene sequence similarity for species demarcation of prokaryotes. Int J Syst Evol Microbiol. 2014;64(Pt_2):346\u2013351.","DOI":"10.1099\/ijs.0.059774-0"},{"issue":"22","key":"380_CR60","doi-asserted-by":"publisher","first-page":"3691","DOI":"10.1093\/bioinformatics\/btv421","volume":"31","author":"AJ Page","year":"2015","unstructured":"Page AJ, Cummins CA, Hunt M, Wong VK, Reuter S, Holden MT, et al. Roary: rapid large-scale prokaryote pan genome analysis. Bioinformatics. 2015;31(22):3691\u20133.","journal-title":"Bioinformatics."},{"issue":"3","key":"380_CR61","doi-asserted-by":"publisher","first-page":"bbaa198","DOI":"10.1093\/bib\/bbaa198","volume":"22","author":"V Bonnici","year":"2021","unstructured":"Bonnici V, Maresi E, Giugno R. Challenges in gene-oriented approaches for pangenome content discovery. Brief Bioinforma. 2021;22(3):bbaa198.","journal-title":"Brief Bioinforma."},{"issue":"4","key":"380_CR62","doi-asserted-by":"publisher","first-page":"1115","DOI":"10.1093\/molbev\/msr268","volume":"29","author":"DA Dalquen","year":"2012","unstructured":"Dalquen DA, Anisimova M, Gonnet GH, Dessimoz C. ALF-a simulation framework for genome evolution. Mol Biol Evol. 2012;29(4):1115\u201323.","journal-title":"Mol Biol Evol."},{"issue":"4","key":"380_CR63","doi-asserted-by":"publisher","first-page":"1785","DOI":"10.1038\/s41596-020-00480-3","volume":"16","author":"F Meyer","year":"2021","unstructured":"Meyer F, Lesker TR, Koslicki D, Fritz A, Gurevich A, Darling AE, et al. Tutorial: assessing metagenomics software with the CAMI benchmarking toolkit. Nat Protoc. 2021;16(4):1785\u2013801.","journal-title":"Nat Protoc."},{"issue":"9","key":"380_CR64","doi-asserted-by":"publisher","first-page":"2631","DOI":"10.1093\/bioinformatics\/btac158","volume":"38","author":"V Bonnici","year":"2022","unstructured":"Bonnici V, Giugno R. PANPROVA: pangenomic prokaryotic evolution of full assemblies. Bioinformatics. 2022;38(9):2631\u20132.","journal-title":"Bioinformatics."},{"key":"380_CR65","doi-asserted-by":"publisher","first-page":"664","DOI":"10.1016\/j.neucom.2017.06.053","volume":"267","author":"A Saxena","year":"2017","unstructured":"Saxena A, Prasad M, Gupta A, Bharill N, Patel OP, Tiwari A, et al. A review of clustering techniques and developments. Neurocomputing. 2017;267:664\u201381.","journal-title":"Neurocomputing."},{"issue":"7","key":"380_CR66","doi-asserted-by":"publisher","first-page":"1081","DOI":"10.1093\/bioinformatics\/btw761","volume":"33","author":"TL Pedersen","year":"2017","unstructured":"Pedersen TL, Nookaew I, Wayne Ussery D, M\u00e5nsson M. PanViz: interactive visualization of the structure of functionally annotated pangenomes. Bioinformatics. 2017;33(7):1081\u20132.","journal-title":"Bioinformatics."},{"issue":"10","key":"380_CR67","doi-asserted-by":"publisher","first-page":"3248","DOI":"10.1093\/bioinformatics\/btaa069","volume":"36","author":"M Lovino","year":"2020","unstructured":"Lovino M, Ciaburri MS, Urgese G, Di Cataldo S, Ficarra E. DEEPrior: a deep learning tool for the prioritization of gene fusions. Bioinformatics. 2020;36(10):3248\u201350.","journal-title":"Bioinformatics."},{"key":"380_CR68","doi-asserted-by":"publisher","first-page":"104057","DOI":"10.1016\/j.jbi.2022.104057","volume":"129","author":"M Lovino","year":"2022","unstructured":"Lovino M, Montemurro M, Barrese VS, Ficarra E. Identifying the oncogenic potential of gene fusions exploiting miRNAs. J Biomed Inform. 2022;129:104057.","journal-title":"J Biomed Inform."},{"key":"380_CR69","doi-asserted-by":"crossref","unstructured":"Lovino M, Urgese G, Macii E, Di\u00a0Cataldo S, Ficarra E. Predicting the oncogenic potential of gene fusions using convolutional neural networks. In: Proceedings of CIBB 2018 \u2014 the 15th International Meeting on Computational Intelligence Methods for Bioinformatics and Biostatistics.\u00a0Berlin: Springer; 2018. pp. 277\u201384.","DOI":"10.1007\/978-3-030-34585-3_24"},{"key":"380_CR70","doi-asserted-by":"crossref","unstructured":"Citarrella F, Bontempo G, Lovino M, Ficarra E. FusionFlow: an integrated system workflow for gene fusion detection in genomic samples. In: Proceedings of ADBIS 2022 \u2013 the 26th European Conference on Advances in Databases and Information Systems.\u00a0Berlin: Springer; 2022. pp. 79\u201388.","DOI":"10.1007\/978-3-031-15743-1_8"},{"issue":"6","key":"380_CR71","doi-asserted-by":"publisher","first-page":"425","DOI":"10.1002\/yea.3303","volume":"35","author":"AA Stavrou","year":"2018","unstructured":"Stavrou AA, Mix\u00e3o V, Boekhout T, Gabald\u00f3n T. Misidentification of genome assemblies in public databases: the case of Naumovozyma dairenensis and proposal of a protocol to correct misidentifications. Yeast. 2018;35(6):425\u20139.","journal-title":"Yeast."},{"issue":"1","key":"380_CR72","doi-asserted-by":"publisher","first-page":"4","DOI":"10.1046\/j.1469-8137.2003.00894.x","volume":"160","author":"R Vilgalys","year":"2003","unstructured":"Vilgalys R. Taxonomic misidentification in public DNA databases. New Phytol. 2003;160(1):4\u20135.","journal-title":"New Phytol."},{"key":"380_CR73","doi-asserted-by":"crossref","unstructured":"Lobb B, Tremblay BJM, Moreno-Hagelsieb G, Doxey AC. An assessment of genome annotation coverage across the bacterial tree of life. Microb Genomics. 2020;6(3)1\u201311.","DOI":"10.1099\/mgen.0.000341"},{"key":"380_CR74","doi-asserted-by":"crossref","unstructured":"Qi J, Luo H, Hao B. CVTree: a phylogenetic tree reconstruction tool based on whole genomes. Nucleic Acids Res. 2004;32(suppl_2):W45\u2013W47.","DOI":"10.1093\/nar\/gkh362"},{"issue":"9","key":"380_CR75","doi-asserted-by":"publisher","first-page":"1774","DOI":"10.1111\/1751-7915.14305","volume":"16","author":"C Tarracchini","year":"2023","unstructured":"Tarracchini C, Argentini C, Alessandri G, Lugli GA, Mancabelli L, Fontana F, et al. The core genome evolution of Lactobacillus crispatus as a driving force for niche competition in the human vaginal tract. Microb Biotechnol. 2023;16(9):1774\u201389.","journal-title":"Microb Biotechnol."},{"issue":"10","key":"380_CR76","doi-asserted-by":"publisher","first-page":"1161","DOI":"10.1038\/s41592-021-01254-9","volume":"18","author":"L Wratten","year":"2021","unstructured":"Wratten L, Wilm A, G\u00f6ke J. Reproducible, scalable, and shareable analysis pipelines with bioinformatics workflow managers. Nat Methods. 2021;18(10):1161\u20138.","journal-title":"Nat Methods."},{"issue":"1","key":"380_CR77","doi-asserted-by":"publisher","first-page":"1","DOI":"10.1186\/s13059-015-0850-7","volume":"16","author":"F Markowetz","year":"2015","unstructured":"Markowetz F. Five selfish reasons to work reproducibly. Genome Biol. 2015;16(1):1\u20134.","journal-title":"Genome Biol."},{"issue":"2","key":"380_CR78","doi-asserted-by":"publisher","first-page":"115","DOI":"10.1038\/nmeth.3252","volume":"12","author":"W Huber","year":"2015","unstructured":"Huber W, Carey VJ, Gentleman R, Anders S, Carlson M, Carvalho BS, et al. Orchestrating high-throughput genomic analysis with Bioconductor. Nat Methods. 2015;12(2):115\u201321.","journal-title":"Nat Methods."},{"issue":"7","key":"380_CR79","doi-asserted-by":"publisher","first-page":"475","DOI":"10.1038\/s41592-018-0046-7","volume":"15","author":"B Gr\u00fcning","year":"2018","unstructured":"Gr\u00fcning B, Dale R, Sj\u00f6din A, Chapman BA, Rowe J, Tomkins-Tinch CH, et al. Bioconda: sustainable and comprehensive software distribution for the life sciences. Nat Methods. 2018;15(7):475\u20136.","journal-title":"Nat Methods."},{"issue":"3","key":"380_CR80","doi-asserted-by":"publisher","first-page":"e1007732","DOI":"10.1371\/journal.pcbi.1007732","volume":"16","author":"G Gautreau","year":"2020","unstructured":"Gautreau G, Bazin A, Gachet M, Planel R, Burlot L, Dubois M, et al. PPanGGOLiN: depicting microbial diversity via a partitioned pangenome graph. PLoS Comput Biol. 2020;16(3):e1007732.","journal-title":"PLoS Comput Biol."},{"key":"380_CR81","doi-asserted-by":"crossref","unstructured":"Bazin A, Gautreau G, M\u00e9digue C, Vallenet D, Calteau A. panRGP: a pangenome-based method to predict genomic islands and explore their diversity. Bioinformatics. 2020;36(Supplement_2):i651\u2013i658.","DOI":"10.1093\/bioinformatics\/btaa792"},{"issue":"18","key":"380_CR82","doi-asserted-by":"publisher","first-page":"4403","DOI":"10.1093\/bioinformatics\/btac506","volume":"38","author":"EM Jonkheer","year":"2022","unstructured":"Jonkheer EM, van Workum DJM, Sheikhizadeh Anari S, Brankovics B, de Haan JR, Berke L, et al. PanTools v3: functional annotation, classification and phylogenomics. Bioinformatics. 2022;38(18):4403\u20135.","journal-title":"Bioinformatics."},{"key":"380_CR83","doi-asserted-by":"crossref","unstructured":"Garrison E, Guarracino A, Heumos S, Villani F, Bao Z, Tattini L, et\u00a0al. Building pangenome graphs. bioRxiv. 2023;05.535718:1\u201314.","DOI":"10.1101\/2023.04.05.535718"},{"issue":"5","key":"380_CR84","doi-asserted-by":"publisher","first-page":"100085","DOI":"10.1016\/j.crmeth.2021.100085","volume":"1","author":"I Ferr\u00e9s","year":"2021","unstructured":"Ferr\u00e9s I, Iraola G. An object-oriented framework for evolutionary pangenome analysis. Cell Rep Methods. 2021;1(5):100085.","journal-title":"Cell Rep Methods."},{"key":"380_CR85","doi-asserted-by":"publisher","unstructured":"Jayanti R, Kim A, Pham S, Raghavan A, Sharma A, Samanta MP. Comparative Analysis of Plastid Genomes Using Pangenome Research ToolKit (PGR-TK). 2023. https:\/\/doi.org\/10.48550\/arXiv.2310.19110.","DOI":"10.48550\/arXiv.2310.19110"},{"key":"380_CR86","unstructured":"GitHub. Pangenome Python repositories. 2024. https:\/\/github.com\/topics\/pangenome?l=python. Accessed 24 Jun."},{"key":"380_CR87","unstructured":"PanGraph jl. A fast, self-contained Julia library and command line tool suite to align multiple genomes into a pangenome graph. 2023. https:\/\/neherlab.github.io\/pangraph\/. Accessed 13 Nov 2023."},{"issue":"13","key":"380_CR88","doi-asserted-by":"publisher","first-page":"3319","DOI":"10.1093\/bioinformatics\/btac308","volume":"38","author":"A Guarracino","year":"2022","unstructured":"Guarracino A, Heumos S, Nahnsen S, Prins P, Garrison E. ODGI: understanding pangenome graphs. Bioinformatics. 2022;38(13):3319\u201326.","journal-title":"Bioinformatics."},{"key":"380_CR89","unstructured":"GitHub. Let\u2019s build from here. 2023. https:\/\/www.github.com. Accessed 4 Nov 2023."},{"key":"380_CR90","unstructured":"GitLab. Software. Faster. 2023. https:\/\/www.gitlab.com. Accessed 4 Nov 2023."},{"issue":"7317","key":"380_CR91","doi-asserted-by":"publisher","first-page":"753","DOI":"10.1038\/467753a","volume":"467","author":"N Barnes","year":"2010","unstructured":"Barnes N. Publish your computer code: it is good enough. Nature. 2010;467(7317):753.","journal-title":"Nature."},{"issue":"1","key":"380_CR92","doi-asserted-by":"publisher","first-page":"207","DOI":"10.1093\/nar\/30.1.207","volume":"30","author":"R Edgar","year":"2002","unstructured":"Edgar R, Domrachev M, Lash AE. Gene Expression Omnibus: NCBI gene expression and hybridization array data repository. Nucleic Acids Res. 2002;30(1):207\u201310.","journal-title":"Nucleic Acids Res."},{"issue":"1","key":"380_CR93","doi-asserted-by":"publisher","first-page":"68","DOI":"10.1093\/nar\/gkg091","volume":"31","author":"A Brazma","year":"2003","unstructured":"Brazma A, Parkinson H, Sarkans U, Shojatalab M, Vilo J, Abeygunawardena N, et al. ArrayExpress-a public repository for microarray gene expression data at the EBI. Nucleic Acids Res. 2003;31(1):68\u201371.","journal-title":"Nucleic Acids Res."},{"issue":"D1","key":"380_CR94","doi-asserted-by":"publisher","first-page":"D54","DOI":"10.1093\/nar\/gkr854","volume":"40","author":"Y Kodama","year":"2012","unstructured":"Kodama Y, Shumway M, Leinonen R. The Sequence Read Archive: explosive growth of sequencing data. Nucleic Acids Res. 2012;40(D1):D54\u20136.","journal-title":"Nucleic Acids Res."},{"key":"380_CR95","unstructured":"Kaggle. Kaggle datasets \u2013 Explore, analyze, and share quality data. 2022. https:\/\/www.kaggle.com\/datasets. Accessed 13 Jul 2023."},{"key":"380_CR96","unstructured":"Figshare. Store, share, discover research. 2011. https:\/\/www.figshare.com. Accessed 13 Jul 2023."},{"key":"380_CR97","unstructured":"Zenodo. Research, shared. 2013. https:\/\/www.zenodo.org. Accessed 13 Jul 2023."},{"key":"380_CR98","unstructured":"University of California Irvine. Machine Learning Repository. 1987. https:\/\/archive.ics.uci.edu\/. Accessed 13 Jul 2023."},{"issue":"1","key":"380_CR99","doi-asserted-by":"publisher","first-page":"1","DOI":"10.1038\/sdata.2016.18","volume":"3","author":"MD Wilkinson","year":"2016","unstructured":"Wilkinson MD, Dumontier M, Aalbersberg IJ, Appleton G, Axton M, Baak A, et al. The FAIR Guiding Principles for scientific data management and stewardship. Sci Data. 2016;3(1):1\u20139.","journal-title":"Sci Data."},{"key":"380_CR100","unstructured":"Scimago. Journal Rank - Biochemistry, genetics, and molecular biology. 2023. https:\/\/scimagojr.com\/journalrank.php?openaccess=true&area=1300. Accessed 13 Nov 2023."}],"container-title":["BioData Mining"],"original-title":[],"language":"en","link":[{"URL":"https:\/\/link.springer.com\/content\/pdf\/10.1186\/s13040-024-00380-2.pdf","content-type":"application\/pdf","content-version":"vor","intended-application":"text-mining"},{"URL":"https:\/\/link.springer.com\/article\/10.1186\/s13040-024-00380-2\/fulltext.html","content-type":"text\/html","content-version":"vor","intended-application":"text-mining"},{"URL":"https:\/\/link.springer.com\/content\/pdf\/10.1186\/s13040-024-00380-2.pdf","content-type":"application\/pdf","content-version":"vor","intended-application":"similarity-checking"}],"deposited":{"date-parts":[[2024,9,3]],"date-time":"2024-09-03T22:02:29Z","timestamp":1725400949000},"score":1,"resource":{"primary":{"URL":"https:\/\/biodatamining.biomedcentral.com\/articles\/10.1186\/s13040-024-00380-2"}},"subtitle":[],"short-title":[],"issued":{"date-parts":[[2024,9,3]]},"references-count":100,"journal-issue":{"issue":"1","published-online":{"date-parts":[[2024,12]]}},"alternative-id":["380"],"URL":"https:\/\/doi.org\/10.1186\/s13040-024-00380-2","relation":{},"ISSN":["1756-0381"],"issn-type":[{"value":"1756-0381","type":"electronic"}],"subject":[],"published":{"date-parts":[[2024,9,3]]},"assertion":[{"value":"27 March 2024","order":1,"name":"received","label":"Received","group":{"name":"ArticleHistory","label":"Article History"}},{"value":"12 August 2024","order":2,"name":"accepted","label":"Accepted","group":{"name":"ArticleHistory","label":"Article History"}},{"value":"3 September 2024","order":3,"name":"first_online","label":"First Online","group":{"name":"ArticleHistory","label":"Article History"}},{"order":1,"name":"Ethics","group":{"name":"EthicsHeading","label":"Declarations"}},{"value":"Not applicable.","order":2,"name":"Ethics","group":{"name":"EthicsHeading","label":"Ethics approval and consent to participate"}},{"value":"The authors declare no competing interests.","order":3,"name":"Ethics","group":{"name":"EthicsHeading","label":"Competing interests"}}],"article-number":"28"}}