{"status":"ok","message-type":"work","message-version":"1.0.0","message":{"indexed":{"date-parts":[[2026,5,7]],"date-time":"2026-05-07T05:51:14Z","timestamp":1778133074686,"version":"3.51.4"},"reference-count":80,"publisher":"Springer Science and Business Media LLC","issue":"2","license":[{"start":{"date-parts":[[2024,12,5]],"date-time":"2024-12-05T00:00:00Z","timestamp":1733356800000},"content-version":"tdm","delay-in-days":0,"URL":"https:\/\/www.springernature.com\/gp\/researchers\/text-and-data-mining"},{"start":{"date-parts":[[2024,12,5]],"date-time":"2024-12-05T00:00:00Z","timestamp":1733356800000},"content-version":"vor","delay-in-days":0,"URL":"https:\/\/www.springernature.com\/gp\/researchers\/text-and-data-mining"}],"funder":[{"DOI":"10.13039\/100000057","name":"U.S. Department of Health & Human Services | NIH | National Institute of General Medical Sciences","doi-asserted-by":"publisher","award":["R35-GM150579"],"award-info":[{"award-number":["R35-GM150579"]}],"id":[{"id":"10.13039\/100000057","id-type":"DOI","asserted-by":"publisher"}]}],"content-domain":{"domain":["link.springer.com"],"crossmark-restriction":false},"short-container-title":["Nat Comput Sci"],"DOI":"10.1038\/s43588-024-00739-9","type":"journal-article","created":{"date-parts":[[2024,12,5]],"date-time":"2024-12-05T05:02:20Z","timestamp":1733374940000},"page":"112-124","update-policy":"https:\/\/doi.org\/10.1007\/springer_crossmark_policy","source":"Crossref","is-referenced-by-count":14,"title":["Enabling efficient analysis of biobank-scale data with genotype representation graphs"],"prefix":"10.1038","volume":"5","author":[{"ORCID":"https:\/\/orcid.org\/0009-0005-9087-1831","authenticated-orcid":false,"given":"Drew","family":"DeHaas","sequence":"first","affiliation":[]},{"ORCID":"https:\/\/orcid.org\/0000-0002-9327-1912","authenticated-orcid":false,"given":"Ziqing","family":"Pan","sequence":"additional","affiliation":[]},{"ORCID":"https:\/\/orcid.org\/0000-0001-8184-7016","authenticated-orcid":false,"given":"Xinzhu","family":"Wei","sequence":"additional","affiliation":[]}],"member":"297","published-online":{"date-parts":[[2024,12,5]]},"reference":[{"key":"739_CR1","doi-asserted-by":"publisher","unstructured":"Kaiser, J. 200,000 whole genomes made available for biomedical studies by U.K. effort. ScienceInsider https:\/\/doi.org\/10.1126\/science.acx9678 (2021).","DOI":"10.1126\/science.acx9678"},{"key":"739_CR2","doi-asserted-by":"publisher","first-page":"161","DOI":"10.1016\/j.ajhg.2022.11.008","volume":"110","author":"BL Browning","year":"2023","unstructured":"Browning, B. L. & Browning, S. R. Statistical phasing of 150,119 sequenced genomes in the UK Biobank. Am. J. Hum. Genet. 110, 161\u2013165 (2023).","journal-title":"Am. J. Hum. Genet."},{"key":"739_CR3","doi-asserted-by":"publisher","first-page":"1243","DOI":"10.1038\/s41588-023-01415-w","volume":"55","author":"RJ Hofmeister","year":"2023","unstructured":"Hofmeister, R. J., Ribeiro, D. M., Rubinacci, S. & Delaneau, O. Accurate rare variant phasing of whole-genome and whole-exome sequencing data in the UK Biobank. Nat. Genet. 55, 1243\u20131249 (2023).","journal-title":"Nat. Genet."},{"key":"739_CR4","doi-asserted-by":"publisher","first-page":"2156","DOI":"10.1093\/bioinformatics\/btr330","volume":"27","author":"P Danecek","year":"2011","unstructured":"Danecek, P. et al. The variant call format and VCFtools. Bioinformatics 27, 2156\u20132158 (2011).","journal-title":"Bioinformatics"},{"key":"739_CR5","doi-asserted-by":"publisher","unstructured":"Band, G. & Marchini, J. BGEN: a binary file format for imputed genotype and haplotype data. Preprint at bioRxiv https:\/\/doi.org\/10.1101\/308296 (2018).","DOI":"10.1101\/308296"},{"key":"739_CR6","doi-asserted-by":"publisher","first-page":"2987","DOI":"10.1093\/bioinformatics\/btr509","volume":"27","author":"H Li","year":"2011","unstructured":"Li, H. A statistical framework for SNP calling, mutation discovery, association mapping and population genetical parameter estimation from sequencing data. Bioinformatics 27, 2987\u20132993 (2011).","journal-title":"Bioinformatics"},{"key":"739_CR7","doi-asserted-by":"publisher","first-page":"559","DOI":"10.1086\/519795","volume":"81","author":"S Purcell","year":"2007","unstructured":"Purcell, S. et al. PLINK: a tool set for whole-genome association and population-based linkage analyses. Am. J. Hum. Genet. 81, 559\u2013575 (2007).","journal-title":"Am. J. Hum. Genet."},{"key":"739_CR8","doi-asserted-by":"publisher","first-page":"63","DOI":"10.1038\/nmeth.3654","volume":"13","author":"RM Layer","year":"2016","unstructured":"Layer, R. M., Kindlon, N., Karczewski, K. J., Consortium, E. A. & Quinlan, A. R. Efficient genotype compression and analysis of large genetic-variation data sets. Nat. Methods 13, 63\u201365 (2016).","journal-title":"Nat. Methods"},{"key":"739_CR9","doi-asserted-by":"publisher","first-page":"1834","DOI":"10.1093\/bioinformatics\/bty023","volume":"34","author":"A Danek","year":"2018","unstructured":"Danek, A. & Deorowicz, S. GTC: how to maintain huge genotype collections in a compressed form. Bioinformatics 34, 1834\u20131840 (2018).","journal-title":"Bioinformatics"},{"key":"739_CR10","doi-asserted-by":"publisher","first-page":"338","DOI":"10.1016\/j.ajhg.2018.07.015","volume":"103","author":"BL Browning","year":"2018","unstructured":"Browning, B. L., Zhou, Y. & Browning, S. R. A one-penny imputed genome from next-generation reference panels. Am. J. Hum. Genet. 103, 338\u2013348 (2018).","journal-title":"Am. J. Hum. Genet."},{"key":"739_CR11","doi-asserted-by":"publisher","first-page":"4791","DOI":"10.1093\/bioinformatics\/btz508","volume":"35","author":"S Deorowicz","year":"2019","unstructured":"Deorowicz, S. & Danek, A. GTShark: genotype compression in large projects. Bioinformatics 35, 4791\u20134793 (2019).","journal-title":"Bioinformatics"},{"key":"739_CR12","doi-asserted-by":"publisher","first-page":"2225","DOI":"10.1093\/bioinformatics\/btab102","volume":"37","author":"D Lan","year":"2021","unstructured":"Lan, D., Tobler, R., Souilmi, Y. & Llamas, B. Genozip: a universal extensible genomic data compressor. Bioinformatics 37, 2225\u20132230 (2021).","journal-title":"Bioinformatics"},{"key":"739_CR13","doi-asserted-by":"publisher","first-page":"4248","DOI":"10.1093\/bioinformatics\/btab378","volume":"37","author":"J LeFaive","year":"2021","unstructured":"LeFaive, J., Smith, A. V., Kang, H. M. & Abecasis, G. Sparse allele vectors and the savvy software suite. Bioinformatics 37, 4248\u20134250 (2021).","journal-title":"Bioinformatics"},{"key":"739_CR14","doi-asserted-by":"publisher","first-page":"3778","DOI":"10.1093\/bioinformatics\/btac413","volume":"38","author":"R Wertenbroek","year":"2022","unstructured":"Wertenbroek, R., Rubinacci, S., Xenarios, I., Thoma, Y. & Delaneau, O. XSI\u2014a genotype compression tool for compressive genomics in large biobanks. Bioinformatics 38, 3778\u20133784 (2022).","journal-title":"Bioinformatics"},{"key":"739_CR15","doi-asserted-by":"publisher","unstructured":"Rivas, M. A. & Chang, C. Efficient storage and regression computation for population-scale genome sequencing studies. Preprint at bioRxiv https:\/\/doi.org\/10.1101\/2024.04.11.589062 (2024).","DOI":"10.1101\/2024.04.11.589062"},{"key":"739_CR16","doi-asserted-by":"publisher","first-page":"1266","DOI":"10.1093\/bioinformatics\/btu014","volume":"30","author":"R Durbin","year":"2014","unstructured":"Durbin, R. Efficient haplotype matching and storage using the positional Burrows\u2013Wheeler transform (PBWT). Bioinformatics 30, 1266\u20131272 (2014).","journal-title":"Bioinformatics"},{"key":"739_CR17","doi-asserted-by":"crossref","unstructured":"Wu, K., Otoo, EJ. & Shoshani, A. A performance comparison of bitmap indexes. In Proc. of the Tenth International Conference on Information and Knowledge Management 559\u2013561 (ACM, 2001).","DOI":"10.1145\/502585.502689"},{"key":"739_CR18","doi-asserted-by":"publisher","unstructured":"Collet, Y. & Kucherawy, M. RFC8878: zstandard compression and the \u2018application\/Zstd\u2019 media type. RFC Editor https:\/\/doi.org\/10.17487\/RFC8878 (2021).","DOI":"10.17487\/RFC8878"},{"key":"739_CR19","doi-asserted-by":"publisher","first-page":"428","DOI":"10.1038\/s41576-020-0233-0","volume":"21","author":"P Kapli","year":"2020","unstructured":"Kapli, P., Yang, Z. & Telford, M. J. Phylogenetic tree building in the genomic age. Nat. Rev. Genet. 21, 428\u2013444 (2020).","journal-title":"Nat. Rev. Genet."},{"key":"739_CR20","doi-asserted-by":"publisher","first-page":"279","DOI":"10.1126\/science.155.3760.279","volume":"155","author":"WM Fitch","year":"1967","unstructured":"Fitch, W. M. & Margoliash, E. Construction of phylogenetic trees. Science 155, 279\u2013284 (1967).","journal-title":"Science"},{"key":"739_CR21","doi-asserted-by":"publisher","first-page":"809","DOI":"10.1038\/s41588-021-00862-7","volume":"53","author":"Y Turakhia","year":"2021","unstructured":"Turakhia, Y. et al. Ultrafast Sample placement on Existing tRees (UShER) enables real-time phylogenetics for the SARS-CoV-2 pandemic. Nat. Genet. 53, 809\u2013816 (2021).","journal-title":"Nat. Genet."},{"key":"739_CR22","doi-asserted-by":"publisher","first-page":"254","DOI":"10.1093\/molbev\/msj030","volume":"23","author":"DH Huson","year":"2006","unstructured":"Huson, D. H. & Bryant, D. Application of phylogenetic networks in evolutionary studies. Mol. Biol. Evol. 23, 254\u2013267 (2006).","journal-title":"Mol. Biol. Evol."},{"key":"739_CR23","doi-asserted-by":"publisher","first-page":"iyac044","DOI":"10.1093\/genetics\/iyac044","volume":"221","author":"YC Brandt","year":"2022","unstructured":"Brandt, Y. C., Wei, X. D., Deng, Y., Vaughn, A. H. & Nielsen, R. Evaluation of methods for estimating coalescence times using ancestral recombination graphs. Genetics 221, iyac044 (2022).","journal-title":"Genetics"},{"key":"739_CR24","doi-asserted-by":"publisher","first-page":"evae005","DOI":"10.1093\/gbe\/evae005","volume":"16","author":"DYC Brandt","year":"2024","unstructured":"Brandt, D. Y. C., Huber, C. D., Chiang, C. W. K. & Ortega-Del Vecchyo, D. The promise of inferring the past using the ancestral recombination graph. Genome Biol. Evol. 16, evae005 (2024).","journal-title":"Genome Biol. Evol."},{"key":"739_CR25","doi-asserted-by":"publisher","first-page":"e1011110","DOI":"10.1371\/journal.pgen.1011110","volume":"20","author":"AL Lewanski","year":"2024","unstructured":"Lewanski, A. L., Grundler, M. C. & Bradburd, G. S. The era of the ARG: an introduction to ancestral recombination graphs and their significance in empirical evolutionary genomics. PLoS Genet. 20, e1011110 (2024).","journal-title":"PLoS Genet."},{"key":"739_CR26","doi-asserted-by":"publisher","first-page":"iyae100","DOI":"10.1093\/genetics\/iyae100","volume":"228","author":"Y Wong","year":"2024","unstructured":"Wong, Y. et al. A general and efficient representation of ancestral recombination graphs. Genetics 228, iyae100 (2024).","journal-title":"Genetics"},{"key":"739_CR27","doi-asserted-by":"publisher","first-page":"183","DOI":"10.1016\/0040-5809(83)90013-8","volume":"23","author":"RR Hudson","year":"1983","unstructured":"Hudson, R. R. Properties of a neutral allele model with intragenic recombination. Theor. Popul. Biol. 23, 183\u2013201 (1983).","journal-title":"Theor. Popul. Biol."},{"key":"739_CR28","doi-asserted-by":"publisher","first-page":"119","DOI":"10.1016\/0040-5809(84)90027-3","volume":"26","author":"S Tavar\u00e9","year":"1984","unstructured":"Tavar\u00e9, S. Line-of-descent and genealogical processes, and their applications in population genetics models. Theor. Popul. Biol. 26, 119\u2013164 (1984).","journal-title":"Theor. Popul. Biol."},{"key":"739_CR29","doi-asserted-by":"publisher","first-page":"768","DOI":"10.1038\/s41588-023-01379-x","volume":"55","author":"BC Zhang","year":"2023","unstructured":"Zhang, B. C., Biddanda, A., Gunnarsson, \u00c1. F., Cooper, F. & Palamara, P. F. Biobank-scale inference of ancestral recombination graphs enables genealogical analysis of complex traits. Nat. Genet. 55, 768\u2013776 (2023).","journal-title":"Nat. Genet."},{"key":"739_CR30","doi-asserted-by":"publisher","first-page":"e1004342","DOI":"10.1371\/journal.pgen.1004342","volume":"10","author":"MD Rasmussen","year":"2014","unstructured":"Rasmussen, M. D., Hubisz, M. J., Gronau, I. & Siepel, A. Genome-wide inference of ancestral recombination graphs. PLoS Genet. 10, e1004342 (2014).","journal-title":"PLoS Genet."},{"key":"739_CR31","doi-asserted-by":"publisher","first-page":"1321","DOI":"10.1038\/s41588-019-0484-x","volume":"51","author":"L Speidel","year":"2019","unstructured":"Speidel, L., Forest, M., Shi, S. & Myers, S. R. A method for genome-wide genealogy estimation for thousands of samples. Nat. Genet. 51, 1321\u20131329 (2019).","journal-title":"Nat. Genet."},{"key":"739_CR32","doi-asserted-by":"publisher","first-page":"1330","DOI":"10.1038\/s41588-019-0483-y","volume":"51","author":"J Kelleher","year":"2019","unstructured":"Kelleher, J. et al. Inferring whole-genome histories in large population datasets. Nat. Genet. 51, 1330\u20131338 (2019).","journal-title":"Nat. Genet."},{"key":"739_CR33","doi-asserted-by":"publisher","first-page":"909","DOI":"10.1038\/nbt0704-909","volume":"22","author":"SR Eddy","year":"2004","unstructured":"Eddy, S. R. What is dynamic programming? Nat. Biotechnol. 22, 909\u2013910 (2004).","journal-title":"Nat. Biotechnol."},{"key":"739_CR34","doi-asserted-by":"publisher","first-page":"37","DOI":"10.1097\/00001648-199901000-00008","volume":"10","author":"S Greenland","year":"1999","unstructured":"Greenland, S., Pearl, J. & Robins, J. M. Causal diagrams for epidemiologic research. Epidemiology 10, 37\u201348 (1999).","journal-title":"Epidemiology"},{"key":"739_CR35","doi-asserted-by":"publisher","first-page":"e1004842","DOI":"10.1371\/journal.pcbi.1004842","volume":"12","author":"J Kelleher","year":"2016","unstructured":"Kelleher, J., Etheridge, A. M. & McVean, G. Efficient coalescent simulation and genealogical analysis for large sample sizes. PLoS Comput. Biol. 12, e1004842 (2016).","journal-title":"PLoS Comput. Biol."},{"key":"739_CR36","doi-asserted-by":"publisher","DOI":"10.1093\/genetics\/iyab229","volume":"220","author":"F Baumdicker","year":"2022","unstructured":"Baumdicker, F. et al. Efficient ancestry and mutation simulation with msprime 1.0. Genetics 220, iyab229 (2022).","journal-title":"Genetics"},{"key":"739_CR37","doi-asserted-by":"publisher","first-page":"665","DOI":"10.1093\/bioinformatics\/16.8.665","volume":"16","author":"R Giegerich","year":"2000","unstructured":"Giegerich, R. A systematic approach to dynamic programming in bioinformatics. Bioinformatics 16, 665\u2013677 (2000).","journal-title":"Bioinformatics"},{"key":"739_CR38","doi-asserted-by":"publisher","first-page":"779","DOI":"10.1534\/genetics.120.303253","volume":"215","author":"P Ralph","year":"2020","unstructured":"Ralph, P., Thornton, K. & Kelleher, J. Efficiently summarizing relationships in large samples: a general duality between statistics of genealogies and genomes. Genetics 215, 779\u2013797 (2020).","journal-title":"Genetics"},{"key":"739_CR39","unstructured":"Cormen, T. H., Leiserson, C. E., Rivest, R. L. & Stein, C. Introduction to Algorithms (MIT Press, 2022)."},{"key":"739_CR40","doi-asserted-by":"publisher","first-page":"1168","DOI":"10.1093\/bioinformatics\/bts086","volume":"28","author":"V Stei\u00df","year":"2012","unstructured":"Stei\u00df, V., Letschert, T., Sch\u00e4fer, H. & Pahl, R. PERMORY-MPI: a program for high-speed parallel permutation testing in genome-wide association studies. Bioinformatics 28, 1168\u20131169 (2012).","journal-title":"Bioinformatics"},{"key":"739_CR41","doi-asserted-by":"publisher","first-page":"7","DOI":"10.1186\/s13742-015-0047-8","volume":"4","author":"CC Chang","year":"2015","unstructured":"Chang, C. C. et al. Second-generation PLINK: rising to the challenge of larger and richer datasets. GigaSci 4, 7 (2015).","journal-title":"GigaSci"},{"key":"739_CR42","unstructured":"Purcell, S. & Chang, C. PLINK [1.90b626]. https:\/\/www.cog-genomics.org\/plink\/1.9 (2022)."},{"key":"739_CR43","doi-asserted-by":"publisher","first-page":"e1006581","DOI":"10.1371\/journal.pcbi.1006581","volume":"14","author":"J Kelleher","year":"2018","unstructured":"Kelleher, J., Thornton, K. R., Ashander, J. & Ralph, P. L. Efficient pedigree recording for fast population genetics simulation. PLoS Comput. Biol. 14, e1006581 (2018).","journal-title":"PLoS Comput. Biol."},{"key":"739_CR44","doi-asserted-by":"publisher","first-page":"5","DOI":"10.1016\/j.ajhg.2017.06.005","volume":"101","author":"PM Visscher","year":"2017","unstructured":"Visscher, P. M. et al.10 years of GWAS discovery: biology, function and translation. Am. J. Hum. Genet. 101, 5\u201322 (2017).","journal-title":"Am. J. Hum. Genet."},{"key":"739_CR45","doi-asserted-by":"publisher","first-page":"179","DOI":"10.1016\/j.ajhg.2022.12.011","volume":"110","author":"A Abdellaoui","year":"2023","unstructured":"Abdellaoui, A., Yengo, L., Verweij, K. J. H. & Visscher, P. M. 15 years of GWAS discovery: realizing the promise. Am. J. Hum. Genet. 110, 179\u2013194 (2023).","journal-title":"Am. J. Hum. Genet."},{"key":"739_CR46","doi-asserted-by":"publisher","first-page":"627","DOI":"10.1038\/nbt.2241","volume":"30","author":"P-R Loh","year":"2012","unstructured":"Loh, P.-R., Baym, M. & Berger, B. Compressive genomics. Nat. Biotechnol. 30, 627\u2013630 (2012).","journal-title":"Nat. Biotechnol."},{"key":"739_CR47","doi-asserted-by":"crossref","unstructured":"Furnas, G. W. & Zacks, J. Multitrees: enriching and reusing hierarchical structure. In Proc. SIGCHI conference on Human factors in Computing Systems Celebrating Interdependence 330\u2013336 (ACM, 1994).","DOI":"10.1145\/191666.191778"},{"key":"739_CR48","unstructured":"Wakeley, J. Coalescent Theory: An Introduction (Roberts & Co, 2009)."},{"key":"739_CR49","doi-asserted-by":"publisher","first-page":"203","DOI":"10.2307\/2408186","volume":"37","author":"RR Hudson","year":"1983","unstructured":"Hudson, R. R. Testing the constant-rate neutral allele model with protein sequence data. Evolution 37, 203\u2013217 (1983).","journal-title":"Evolution"},{"key":"739_CR50","doi-asserted-by":"publisher","first-page":"291","DOI":"10.1016\/j.ygeno.2007.05.011","volume":"90","author":"IW Saunders","year":"2007","unstructured":"Saunders, I. W., Brohede, J. & Hannan, G. N. Estimating genotyping error rates from Mendelian errors in SNP array genotypes and their impact on inference. Genomics 90, 291\u2013296 (2007).","journal-title":"Genomics"},{"key":"739_CR51","doi-asserted-by":"publisher","first-page":"847","DOI":"10.1016\/j.ajhg.2009.11.004","volume":"85","author":"BL Browning","year":"2009","unstructured":"Browning, B. L. & Yu, Z. Simultaneous genotype calling and haplotype phasing improves genotype accuracy and reduces false-positive associations for genome-wide association studies. Am. J. Hum. Genet. 85, 847\u2013861 (2009).","journal-title":"Am. J. Hum. Genet."},{"key":"739_CR52","doi-asserted-by":"publisher","first-page":"732","DOI":"10.1038\/s41586-022-04965-x","volume":"607","author":"BV Halldorsson","year":"2022","unstructured":"Halldorsson, B. V. et al. The sequences of 150,119 genomes in the UK Biobank. Nature 607, 732\u2013740 (2022).","journal-title":"Nature"},{"key":"739_CR53","first-page":"1","volume":"7","author":"RR Hudson","year":"1990","unstructured":"Hudson, R. R. Gene genealogies and the coalescent process. Oxf. Surv. Evol. Biol. 7, 1\u201344 (1990).","journal-title":"Oxf. Surv. Evol. Biol."},{"key":"739_CR54","doi-asserted-by":"publisher","first-page":"479","DOI":"10.1089\/cmb.1996.3.479","volume":"3","author":"RC Griffiths","year":"1996","unstructured":"Griffiths, R. C. & Marjoram, P. Ancestral inference from samples of DNA sequences with recombination. J. Comput. Biol. 3, 479\u2013502 (1996).","journal-title":"J. Comput. Biol."},{"key":"739_CR55","doi-asserted-by":"crossref","unstructured":"Griffiths, R. C. & Marjoram, P. An ancestral recombination graph. Prog. Popul. Genet. Hum. Evol. 257\u2013270 (1997).","DOI":"10.1007\/978-1-4757-2609-1_16"},{"key":"739_CR56","doi-asserted-by":"publisher","first-page":"477","DOI":"10.1038\/nrg2361","volume":"9","author":"M Slatkin","year":"2008","unstructured":"Slatkin, M. Linkage disequilibrium\u2014understanding the evolutionary past and mapping the medical future. Nat. Rev. Genet. 9, 477\u2013485 (2008).","journal-title":"Nat. Rev. Genet."},{"key":"739_CR57","doi-asserted-by":"publisher","first-page":"1494","DOI":"10.1038\/s41588-023-01487-8","volume":"55","author":"P Salehi Nowbandegani","year":"2023","unstructured":"Salehi Nowbandegani, P. et al. Extremely sparse models of linkage disequilibrium in ancestrally diverse association studies. Nat. Genet. 55, 1494\u20131502 (2023).","journal-title":"Nat. Genet."},{"key":"739_CR58","doi-asserted-by":"publisher","first-page":"703","DOI":"10.1038\/nrg3054","volume":"12","author":"SR Browning","year":"2011","unstructured":"Browning, S. R. & Browning, B. L. Haplotype phasing: existing methods and new developments. Nat. Rev. Genet. 12, 703\u2013714 (2011).","journal-title":"Nat. Rev. Genet."},{"key":"739_CR59","doi-asserted-by":"publisher","first-page":"1709","DOI":"10.1093\/bib\/bby044","volume":"20","author":"E Geza","year":"2019","unstructured":"Geza, E. et al. A comprehensive survey of models for dissecting local ancestry deconvolution in human genome. Brief. Bioinform. 20, 1709\u20131724 (2019).","journal-title":"Brief. Bioinform."},{"key":"739_CR60","doi-asserted-by":"publisher","first-page":"1097","DOI":"10.1038\/s41588-021-00870-7","volume":"53","author":"J Mbatchou","year":"2021","unstructured":"Mbatchou, J. et al. Computationally efficient whole-genome regression for quantitative and binary traits. Nat. Genet. 53, 1097\u20131103 (2021).","journal-title":"Nat. Genet."},{"key":"739_CR61","unstructured":"Gray, AG., Moore, AW., Nichol RC., Connolly, AJ., Genovese, C. & Wasserman, L. Multi-Tree Methods for Statistics on Very Large Datasets in Astronomy. In Twenty Years of ADASS: A Retrospective of the First Twenty Years of the Astronomical Data Analysis Software and Systems Conference Series (eds F. Ochsenbein et al.) 314 (Astronomical Society of the Pacific, 2014)."},{"key":"739_CR62","unstructured":"Waggener, W. N. Pulse Code Modulation Techniques: With Applications in Communications and Data Recording (Van Nostrand Reinhold, 1995)."},{"key":"739_CR63","doi-asserted-by":"publisher","first-page":"315","DOI":"10.1016\/j.ygeno.2010.03.001","volume":"95","author":"JR Miller","year":"2010","unstructured":"Miller, J. R., Koren, S. & Sutton, G. Assembly algorithms for next-generation sequencing data. Genomics 95, 315\u2013327 (2010).","journal-title":"Genomics"},{"key":"739_CR64","doi-asserted-by":"publisher","first-page":"422","DOI":"10.1145\/362686.362692","volume":"13","author":"BH Bloom","year":"1970","unstructured":"Bloom, B. H. Space\/time trade-offs in hash coding with allowable errors. Commun. ACM 13, 422\u2013426 (1970).","journal-title":"Commun. ACM"},{"key":"739_CR65","doi-asserted-by":"publisher","first-page":"230","DOI":"10.1145\/362003.362025","volume":"16","author":"WA Burkhard","year":"1973","unstructured":"Burkhard, W. A. & Keller, R. M. Some approaches to best-match file searching. Commun. ACM 16, 230\u2013236 (1973).","journal-title":"Commun. ACM"},{"key":"739_CR66","doi-asserted-by":"publisher","first-page":"289","DOI":"10.1137\/1026055","volume":"26","author":"IS Duff","year":"1984","unstructured":"Duff, I. S. Computer solution of large sparse positive definite systems (Alan George and Joseph W. Liu). SIAM Rev. 26, 289\u2013291 (1984).","journal-title":"SIAM Rev."},{"key":"739_CR67","doi-asserted-by":"crossref","unstructured":"Bulu\u00e7, A., Fineman, J. T., Frigo, M., Gilbert, J. R. & Leiserson, C. E. Parallel sparse matrix-vector and matrix-transpose-vector multiplication using compressed sparse blocks. In Proc. Twenty-first Annual Symposium on Parallelism in Algorithms and Architectures 233\u2013244 (ACM, 2009).","DOI":"10.1145\/1583991.1584053"},{"key":"739_CR68","doi-asserted-by":"crossref","unstructured":"Brandes, U., Eiglsperger, M., Herman, I., Himsolt, M. & Marshall, M. S. in Graph Drawing (eds Mutzel, P. et al.) Vol. 2265, 501\u2013512 (Springer, 2002).","DOI":"10.1007\/3-540-45848-4_59"},{"key":"739_CR69","doi-asserted-by":"publisher","first-page":"68","DOI":"10.1038\/nature15393","volume":"526","author":"The 1000 Genomes Project Consortium.","year":"2015","unstructured":"The 1000 Genomes Project Consortium. A global reference for human genetic variation. Nature 526, 68\u201374 (2015).","journal-title":"Nature"},{"key":"739_CR70","doi-asserted-by":"publisher","first-page":"1297","DOI":"10.1101\/gr.107524.110","volume":"20","author":"A McKenna","year":"2010","unstructured":"McKenna, A. et al. The Genome Analysis Toolkit: a MapReduce framework for analyzing next-generation DNA sequencing data. Genome Res. 20, 1297\u20131303 (2010).","journal-title":"Genome Res."},{"key":"739_CR71","doi-asserted-by":"publisher","first-page":"1654","DOI":"10.1038\/ng.3964","volume":"49","author":"HP Eggertsson","year":"2017","unstructured":"Eggertsson, H. P. et al. Graphtyper enables population-scale genotyping using pangenome graphs. Nat. Genet. 49, 1654\u20131660 (2017).","journal-title":"Nat. Genet."},{"key":"739_CR72","unstructured":"Ribeiro, D., Hofmeister, R., Rubinacci, S. & Delaneau, O. Phasing of the UK Biobank whole genome sequencing data interim release of 200,031 samples (2023)."},{"key":"739_CR73","unstructured":"GNU Scientific Library Reference Manual: For GSL Version 1.12. (Network Theory, 2009)."},{"key":"739_CR74","doi-asserted-by":"publisher","first-page":"76","DOI":"10.1016\/j.ajhg.2010.11.011","volume":"88","author":"J Yang","year":"2011","unstructured":"Yang, J., Lee, S. H., Goddard, M. E. & Visscher, P. M. GCTA: a tool for genome-wide complex trait analysis. Am. J. Hum. Genet. 88, 76\u201382 (2011).","journal-title":"Am. J. Hum. Genet."},{"key":"739_CR75","doi-asserted-by":"publisher","first-page":"1867","DOI":"10.1093\/bioinformatics\/btx057","volume":"33","author":"BS Pedersen","year":"2017","unstructured":"Pedersen, B. S. & Quinlan, A. R. cyvcf2: fast, flexible variant analysis with Python. Bioinformatics 33, 1867\u20131869 (2017).","journal-title":"Bioinformatics"},{"key":"739_CR76","doi-asserted-by":"publisher","first-page":"27","DOI":"10.2307\/3213548","volume":"19","author":"JFC Kingman","year":"1982","unstructured":"Kingman, J. F. C. On the genealogy of large populations. J. Appl. Probab. 19, 27\u201343 (1982).","journal-title":"J. Appl. Probab."},{"key":"739_CR77","doi-asserted-by":"publisher","first-page":"235","DOI":"10.1016\/0304-4149(82)90011-4","volume":"13","author":"JFC Kingman","year":"1982","unstructured":"Kingman, J. F. C. The coalescent. Stoch. Process. Their Appl. 13, 235\u2013248 (1982).","journal-title":"Stoch. Process. Their Appl."},{"key":"739_CR78","doi-asserted-by":"publisher","unstructured":"Zhan, SH., Ignatieva, A., Wong, Y., et al. Towards pandemic-scale ancestral recombination graphs of SARS-CoV-2. Preprint at bioRxiv https:\/\/doi.org\/10.1101\/2023.06.08.544212 (2023).","DOI":"10.1101\/2023.06.08.544212"},{"key":"739_CR79","doi-asserted-by":"publisher","unstructured":"GISAID (GISAID); https:\/\/doi.org\/10.55876\/gis8.230329cd (2023).","DOI":"10.55876\/gis8.230329cd"},{"key":"739_CR80","doi-asserted-by":"publisher","unstructured":"DeHaas, D. & Pan, Z. aprilweilab\/grgl: GRG paper version. Zenodo https:\/\/doi.org\/10.5281\/zenodo.14002478 (2024).","DOI":"10.5281\/zenodo.14002478"}],"container-title":["Nature Computational Science"],"original-title":[],"language":"en","link":[{"URL":"https:\/\/www.nature.com\/articles\/s43588-024-00739-9.pdf","content-type":"application\/pdf","content-version":"vor","intended-application":"text-mining"},{"URL":"https:\/\/www.nature.com\/articles\/s43588-024-00739-9","content-type":"text\/html","content-version":"vor","intended-application":"text-mining"},{"URL":"https:\/\/www.nature.com\/articles\/s43588-024-00739-9.pdf","content-type":"application\/pdf","content-version":"vor","intended-application":"similarity-checking"}],"deposited":{"date-parts":[[2025,2,25]],"date-time":"2025-02-25T18:02:20Z","timestamp":1740506540000},"score":1,"resource":{"primary":{"URL":"https:\/\/www.nature.com\/articles\/s43588-024-00739-9"}},"subtitle":[],"short-title":[],"issued":{"date-parts":[[2024,12,5]]},"references-count":80,"journal-issue":{"issue":"2","published-online":{"date-parts":[[2025,2]]}},"alternative-id":["739"],"URL":"https:\/\/doi.org\/10.1038\/s43588-024-00739-9","relation":{"has-preprint":[{"id-type":"doi","id":"10.1101\/2024.04.23.590800","asserted-by":"object"}]},"ISSN":["2662-8457"],"issn-type":[{"value":"2662-8457","type":"electronic"}],"subject":[],"published":{"date-parts":[[2024,12,5]]},"assertion":[{"value":"8 May 2024","order":1,"name":"received","label":"Received","group":{"name":"ArticleHistory","label":"Article History"}},{"value":"6 November 2024","order":2,"name":"accepted","label":"Accepted","group":{"name":"ArticleHistory","label":"Article History"}},{"value":"5 December 2024","order":3,"name":"first_online","label":"First Online","group":{"name":"ArticleHistory","label":"Article History"}},{"value":"The authors declare no competing interests.","order":1,"name":"Ethics","group":{"name":"EthicsHeading","label":"Competing interests"}}]}}