{"status":"ok","message-type":"work","message-version":"1.0.0","message":{"indexed":{"date-parts":[[2026,3,26]],"date-time":"2026-03-26T01:12:30Z","timestamp":1774487550516,"version":"3.50.1"},"reference-count":25,"publisher":"Oxford University Press (OUP)","issue":"1","license":[{"start":{"date-parts":[[2024,1,4]],"date-time":"2024-01-04T00:00:00Z","timestamp":1704326400000},"content-version":"vor","delay-in-days":3,"URL":"https:\/\/creativecommons.org\/licenses\/by\/4.0\/"}],"funder":[{"DOI":"10.13039\/100000002","name":"National Institutes of Health","doi-asserted-by":"publisher","award":["R00MH117165"],"award-info":[{"award-number":["R00MH117165"]}],"id":[{"id":"10.13039\/100000002","id-type":"DOI","asserted-by":"publisher"}]},{"DOI":"10.13039\/100000002","name":"National Institutes of Health","doi-asserted-by":"publisher","award":["R01MH126933"],"award-info":[{"award-number":["R01MH126933"]}],"id":[{"id":"10.13039\/100000002","id-type":"DOI","asserted-by":"publisher"}]},{"DOI":"10.13039\/100000893","name":"Simons Foundation","doi-asserted-by":"publisher","award":["#734069"],"award-info":[{"award-number":["#734069"]}],"id":[{"id":"10.13039\/100000893","id-type":"DOI","asserted-by":"publisher"}]}],"content-domain":{"domain":[],"crossmark-restriction":false},"short-container-title":[],"published-print":{"date-parts":[[2024,1,2]]},"abstract":"<jats:title>Abstract<\/jats:title>\n               <jats:sec>\n                  <jats:title>Motivation<\/jats:title>\n                  <jats:p>de novo variants (DNVs) are variants that are present in offspring but not in their parents. DNVs are both important for examining mutation rates as well as in the identification of disease-related variation. While efforts have been made to call DNVs, calling of DNVs is still challenging from parent\u2013child sequenced trio data. We developed Hare And Tortoise (HAT) as an automated DNV detection workflow for highly accurate short-read and long-read sequencing data. Reliable detection of DNVs is important for human genomics and HAT addresses this need.<\/jats:p>\n               <\/jats:sec>\n               <jats:sec>\n                  <jats:title>Results<\/jats:title>\n                  <jats:p>HAT is a computational workflow that begins with aligned read data (i.e. CRAM or BAM) from a parent\u2013child sequenced trio and outputs DNVs. HAT detects high-quality DNVs from Illumina short-read whole-exome sequencing, Illumina short-read whole-genome sequencing, and highly accurate PacBio HiFi long-read whole-genome sequencing data. The quality of these DNVs is high based on a series of quality metrics including number of DNVs per individual, percent of DNVs at CpG sites, and percent of DNVs phased to the paternal chromosome of origin.<\/jats:p>\n               <\/jats:sec>\n               <jats:sec>\n                  <jats:title>Availability and implementation<\/jats:title>\n                  <jats:p>https:\/\/github.com\/TNTurnerLab\/HAT<\/jats:p>\n               <\/jats:sec>","DOI":"10.1093\/bioinformatics\/btad775","type":"journal-article","created":{"date-parts":[[2024,1,2]],"date-time":"2024-01-02T13:48:48Z","timestamp":1704203328000},"source":"Crossref","is-referenced-by-count":10,"title":["HAT: <i>de novo<\/i> variant calling for highly accurate short-read and long-read sequencing data"],"prefix":"10.1093","volume":"40","author":[{"given":"Jeffrey K","family":"Ng","sequence":"first","affiliation":[{"name":"Department of Genetics, Washington University School of Medicine , St Louis, MO 63110, USA"}]},{"ORCID":"https:\/\/orcid.org\/0000-0001-8246-6477","authenticated-orcid":false,"given":"Tychele N","family":"Turner","sequence":"additional","affiliation":[{"name":"Department of Genetics, Washington University School of Medicine , St Louis, MO 63110, USA"}]}],"member":"286","published-online":{"date-parts":[[2024,1,4]]},"reference":[{"key":"2024011010212342300_btad775-B1","doi-asserted-by":"crossref","first-page":"966","DOI":"10.1038\/nmeth.3505","article-title":"SpeedSeq: ultra-fast personal genome analysis and interpretation","volume":"12","author":"Chiang","year":"2015","journal-title":"Nat Methods"},{"key":"2024011010212342300_btad775-B20","doi-asserted-by":"crossref","first-page":"488","DOI":"10.1016\/j.neuron.2018.01.015","article-title":"SPARK: a US cohort of 50,000 families to accelerate autism research","volume":"97","author":"Feliciano","year":"2018","journal-title":"Neuron"},{"key":"2024011010212342300_btad775-B2","doi-asserted-by":"crossref","first-page":"e10","DOI":"10.5808\/GI.2020.18.1.e10","article-title":"Accelerating next generation sequencing data analysis: an evaluation of optimized best practices for Genome Analysis Toolkit algorithms","volume":"18","author":"Franke","year":"2020","journal-title":"Genomics Inform"},{"key":"2024011010212342300_btad775-B3","doi-asserted-by":"crossref","first-page":"216","DOI":"10.1038\/nature13908","article-title":"The contribution of de novo coding mutations to autism spectrum disorder","volume":"515","author":"Iossifov","year":"2014","journal-title":"Nature"},{"key":"2024011010212342300_btad775-B4","author":"Kolesnikov","year":"2021"},{"key":"2024011010212342300_btad775-B5","doi-asserted-by":"crossref","first-page":"471","DOI":"10.1038\/nature11396","article-title":"Rate of de novo mutations and the importance of father's age to disease risk","volume":"488","author":"Kong","year":"2012","journal-title":"Nature"},{"key":"2024011010212342300_btad775-B6","doi-asserted-by":"crossref","first-page":"2520","DOI":"10.1093\/bioinformatics\/bts480","article-title":"Snakemake\u2014a scalable bioinformatics workflow engine","volume":"28","author":"Koster","year":"2012","journal-title":"Bioinformatics"},{"key":"2024011010212342300_btad775-B7","doi-asserted-by":"crossref","first-page":"555","DOI":"10.1038\/s41587-019-0054-x","article-title":"Best practices for benchmarking germline small-variant calls in human genomes","volume":"37","author":"Krusche","year":"2019","journal-title":"Nat Biotechnol"},{"key":"2024011010212342300_btad775-B8","doi-asserted-by":"crossref","first-page":"2078","DOI":"10.1093\/bioinformatics\/btp352","article-title":"The sequence alignment\/map format and SAMtools","volume":"25","author":"Li","year":"2009","journal-title":"Bioinformatics"},{"key":"2024011010212342300_btad775-B9","doi-asserted-by":"crossref","first-page":"3640","DOI":"10.1093\/bioinformatics\/btab225","article-title":"Customized de novo mutation detection for any variant calling pipeline: synthDNM","volume":"37","author":"Lian","year":"2021","journal-title":"Bioinformatics"},{"key":"2024011010212342300_btad775-B10","doi-asserted-by":"crossref","first-page":"1297","DOI":"10.1101\/gr.107524.110","article-title":"The Genome Analysis Toolkit: a MapReduce framework for analyzing next-generation DNA sequencing data","volume":"20","author":"McKenna","year":"2010","journal-title":"Genome Res"},{"key":"2024011010212342300_btad775-B11","first-page":"2071","article-title":"Germline mosaicism of a missense variant in KCNC2 in a multiplex family with autism and epilepsy characterized by long-read sequencing","volume":"188","author":"Mehinovic","year":"2022"},{"key":"2024011010212342300_btad775-B12","first-page":"2","article-title":"Docker: lightweight linux containers for consistent development and deployment","volume":"239","author":"Merkel","year":"2014","journal-title":"Linux J"},{"key":"2024011010212342300_btad775-B13","doi-asserted-by":"crossref","first-page":"1431","DOI":"10.1016\/j.cell.2012.11.019","article-title":"Whole-genome sequencing in autism identifies hot spots for de novo germline mutation","volume":"151","author":"Michaelson","year":"2012","journal-title":"Cell"},{"key":"2024011010212342300_btad775-B14","doi-asserted-by":"crossref","first-page":"1979","DOI":"10.1002\/humu.24455","article-title":"de novo variant calling identifies cancer mutation signatures in the 1000 Genomes Project","volume":"43","author":"Ng","year":"2022","journal-title":"Hum Mutat"},{"key":"2024011010212342300_btad775-B15","doi-asserted-by":"crossref","first-page":"631","DOI":"10.1016\/j.ajhg.2022.02.014","article-title":"Familial long-read sequencing increases yield of de novo mutations","volume":"109","author":"Noyes","year":"2022","journal-title":"Am J Hum Genet"},{"key":"2024011010212342300_btad775-B16","doi-asserted-by":"crossref","first-page":"983","DOI":"10.1038\/nbt.4235","article-title":"A universal SNP and small-indel variant caller using deep neural networks","volume":"36","author":"Poplin","year":"2018","journal-title":"Nat Biotechnol"},{"key":"2024011010212342300_btad775-B17","first-page":"201178","author":"Poplin","year":"2018"},{"key":"2024011010212342300_btad775-B18","first-page":"100081","article-title":"From karyotypes to precision genomics in 9p deletion and duplication syndromes","volume":"3","author":"Sams","year":"2022","journal-title":"HGG Adv"},{"key":"2024011010212342300_btad775-B19","doi-asserted-by":"crossref","first-page":"47","DOI":"10.1146\/annurev-genom-031714-125740","article-title":"Determinants of mutation rate variation in the human germline","volume":"15","author":"S\u00e9gurel","year":"2014","journal-title":"Annu Rev Genomics Hum Genet"},{"key":"2024011010212342300_btad775-B21","doi-asserted-by":"crossref","first-page":"lqab019","DOI":"10.1093\/nargab\/lqab019","article-title":"Sequencing error profiles of Illumina sequencing instruments","volume":"3","author":"Stoler","year":"2021","journal-title":"NAR Genom Bioinform"},{"key":"2024011010212342300_btad775-B22","doi-asserted-by":"crossref","first-page":"710","DOI":"10.1016\/j.cell.2017.08.047","article-title":"Genomic patterns of de novo mutation in simplex autism","volume":"171","author":"Turner","year":"2017","journal-title":"Cell"},{"key":"2024011010212342300_btad775-B23","doi-asserted-by":"crossref","first-page":"1375","DOI":"10.1093\/bioinformatics\/btu839","article-title":"A Bayesian framework for de novo mutation calling in parents-offspring trios","volume":"31","author":"Wei","year":"2014","journal-title":"Bioinformatics"},{"key":"2024011010212342300_btad775-B24","doi-asserted-by":"crossref","first-page":"1155","DOI":"10.1038\/s41587-019-0217-9","article-title":"Accurate circular consensus long-read sequencing improves variant detection and assembly of a human genome","volume":"37","author":"Wenger","year":"2019","journal-title":"Nat Biotechnol"},{"key":"2024011010212342300_btad775-B25","author":"Yun","year":"2020"}],"container-title":["Bioinformatics"],"original-title":[],"language":"en","link":[{"URL":"https:\/\/academic.oup.com\/bioinformatics\/advance-article-pdf\/doi\/10.1093\/bioinformatics\/btad775\/55024474\/btad775.pdf","content-type":"application\/pdf","content-version":"am","intended-application":"syndication"},{"URL":"https:\/\/academic.oup.com\/bioinformatics\/article-pdf\/40\/1\/btad775\/55265022\/btad775.pdf","content-type":"application\/pdf","content-version":"vor","intended-application":"syndication"},{"URL":"https:\/\/academic.oup.com\/bioinformatics\/article-pdf\/40\/1\/btad775\/55265022\/btad775.pdf","content-type":"unspecified","content-version":"vor","intended-application":"similarity-checking"}],"deposited":{"date-parts":[[2024,1,10]],"date-time":"2024-01-10T10:21:45Z","timestamp":1704882105000},"score":1,"resource":{"primary":{"URL":"https:\/\/academic.oup.com\/bioinformatics\/article\/doi\/10.1093\/bioinformatics\/btad775\/7510834"}},"subtitle":[],"editor":[{"given":"Alfonso","family":"Valencia","sequence":"additional","affiliation":[]}],"short-title":[],"issued":{"date-parts":[[2024,1,1]]},"references-count":25,"journal-issue":{"issue":"1","published-print":{"date-parts":[[2024,1,2]]}},"URL":"https:\/\/doi.org\/10.1093\/bioinformatics\/btad775","relation":{},"ISSN":["1367-4803","1367-4811"],"issn-type":[{"value":"1367-4803","type":"print"},{"value":"1367-4811","type":"electronic"}],"subject":[],"published-other":{"date-parts":[[2024,1,1]]},"published":{"date-parts":[[2024,1,1]]},"article-number":"btad775"}}